/* Subroutines used for MIPS code generation.
   Copyright (C) 1989-2014 Free Software Foundation, Inc.
   Contributed by A. Lichnewsky, lich@inria.inria.fr.
   Changes by Michael Meissner, meissner@osf.org.
   64-bit r4000 support by Ian Lance Taylor, ian@cygnus.com, and
   Brendan Eich, brendan@microunity.com.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3, or (at your option)
any later version.

GCC is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "rtl.h"
#include "regs.h"
#include "hard-reg-set.h"
#include "insn-config.h"
#include "conditions.h"
#include "insn-attr.h"
#include "recog.h"
#include "output.h"
#include "tree.h"
#include "varasm.h"
#include "stringpool.h"
#include "stor-layout.h"
#include "calls.h"
#include "function.h"
#include "expr.h"
#include "optabs.h"
#include "libfuncs.h"
#include "flags.h"
#include "reload.h"
#include "tm_p.h"
#include "ggc.h"
#include "gstab.h"
#include "hash-table.h"
#include "debug.h"
#include "target.h"
#include "target-def.h"
#include "common/common-target.h"
#include "langhooks.h"
#include "sched-int.h"
#include "vec.h"
#include "basic-block.h"
#include "tree-ssa-alias.h"
#include "internal-fn.h"
#include "gimple-fold.h"
#include "tree-eh.h"
#include "gimple-expr.h"
#include "is-a.h"
#include "gimple.h"
#include "gimplify.h"
#include "bitmap.h"
#include "diagnostic.h"
#include "target-globals.h"
#include "opts.h"
#include "tree-pass.h"
#include "context.h"
#include "cgraph.h"
#include "builtins.h"

/* True if X is an UNSPEC wrapper around a SYMBOL_REF or LABEL_REF.  */
#define UNSPEC_ADDRESS_P(X)                                     \
  (GET_CODE (X) == UNSPEC                                       \
   && XINT (X, 1) >= UNSPEC_ADDRESS_FIRST                       \
   && XINT (X, 1) < UNSPEC_ADDRESS_FIRST + NUM_SYMBOL_TYPES)

/* Extract the symbol or label from UNSPEC wrapper X.  */
#define UNSPEC_ADDRESS(X) \
  XVECEXP (X, 0, 0)

/* Extract the symbol type from UNSPEC wrapper X.  */
#define UNSPEC_ADDRESS_TYPE(X) \
  ((enum mips_symbol_type) (XINT (X, 1) - UNSPEC_ADDRESS_FIRST))

/* The maximum distance between the top of the stack frame and the
   value $sp has when we save and restore registers.

   The value for normal-mode code must be a SMALL_OPERAND and must
   preserve the maximum stack alignment.  We therefore use a value
   of 0x7ff0 in this case.

   microMIPS LWM and SWM support 12-bit offsets (from -0x800 to 0x7ff),
   so we use a maximum of 0x7f0 for TARGET_MICROMIPS.

   MIPS16e SAVE and RESTORE instructions can adjust the stack pointer by
   up to 0x7f8 bytes and can usually save or restore all the registers
   that we need to save or restore.  (Note that we can only use these
   instructions for o32, for which the stack alignment is 8 bytes.)

   We use a maximum gap of 0x100 or 0x400 for MIPS16 code when SAVE and
   RESTORE are not available.  We can then use unextended instructions
   to save and restore registers, and to allocate and deallocate the top
   part of the frame.  */
#define MIPS_MAX_FIRST_STACK_STEP                                       \
  (!TARGET_COMPRESSION ? 0x7ff0                                         \
   : TARGET_MICROMIPS || GENERATE_MIPS16E_SAVE_RESTORE ? 0x7f8         \
   : TARGET_64BIT ? 0x100 : 0x400)

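/* A minimal illustrative check, disabled from the build, of why 0x7ff0 is
   the normal-mode limit above: it is the largest multiple of the maximum
   16-byte stack alignment that is still a SMALL_OPERAND.  The function
   name is local to this sketch.  */
#if 0
static void
mips_max_first_stack_step_sketch (void)
{
  const int small_operand_max = 0x7fff;  /* Largest signed 16-bit offset.  */
  const int max_stack_alignment = 16;

  gcc_assert (0x7ff0 % max_stack_alignment == 0);
  gcc_assert ((small_operand_max & -max_stack_alignment) == 0x7ff0);
}
#endif
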
/* True if INSN is a mips.md pattern or asm statement.  */
/* ??? This test exists throughout the compiler, perhaps it should be
   moved to rtl.h.  */
#define USEFUL_INSN_P(INSN)                                             \
  (NONDEBUG_INSN_P (INSN)                                               \
   && GET_CODE (PATTERN (INSN)) != USE                                  \
   && GET_CODE (PATTERN (INSN)) != CLOBBER)

/* If INSN is a delayed branch sequence, return the first instruction
   in the sequence, otherwise return INSN itself.  */
#define SEQ_BEGIN(INSN)                                                 \
  (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE               \
   ? as_a <rtx_insn *> (XVECEXP (PATTERN (INSN), 0, 0))                 \
   : (INSN))

/* Likewise for the last instruction in a delayed branch sequence.  */
#define SEQ_END(INSN)                                                   \
  (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE               \
   ? as_a <rtx_insn *> (XVECEXP (PATTERN (INSN),                        \
                                 0,                                     \
                                 XVECLEN (PATTERN (INSN), 0) - 1))      \
   : (INSN))

/* Execute the following loop body with SUBINSN set to each instruction
   between SEQ_BEGIN (INSN) and SEQ_END (INSN) inclusive.  */
#define FOR_EACH_SUBINSN(SUBINSN, INSN)                                 \
  for ((SUBINSN) = SEQ_BEGIN (INSN);                                    \
       (SUBINSN) != NEXT_INSN (SEQ_END (INSN));                         \
       (SUBINSN) = NEXT_INSN (SUBINSN))

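/* An illustrative, build-disabled example of the iterator above: visit
   every instruction in INSN, looking through any delayed-branch SEQUENCE,
   and skip USEs, CLOBBERs and debug insns.  This mirrors how the macro is
   used later in this file; the function name is hypothetical.  */
#if 0
static void
mips_visit_subinsns_sketch (rtx_insn *insn)
{
  rtx_insn *subinsn;

  FOR_EACH_SUBINSN (subinsn, insn)
    if (USEFUL_INSN_P (subinsn))
      {
        /* Process SUBINSN here.  */
      }
}
#endif
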
/* True if bit BIT is set in VALUE.  */
#define BITSET_P(VALUE, BIT) (((VALUE) & (1 << (BIT))) != 0)

/* Return the opcode for a ptr_mode load of the form:

       l[wd] DEST, OFFSET(BASE).  */
#define MIPS_LOAD_PTR(DEST, OFFSET, BASE)       \
  (((ptr_mode == DImode ? 0x37 : 0x23) << 26)   \
   | ((BASE) << 21)                             \
   | ((DEST) << 16)                             \
   | (OFFSET))

/* Return the opcode to move register SRC into register DEST.  */
#define MIPS_MOVE(DEST, SRC)            \
  ((TARGET_64BIT ? 0x2d : 0x21)         \
   | ((DEST) << 11)                     \
   | ((SRC) << 21))

/* Return the opcode for:

       lui DEST, VALUE.  */
#define MIPS_LUI(DEST, VALUE) \
  ((0xf << 26) | ((DEST) << 16) | (VALUE))

/* Return the opcode to jump to register DEST.  */
#define MIPS_JR(DEST) \
  (((DEST) << 21) | 0x8)

/* Return the opcode for:

       bal . + (1 + OFFSET) * 4.  */
#define MIPS_BAL(OFFSET) \
  ((0x1 << 26) | (0x11 << 16) | (OFFSET))

/* Return the usual opcode for a nop.  */
#define MIPS_NOP 0

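/* Worked examples, illustrative only, of the encodings built by the macros
   above, using standard MIPS register numbers:

     MIPS_MOVE (2, 4)     == 0x00801021  (addu $2,$4,$0, on 32-bit targets)
     MIPS_LUI (1, 0x1234) == 0x3c011234  (lui $1,0x1234)
     MIPS_JR (31)         == 0x03e00008  (jr $31)

   The build-disabled assertions below just restate that arithmetic for the
   two target-independent macros.  */
#if 0
static void
mips_opcode_sketch (void)
{
  gcc_assert (MIPS_LUI (1, 0x1234) == 0x3c011234);
  gcc_assert (MIPS_JR (31) == 0x03e00008);
}
#endif
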
/* Classifies an address.

   ADDRESS_REG
       A natural register + offset address.  The register satisfies
       mips_valid_base_register_p and the offset is a const_arith_operand.

   ADDRESS_LO_SUM
       A LO_SUM rtx.  The first operand is a valid base register and
       the second operand is a symbolic address.

   ADDRESS_CONST_INT
       A signed 16-bit constant address.

   ADDRESS_SYMBOLIC
       A constant symbolic address.  */
enum mips_address_type {
  ADDRESS_REG,
  ADDRESS_LO_SUM,
  ADDRESS_CONST_INT,
  ADDRESS_SYMBOLIC
};

/* Macros to create an enumeration identifier for a function prototype.  */
#define MIPS_FTYPE_NAME1(A, B) MIPS_##A##_FTYPE_##B
#define MIPS_FTYPE_NAME2(A, B, C) MIPS_##A##_FTYPE_##B##_##C
#define MIPS_FTYPE_NAME3(A, B, C, D) MIPS_##A##_FTYPE_##B##_##C##_##D
#define MIPS_FTYPE_NAME4(A, B, C, D, E) MIPS_##A##_FTYPE_##B##_##C##_##D##_##E

/* Classifies the prototype of a built-in function.  */
enum mips_function_type {
#define DEF_MIPS_FTYPE(NARGS, LIST) MIPS_FTYPE_NAME##NARGS LIST,
#include "config/mips/mips-ftypes.def"
#undef DEF_MIPS_FTYPE
  MIPS_MAX_FTYPE_MAX
};

/* Specifies how a built-in function should be converted into rtl.  */
enum mips_builtin_type {
  /* The function corresponds directly to an .md pattern.  The return
     value is mapped to operand 0 and the arguments are mapped to
     operands 1 and above.  */
  MIPS_BUILTIN_DIRECT,

  /* The function corresponds directly to an .md pattern.  There is no return
     value and the arguments are mapped to operands 0 and above.  */
  MIPS_BUILTIN_DIRECT_NO_TARGET,

  /* The function corresponds to a comparison instruction followed by
     a mips_cond_move_tf_ps pattern.  The first two arguments are the
     values to compare and the second two arguments are the vector
     operands for the movt.ps or movf.ps instruction (in assembly order).  */
  MIPS_BUILTIN_MOVF,
  MIPS_BUILTIN_MOVT,

  /* The function corresponds to a V2SF comparison instruction.  Operand 0
     of this instruction is the result of the comparison, which has mode
     CCV2 or CCV4.  The function arguments are mapped to operands 1 and
     above.  The function's return value is an SImode boolean that is
     true under the following conditions:

     MIPS_BUILTIN_CMP_ANY: one of the registers is true
     MIPS_BUILTIN_CMP_ALL: all of the registers are true
     MIPS_BUILTIN_CMP_LOWER: the first register is true
     MIPS_BUILTIN_CMP_UPPER: the second register is true.  */
  MIPS_BUILTIN_CMP_ANY,
  MIPS_BUILTIN_CMP_ALL,
  MIPS_BUILTIN_CMP_UPPER,
  MIPS_BUILTIN_CMP_LOWER,

  /* As above, but the instruction only sets a single $fcc register.  */
  MIPS_BUILTIN_CMP_SINGLE,

  /* For generating bposge32 branch instructions in MIPS32 DSP ASE.  */
  MIPS_BUILTIN_BPOSGE32
};

/* Invoke MACRO (COND) for each C.cond.fmt condition.  */
#define MIPS_FP_CONDITIONS(MACRO) \
  MACRO (f),    \
  MACRO (un),   \
  MACRO (eq),   \
  MACRO (ueq),  \
  MACRO (olt),  \
  MACRO (ult),  \
  MACRO (ole),  \
  MACRO (ule),  \
  MACRO (sf),   \
  MACRO (ngle), \
  MACRO (seq),  \
  MACRO (ngl),  \
  MACRO (lt),   \
  MACRO (nge),  \
  MACRO (le),   \
  MACRO (ngt)

/* Enumerates the codes above as MIPS_FP_COND_<X>.  */
#define DECLARE_MIPS_COND(X) MIPS_FP_COND_ ## X
enum mips_fp_condition {
  MIPS_FP_CONDITIONS (DECLARE_MIPS_COND)
};
#undef DECLARE_MIPS_COND

/* Index X provides the string representation of MIPS_FP_COND_<X>.  */
#define STRINGIFY(X) #X
static const char *const mips_fp_conditions[] = {
  MIPS_FP_CONDITIONS (STRINGIFY)
};
#undef STRINGIFY

/* A class used to control a comdat-style stub that we output in each
   translation unit that needs it.  */
class mips_one_only_stub {
public:
  virtual ~mips_one_only_stub () {}

  /* Return the name of the stub.  */
  virtual const char *get_name () = 0;

  /* Output the body of the function to asm_out_file.  */
  virtual void output_body () = 0;
};

/* Tuning information that is automatically derived from other sources
   (such as the scheduler).  */
static struct {
  /* The architecture and tuning settings that this structure describes.  */
  enum processor arch;
  enum processor tune;

  /* True if this structure describes MIPS16 settings.  */
  bool mips16_p;

  /* True if the structure has been initialized.  */
  bool initialized_p;

  /* True if "MULT $0, $0" is preferable to "MTLO $0; MTHI $0"
     when optimizing for speed.  */
  bool fast_mult_zero_zero_p;
} mips_tuning_info;

/* Information about a function's frame layout.  */
struct GTY(()) mips_frame_info {
  /* The size of the frame in bytes.  */
  HOST_WIDE_INT total_size;

  /* The number of bytes allocated to variables.  */
  HOST_WIDE_INT var_size;

  /* The number of bytes allocated to outgoing function arguments.  */
  HOST_WIDE_INT args_size;

  /* The number of bytes allocated to the .cprestore slot, or 0 if there
     is no such slot.  */
  HOST_WIDE_INT cprestore_size;

  /* Bit X is set if the function saves or restores GPR X.  */
  unsigned int mask;

  /* Likewise FPR X.  */
  unsigned int fmask;

  /* Likewise doubleword accumulator X ($acX).  */
  unsigned int acc_mask;

  /* The number of GPRs, FPRs, doubleword accumulators and COP0
     registers saved.  */
  unsigned int num_gp;
  unsigned int num_fp;
  unsigned int num_acc;
  unsigned int num_cop0_regs;

  /* The offset of the topmost GPR, FPR, accumulator and COP0-register
     save slots from the top of the frame, or zero if no such slots are
     needed.  */
  HOST_WIDE_INT gp_save_offset;
  HOST_WIDE_INT fp_save_offset;
  HOST_WIDE_INT acc_save_offset;
  HOST_WIDE_INT cop0_save_offset;

  /* Likewise, but giving offsets from the bottom of the frame.  */
  HOST_WIDE_INT gp_sp_offset;
  HOST_WIDE_INT fp_sp_offset;
  HOST_WIDE_INT acc_sp_offset;
  HOST_WIDE_INT cop0_sp_offset;

  /* Similar, but the value passed to _mcount.  */
  HOST_WIDE_INT ra_fp_offset;

  /* The offset of arg_pointer_rtx from the bottom of the frame.  */
  HOST_WIDE_INT arg_pointer_offset;

  /* The offset of hard_frame_pointer_rtx from the bottom of the frame.  */
  HOST_WIDE_INT hard_frame_pointer_offset;
};

struct GTY(()) machine_function {
  /* The next floating-point condition-code register to allocate
     for ISA_HAS_8CC targets, relative to ST_REG_FIRST.  */
  unsigned int next_fcc;

  /* The register returned by mips16_gp_pseudo_reg; see there for details.  */
  rtx mips16_gp_pseudo_rtx;

  /* The number of extra stack bytes taken up by register varargs.
     This area is allocated by the callee at the very top of the frame.  */
  int varargs_size;

  /* The current frame information, calculated by mips_compute_frame_info.  */
  struct mips_frame_info frame;

  /* The register to use as the function's global pointer, or INVALID_REGNUM
     if the function doesn't need one.  */
  unsigned int global_pointer;

  /* How many instructions it takes to load a label into $AT, or 0 if
     this property hasn't yet been calculated.  */
  unsigned int load_label_num_insns;

  /* True if mips_adjust_insn_length should ignore an instruction's
     hazard attribute.  */
  bool ignore_hazard_length_p;

  /* True if the whole function is suitable for .set noreorder and
     .set nomacro.  */
  bool all_noreorder_p;

  /* True if the function has "inflexible" and "flexible" references
     to the global pointer.  See mips_cfun_has_inflexible_gp_ref_p
     and mips_cfun_has_flexible_gp_ref_p for details.  */
  bool has_inflexible_gp_insn_p;
  bool has_flexible_gp_insn_p;

  /* True if the function's prologue must load the global pointer
     value into pic_offset_table_rtx and store the same value in
     the function's cprestore slot (if any).  Even if this value
     is currently false, we may decide to set it to true later;
     see mips_must_initialize_gp_p () for details.  */
  bool must_initialize_gp_p;

  /* True if the current function must restore $gp after any potential
     clobber.  This value is only meaningful during the first post-epilogue
     split_insns pass; see mips_must_initialize_gp_p () for details.  */
  bool must_restore_gp_when_clobbered_p;

  /* True if this is an interrupt handler.  */
  bool interrupt_handler_p;

  /* True if this is an interrupt handler that uses shadow registers.  */
  bool use_shadow_register_set_p;

  /* True if this is an interrupt handler that should keep interrupts
     masked.  */
  bool keep_interrupts_masked_p;

  /* True if this is an interrupt handler that should use DERET
     instead of ERET.  */
  bool use_debug_exception_return_p;
};

/* Information about a single argument.  */
struct mips_arg_info {
  /* True if the argument is passed in a floating-point register, or
     would have been if we hadn't run out of registers.  */
  bool fpr_p;

  /* The number of words passed in registers, rounded up.  */
  unsigned int reg_words;

  /* For EABI, the offset of the first register from GP_ARG_FIRST or
     FP_ARG_FIRST.  For other ABIs, the offset of the first register from
     the start of the ABI's argument structure (see the CUMULATIVE_ARGS
     comment for details).

     The value is MAX_ARGS_IN_REGISTERS if the argument is passed entirely
     on the stack.  */
  unsigned int reg_offset;

  /* The number of words that must be passed on the stack, rounded up.  */
  unsigned int stack_words;

  /* The offset from the start of the stack overflow area of the argument's
     first stack word.  Only meaningful when STACK_WORDS is nonzero.  */
  unsigned int stack_offset;
};

/* Information about an address described by mips_address_type.

   ADDRESS_CONST_INT
       No fields are used.

   ADDRESS_REG
       REG is the base register and OFFSET is the constant offset.

   ADDRESS_LO_SUM
       REG and OFFSET are the operands to the LO_SUM and SYMBOL_TYPE
       is the type of symbol it references.

   ADDRESS_SYMBOLIC
       SYMBOL_TYPE is the type of symbol that the address references.  */
struct mips_address_info {
  enum mips_address_type type;
  rtx reg;
  rtx offset;
  enum mips_symbol_type symbol_type;
};

/* One stage in a constant building sequence.  These sequences have
   the form:

       A = VALUE[0]
       A = A CODE[1] VALUE[1]
       A = A CODE[2] VALUE[2]
       ...

   where A is an accumulator, each CODE[i] is a binary rtl operation
   and each VALUE[i] is a constant integer.  CODE[0] is undefined.  */
struct mips_integer_op {
  enum rtx_code code;
  unsigned HOST_WIDE_INT value;
};

/* The largest number of operations needed to load an integer constant.
   The worst accepted case for 64-bit constants is LUI,ORI,SLL,ORI,SLL,ORI.
   When the lowest bit is clear, we can try, but reject a sequence with
   an extra SLL at the end.  */
#define MIPS_MAX_INTEGER_OPS 7

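/* An illustrative sequence in the form described above: loading 0x12345678
   takes two operations, LUI followed by ORI.  The array name is
   hypothetical; mips_build_integer below fills in exactly this pair for
   that value.  */
#if 0
static const struct mips_integer_op sketch_0x12345678[] = {
  { UNKNOWN, 0x12340000 },      /* A = 0x12340000  (lui)  */
  { IOR, 0x5678 }               /* A = A | 0x5678  (ori)  */
};
#endif
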
/* Information about a MIPS16e SAVE or RESTORE instruction.  */
struct mips16e_save_restore_info {
  /* The number of argument registers saved by a SAVE instruction.
     0 for RESTORE instructions.  */
  unsigned int nargs;

  /* Bit X is set if the instruction saves or restores GPR X.  */
  unsigned int mask;

  /* The total number of bytes to allocate.  */
  HOST_WIDE_INT size;
};

/* Costs of various operations on the different architectures.  */

struct mips_rtx_cost_data
{
  unsigned short fp_add;
  unsigned short fp_mult_sf;
  unsigned short fp_mult_df;
  unsigned short fp_div_sf;
  unsigned short fp_div_df;
  unsigned short int_mult_si;
  unsigned short int_mult_di;
  unsigned short int_div_si;
  unsigned short int_div_di;
  unsigned short branch_cost;
  unsigned short memory_latency;
};

/* Global variables for machine-dependent things.  */

/* The -G setting, or the configuration's default small-data limit if
   no -G option is given.  */
static unsigned int mips_small_data_threshold;

/* The number of file directives written by mips_output_filename.  */
int num_source_filenames;

/* The name that appeared in the last .file directive written by
   mips_output_filename, or "" if mips_output_filename hasn't
   written anything yet.  */
const char *current_function_file = "";

/* Arrays that map GCC register numbers to debugger register numbers.  */
int mips_dbx_regno[FIRST_PSEUDO_REGISTER];
int mips_dwarf_regno[FIRST_PSEUDO_REGISTER];

/* Information about the current function's epilogue, used only while
   expanding it.  */
static struct {
  /* A list of queued REG_CFA_RESTORE notes.  */
  rtx cfa_restores;

  /* The CFA is currently defined as CFA_REG + CFA_OFFSET.  */
  rtx cfa_reg;
  HOST_WIDE_INT cfa_offset;

  /* The offset of the CFA from the stack pointer while restoring
     registers.  */
  HOST_WIDE_INT cfa_restore_sp_offset;
} mips_epilogue;

/* The nesting depth of the PRINT_OPERAND '%(', '%<' and '%[' constructs.  */
struct mips_asm_switch mips_noreorder = { "reorder", 0 };
struct mips_asm_switch mips_nomacro = { "macro", 0 };
struct mips_asm_switch mips_noat = { "at", 0 };

/* True if we're writing out a branch-likely instruction rather than a
   normal branch.  */
static bool mips_branch_likely;

/* The current instruction-set architecture.  */
enum processor mips_arch;
const struct mips_cpu_info *mips_arch_info;

/* The processor that we should tune the code for.  */
enum processor mips_tune;
const struct mips_cpu_info *mips_tune_info;

/* The ISA level associated with mips_arch.  */
int mips_isa;

/* The ISA revision level.  This is 0 for MIPS I to V and N for
   MIPS{32,64}rN.  */
int mips_isa_rev;

/* The architecture selected by -mipsN, or null if -mipsN wasn't used.  */
static const struct mips_cpu_info *mips_isa_option_info;

/* Which cost information to use.  */
static const struct mips_rtx_cost_data *mips_cost;

/* The ambient target flags, excluding MASK_MIPS16.  */
static int mips_base_target_flags;

/* The default compression mode.  */
unsigned int mips_base_compression_flags;

/* The ambient values of other global variables.  */
static int mips_base_schedule_insns; /* flag_schedule_insns */
static int mips_base_reorder_blocks_and_partition; /* flag_reorder... */
static int mips_base_move_loop_invariants; /* flag_move_loop_invariants */
static int mips_base_align_loops; /* align_loops */
static int mips_base_align_jumps; /* align_jumps */
static int mips_base_align_functions; /* align_functions */

/* Index [M][R] is true if register R is allowed to hold a value of mode M.  */
bool mips_hard_regno_mode_ok[(int) MAX_MACHINE_MODE][FIRST_PSEUDO_REGISTER];

/* Index C is true if character C is a valid PRINT_OPERAND punctuation
   character.  */
static bool mips_print_operand_punct[256];

static GTY (()) int mips_output_filename_first_time = 1;

/* mips_split_p[X] is true if symbols of type X can be split by
   mips_split_symbol.  */
bool mips_split_p[NUM_SYMBOL_TYPES];

/* mips_split_hi_p[X] is true if the high parts of symbols of type X
   can be split by mips_split_symbol.  */
bool mips_split_hi_p[NUM_SYMBOL_TYPES];

/* mips_use_pcrel_pool_p[X] is true if symbols of type X should be
   forced into a PC-relative constant pool.  */
bool mips_use_pcrel_pool_p[NUM_SYMBOL_TYPES];

/* mips_lo_relocs[X] is the relocation to use when a symbol of type X
   appears in a LO_SUM.  It can be null if such LO_SUMs aren't valid or
   if they are matched by a special .md file pattern.  */
const char *mips_lo_relocs[NUM_SYMBOL_TYPES];

/* Likewise for HIGHs.  */
const char *mips_hi_relocs[NUM_SYMBOL_TYPES];

/* Target state for MIPS16.  */
struct target_globals *mips16_globals;

/* Cached value of can_issue_more.  This is cached in mips_variable_issue hook
   and returned from mips_sched_reorder2.  */
static int cached_can_issue_more;

/* The stubs for various MIPS16 support functions, if used.  */
static mips_one_only_stub *mips16_rdhwr_stub;
static mips_one_only_stub *mips16_get_fcsr_stub;
static mips_one_only_stub *mips16_set_fcsr_stub;

/* Index R is the smallest register class that contains register R.  */
const enum reg_class mips_regno_to_class[FIRST_PSEUDO_REGISTER] = {
  LEA_REGS,        LEA_REGS,        M16_STORE_REGS,  V1_REG,
  M16_STORE_REGS,  M16_STORE_REGS,  M16_STORE_REGS,  M16_STORE_REGS,
  LEA_REGS,        LEA_REGS,        LEA_REGS,        LEA_REGS,
  LEA_REGS,        LEA_REGS,        LEA_REGS,        LEA_REGS,
  M16_REGS,        M16_STORE_REGS,  LEA_REGS,        LEA_REGS,
  LEA_REGS,        LEA_REGS,        LEA_REGS,        LEA_REGS,
  T_REG,           PIC_FN_ADDR_REG, LEA_REGS,        LEA_REGS,
  LEA_REGS,        M16_SP_REGS,     LEA_REGS,        LEA_REGS,

  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  FP_REGS,         FP_REGS,         FP_REGS,         FP_REGS,
  MD0_REG,         MD1_REG,         NO_REGS,         ST_REGS,
  ST_REGS,         ST_REGS,         ST_REGS,         ST_REGS,
  ST_REGS,         ST_REGS,         ST_REGS,         NO_REGS,
  NO_REGS,         FRAME_REGS,      FRAME_REGS,      NO_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP0_REGS,       COP0_REGS,       COP0_REGS,       COP0_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP2_REGS,       COP2_REGS,       COP2_REGS,       COP2_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  COP3_REGS,       COP3_REGS,       COP3_REGS,       COP3_REGS,
  DSP_ACC_REGS,    DSP_ACC_REGS,    DSP_ACC_REGS,    DSP_ACC_REGS,
  DSP_ACC_REGS,    DSP_ACC_REGS,    ALL_REGS,        ALL_REGS,
  ALL_REGS,        ALL_REGS,        ALL_REGS,        ALL_REGS
};

/* The value of TARGET_ATTRIBUTE_TABLE.  */
static const struct attribute_spec mips_attribute_table[] = {
  /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler,
       affects_type_identity } */
  { "long_call",     0, 0, false, true,  true,  NULL, false },
  { "far",           0, 0, false, true,  true,  NULL, false },
  { "near",          0, 0, false, true,  true,  NULL, false },
  /* We would really like to treat "mips16" and "nomips16" as type
     attributes, but GCC doesn't provide the hooks we need to support
     the right conversion rules.  As declaration attributes, they affect
     code generation but don't carry other semantics.  */
  { "mips16",        0, 0, true,  false, false, NULL, false },
  { "nomips16",      0, 0, true,  false, false, NULL, false },
  { "micromips",     0, 0, true,  false, false, NULL, false },
  { "nomicromips",   0, 0, true,  false, false, NULL, false },
  { "nocompression", 0, 0, true,  false, false, NULL, false },
  /* Allow functions to be specified as interrupt handlers.  */
  { "interrupt",                  0, 0, false, true,  true,  NULL, false },
  { "use_shadow_register_set",    0, 0, false, true,  true,  NULL, false },
  { "keep_interrupts_masked",     0, 0, false, true,  true,  NULL, false },
  { "use_debug_exception_return", 0, 0, false, true,  true,  NULL, false },
  { NULL,                         0, 0, false, false, false, NULL, false }
};
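
/* Illustrative, build-disabled examples of how user code selects the
   attributes defined above; the function names are hypothetical.  */
#if 0
void __attribute__ ((interrupt, use_shadow_register_set))
fast_irq_handler (void);

void __attribute__ ((interrupt, keep_interrupts_masked))
blocking_irq_handler (void);

int __attribute__ ((mips16)) compressed_helper (int);
int __attribute__ ((nomips16)) uncompressed_helper (int);
#endif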
\f
/* A table describing all the processors GCC knows about; see
   mips-cpus.def for details.  */
static const struct mips_cpu_info mips_cpu_info_table[] = {
#define MIPS_CPU(NAME, CPU, ISA, FLAGS) \
  { NAME, CPU, ISA, FLAGS },
#include "mips-cpus.def"
#undef MIPS_CPU
};

/* Default costs.  If these are used for a processor we should look
   up the actual costs.  */
#define DEFAULT_COSTS COSTS_N_INSNS (6),  /* fp_add */       \
                      COSTS_N_INSNS (7),  /* fp_mult_sf */   \
                      COSTS_N_INSNS (8),  /* fp_mult_df */   \
                      COSTS_N_INSNS (23), /* fp_div_sf */    \
                      COSTS_N_INSNS (36), /* fp_div_df */    \
                      COSTS_N_INSNS (10), /* int_mult_si */  \
                      COSTS_N_INSNS (10), /* int_mult_di */  \
                      COSTS_N_INSNS (69), /* int_div_si */   \
                      COSTS_N_INSNS (69), /* int_div_di */   \
                                       2, /* branch_cost */  \
                                       4  /* memory_latency */

/* Floating-point costs for processors without an FPU.  Just assume that
   all floating-point libcalls are very expensive.  */
#define SOFT_FP_COSTS COSTS_N_INSNS (256), /* fp_add */       \
                      COSTS_N_INSNS (256), /* fp_mult_sf */   \
                      COSTS_N_INSNS (256), /* fp_mult_df */   \
                      COSTS_N_INSNS (256), /* fp_div_sf */    \
                      COSTS_N_INSNS (256)  /* fp_div_df */

/* Costs to use when optimizing for size.  */
static const struct mips_rtx_cost_data mips_rtx_cost_optimize_size = {
  COSTS_N_INSNS (1),            /* fp_add */
  COSTS_N_INSNS (1),            /* fp_mult_sf */
  COSTS_N_INSNS (1),            /* fp_mult_df */
  COSTS_N_INSNS (1),            /* fp_div_sf */
  COSTS_N_INSNS (1),            /* fp_div_df */
  COSTS_N_INSNS (1),            /* int_mult_si */
  COSTS_N_INSNS (1),            /* int_mult_di */
  COSTS_N_INSNS (1),            /* int_div_si */
  COSTS_N_INSNS (1),            /* int_div_di */
  2,                            /* branch_cost */
  4                             /* memory_latency */
};

/* Costs to use when optimizing for speed, indexed by processor.  */
static const struct mips_rtx_cost_data
  mips_rtx_cost_data[NUM_PROCESSOR_VALUES] = {
  { /* R3000 */
    COSTS_N_INSNS (2),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (12),           /* fp_div_sf */
    COSTS_N_INSNS (19),           /* fp_div_df */
    COSTS_N_INSNS (12),           /* int_mult_si */
    COSTS_N_INSNS (12),           /* int_mult_di */
    COSTS_N_INSNS (35),           /* int_div_si */
    COSTS_N_INSNS (35),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 4KC */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (6),            /* int_mult_si */
    COSTS_N_INSNS (6),            /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (36),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 4KP */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (36),           /* int_mult_si */
    COSTS_N_INSNS (36),           /* int_mult_di */
    COSTS_N_INSNS (37),           /* int_div_si */
    COSTS_N_INSNS (37),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 5KC */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (11),           /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (68),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 5KF */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (11),           /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (68),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 20KC */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (7),            /* int_mult_di */
    COSTS_N_INSNS (42),           /* int_div_si */
    COSTS_N_INSNS (72),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 24KC */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 24KF2_1 */
    COSTS_N_INSNS (8),            /* fp_add */
    COSTS_N_INSNS (8),            /* fp_mult_sf */
    COSTS_N_INSNS (10),           /* fp_mult_df */
    COSTS_N_INSNS (34),           /* fp_div_sf */
    COSTS_N_INSNS (64),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 24KF1_1 */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 74KC */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 74KF2_1 */
    COSTS_N_INSNS (8),            /* fp_add */
    COSTS_N_INSNS (8),            /* fp_mult_sf */
    COSTS_N_INSNS (10),           /* fp_mult_df */
    COSTS_N_INSNS (34),           /* fp_div_sf */
    COSTS_N_INSNS (64),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 74KF1_1 */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* 74KF3_2 */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (6),            /* fp_mult_sf */
    COSTS_N_INSNS (7),            /* fp_mult_df */
    COSTS_N_INSNS (25),           /* fp_div_sf */
    COSTS_N_INSNS (48),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (41),           /* int_div_si */
    COSTS_N_INSNS (41),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* Loongson-2E */
    DEFAULT_COSTS
  },
  { /* Loongson-2F */
    DEFAULT_COSTS
  },
  { /* Loongson-3A */
    DEFAULT_COSTS
  },
  { /* M4k */
    DEFAULT_COSTS
  },
    /* Octeon */
  {
    SOFT_FP_COSTS,
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (72),           /* int_div_si */
    COSTS_N_INSNS (72),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
    /* Octeon II */
  {
    SOFT_FP_COSTS,
    COSTS_N_INSNS (6),            /* int_mult_si */
    COSTS_N_INSNS (6),            /* int_mult_di */
    COSTS_N_INSNS (18),           /* int_div_si */
    COSTS_N_INSNS (35),           /* int_div_di */
    4,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R3900 */
    COSTS_N_INSNS (2),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (12),           /* fp_div_sf */
    COSTS_N_INSNS (19),           /* fp_div_df */
    COSTS_N_INSNS (2),            /* int_mult_si */
    COSTS_N_INSNS (2),            /* int_mult_di */
    COSTS_N_INSNS (35),           /* int_div_si */
    COSTS_N_INSNS (35),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R6000 */
    COSTS_N_INSNS (3),            /* fp_add */
    COSTS_N_INSNS (5),            /* fp_mult_sf */
    COSTS_N_INSNS (6),            /* fp_mult_df */
    COSTS_N_INSNS (15),           /* fp_div_sf */
    COSTS_N_INSNS (16),           /* fp_div_df */
    COSTS_N_INSNS (17),           /* int_mult_si */
    COSTS_N_INSNS (17),           /* int_mult_di */
    COSTS_N_INSNS (38),           /* int_div_si */
    COSTS_N_INSNS (38),           /* int_div_di */
    2,                            /* branch_cost */
    6                             /* memory_latency */
  },
  { /* R4000 */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (7),            /* fp_mult_sf */
    COSTS_N_INSNS (8),            /* fp_mult_df */
    COSTS_N_INSNS (23),           /* fp_div_sf */
    COSTS_N_INSNS (36),           /* fp_div_df */
    COSTS_N_INSNS (10),           /* int_mult_si */
    COSTS_N_INSNS (10),           /* int_mult_di */
    COSTS_N_INSNS (69),           /* int_div_si */
    COSTS_N_INSNS (69),           /* int_div_di */
    2,                            /* branch_cost */
    6                             /* memory_latency */
  },
  { /* R4100 */
    DEFAULT_COSTS
  },
  { /* R4111 */
    DEFAULT_COSTS
  },
  { /* R4120 */
    DEFAULT_COSTS
  },
  { /* R4130 */
    /* The only costs that appear to be updated here are
       integer multiplication.  */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (6),            /* int_mult_di */
    COSTS_N_INSNS (69),           /* int_div_si */
    COSTS_N_INSNS (69),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R4300 */
    DEFAULT_COSTS
  },
  { /* R4600 */
    DEFAULT_COSTS
  },
  { /* R4650 */
    DEFAULT_COSTS
  },
  { /* R4700 */
    DEFAULT_COSTS
  },
  { /* R5000 */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (23),           /* fp_div_sf */
    COSTS_N_INSNS (36),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (36),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R5400 */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (5),            /* fp_mult_sf */
    COSTS_N_INSNS (6),            /* fp_mult_df */
    COSTS_N_INSNS (30),           /* fp_div_sf */
    COSTS_N_INSNS (59),           /* fp_div_df */
    COSTS_N_INSNS (3),            /* int_mult_si */
    COSTS_N_INSNS (4),            /* int_mult_di */
    COSTS_N_INSNS (42),           /* int_div_si */
    COSTS_N_INSNS (74),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R5500 */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (5),            /* fp_mult_sf */
    COSTS_N_INSNS (6),            /* fp_mult_df */
    COSTS_N_INSNS (30),           /* fp_div_sf */
    COSTS_N_INSNS (59),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (9),            /* int_mult_di */
    COSTS_N_INSNS (42),           /* int_div_si */
    COSTS_N_INSNS (74),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R5900 */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (256),          /* fp_mult_df */
    COSTS_N_INSNS (8),            /* fp_div_sf */
    COSTS_N_INSNS (256),          /* fp_div_df */
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (256),          /* int_mult_di */
    COSTS_N_INSNS (37),           /* int_div_si */
    COSTS_N_INSNS (256),          /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R7000 */
    /* The only costs that are changed here are
       integer multiplication.  */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (7),            /* fp_mult_sf */
    COSTS_N_INSNS (8),            /* fp_mult_df */
    COSTS_N_INSNS (23),           /* fp_div_sf */
    COSTS_N_INSNS (36),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (9),            /* int_mult_di */
    COSTS_N_INSNS (69),           /* int_div_si */
    COSTS_N_INSNS (69),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R8000 */
    DEFAULT_COSTS
  },
  { /* R9000 */
    /* The only costs that are changed here are
       integer multiplication.  */
    COSTS_N_INSNS (6),            /* fp_add */
    COSTS_N_INSNS (7),            /* fp_mult_sf */
    COSTS_N_INSNS (8),            /* fp_mult_df */
    COSTS_N_INSNS (23),           /* fp_div_sf */
    COSTS_N_INSNS (36),           /* fp_div_df */
    COSTS_N_INSNS (3),            /* int_mult_si */
    COSTS_N_INSNS (8),            /* int_mult_di */
    COSTS_N_INSNS (69),           /* int_div_si */
    COSTS_N_INSNS (69),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* R1x000 */
    COSTS_N_INSNS (2),            /* fp_add */
    COSTS_N_INSNS (2),            /* fp_mult_sf */
    COSTS_N_INSNS (2),            /* fp_mult_df */
    COSTS_N_INSNS (12),           /* fp_div_sf */
    COSTS_N_INSNS (19),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (9),            /* int_mult_di */
    COSTS_N_INSNS (34),           /* int_div_si */
    COSTS_N_INSNS (66),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* SB1 */
    /* These costs are the same as the SB-1A below.  */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (4),            /* fp_mult_df */
    COSTS_N_INSNS (24),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (3),            /* int_mult_si */
    COSTS_N_INSNS (4),            /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (68),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* SB1-A */
    /* These costs are the same as the SB-1 above.  */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (4),            /* fp_mult_df */
    COSTS_N_INSNS (24),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (3),            /* int_mult_si */
    COSTS_N_INSNS (4),            /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (68),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* SR71000 */
    DEFAULT_COSTS
  },
  { /* XLR */
    SOFT_FP_COSTS,
    COSTS_N_INSNS (8),            /* int_mult_si */
    COSTS_N_INSNS (8),            /* int_mult_di */
    COSTS_N_INSNS (72),           /* int_div_si */
    COSTS_N_INSNS (72),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* XLP */
    /* These costs are the same as 5KF above.  */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (4),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (32),           /* fp_div_df */
    COSTS_N_INSNS (4),            /* int_mult_si */
    COSTS_N_INSNS (11),           /* int_mult_di */
    COSTS_N_INSNS (36),           /* int_div_si */
    COSTS_N_INSNS (68),           /* int_div_di */
    1,                            /* branch_cost */
    4                             /* memory_latency */
  },
  { /* P5600 */
    COSTS_N_INSNS (4),            /* fp_add */
    COSTS_N_INSNS (5),            /* fp_mult_sf */
    COSTS_N_INSNS (5),            /* fp_mult_df */
    COSTS_N_INSNS (17),           /* fp_div_sf */
    COSTS_N_INSNS (17),           /* fp_div_df */
    COSTS_N_INSNS (5),            /* int_mult_si */
    COSTS_N_INSNS (5),            /* int_mult_di */
    COSTS_N_INSNS (8),            /* int_div_si */
    COSTS_N_INSNS (8),            /* int_div_di */
    2,                            /* branch_cost */
    10                            /* memory_latency */
  }
};
\f
static rtx mips_find_pic_call_symbol (rtx_insn *, rtx, bool);
static int mips_register_move_cost (enum machine_mode, reg_class_t,
                                    reg_class_t);
static unsigned int mips_function_arg_boundary (enum machine_mode, const_tree);
\f
/* This hash table keeps track of implicit "mips16" and "nomips16" attributes
   for -mflip-mips16.  It maps decl names onto a boolean mode setting.  */
struct GTY (()) mflip_mips16_entry {
  const char *name;
  bool mips16_p;
};
static GTY ((param_is (struct mflip_mips16_entry))) htab_t mflip_mips16_htab;

/* Hash table callbacks for mflip_mips16_htab.  */

static hashval_t
mflip_mips16_htab_hash (const void *entry)
{
  return htab_hash_string (((const struct mflip_mips16_entry *) entry)->name);
}

static int
mflip_mips16_htab_eq (const void *entry, const void *name)
{
  return strcmp (((const struct mflip_mips16_entry *) entry)->name,
                 (const char *) name) == 0;
}

/* True if -mflip-mips16 should next add an attribute for the default MIPS16
   mode, false if it should next add an attribute for the opposite mode.  */
static GTY(()) bool mips16_flipper;

/* DECL is a function that needs a default "mips16" or "nomips16" attribute
   for -mflip-mips16.  Return true if it should use "mips16" and false if
   it should use "nomips16".  */

static bool
mflip_mips16_use_mips16_p (tree decl)
{
  struct mflip_mips16_entry *entry;
  const char *name;
  hashval_t hash;
  void **slot;
  bool base_is_mips16 = (mips_base_compression_flags & MASK_MIPS16) != 0;

  /* Use the opposite of the command-line setting for anonymous decls.  */
  if (!DECL_NAME (decl))
    return !base_is_mips16;

  if (!mflip_mips16_htab)
    mflip_mips16_htab = htab_create_ggc (37, mflip_mips16_htab_hash,
                                         mflip_mips16_htab_eq, NULL);

  name = IDENTIFIER_POINTER (DECL_NAME (decl));
  hash = htab_hash_string (name);
  slot = htab_find_slot_with_hash (mflip_mips16_htab, name, hash, INSERT);
  entry = (struct mflip_mips16_entry *) *slot;
  if (!entry)
    {
      mips16_flipper = !mips16_flipper;
      entry = ggc_alloc<mflip_mips16_entry> ();
      entry->name = name;
      entry->mips16_p = mips16_flipper ? !base_is_mips16 : base_is_mips16;
      *slot = entry;
    }
  return entry->mips16_p;
}
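
/* Illustrative only: with -mflip-mips16 and a "nomips16" command-line
   default, the first distinct function name queried gets "mips16", the
   second "nomips16", and so on; repeated queries for the same name (for
   example a declaration followed by its definition) always get the same
   answer because the result is cached in mflip_mips16_htab.  The
   declarations below are hypothetical.  */
#if 0
int f (int);                    /* First name seen: "mips16".  */
int g (int);                    /* Second name seen: "nomips16".  */
int f (int x) { return x; }     /* Cached: "mips16" again.  */
#endif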
\f
/* Predicates to test for presence of "near" and "far"/"long_call"
   attributes on the given TYPE.  */

static bool
mips_near_type_p (const_tree type)
{
  return lookup_attribute ("near", TYPE_ATTRIBUTES (type)) != NULL;
}

static bool
mips_far_type_p (const_tree type)
{
  return (lookup_attribute ("long_call", TYPE_ATTRIBUTES (type)) != NULL
          || lookup_attribute ("far", TYPE_ATTRIBUTES (type)) != NULL);
}

/* Check if the interrupt attribute is set for a function.  */

static bool
mips_interrupt_type_p (tree type)
{
  return lookup_attribute ("interrupt", TYPE_ATTRIBUTES (type)) != NULL;
}

/* Check if the attribute to use shadow register set is set for a function.  */

static bool
mips_use_shadow_register_set_p (tree type)
{
  return lookup_attribute ("use_shadow_register_set",
                           TYPE_ATTRIBUTES (type)) != NULL;
}

/* Check if the attribute to keep interrupts masked is set for a function.  */

static bool
mips_keep_interrupts_masked_p (tree type)
{
  return lookup_attribute ("keep_interrupts_masked",
                           TYPE_ATTRIBUTES (type)) != NULL;
}

/* Check if the attribute to use debug exception return is set for
   a function.  */

static bool
mips_use_debug_exception_return_p (tree type)
{
  return lookup_attribute ("use_debug_exception_return",
                           TYPE_ATTRIBUTES (type)) != NULL;
}

/* Return the set of compression modes that are explicitly required
   by the attributes in ATTRIBUTES.  */

static unsigned int
mips_get_compress_on_flags (tree attributes)
{
  unsigned int flags = 0;

  if (lookup_attribute ("mips16", attributes) != NULL)
    flags |= MASK_MIPS16;

  if (lookup_attribute ("micromips", attributes) != NULL)
    flags |= MASK_MICROMIPS;

  return flags;
}

/* Return the set of compression modes that are explicitly forbidden
   by the attributes in ATTRIBUTES.  */

static unsigned int
mips_get_compress_off_flags (tree attributes)
{
  unsigned int flags = 0;

  if (lookup_attribute ("nocompression", attributes) != NULL)
    flags |= MASK_MIPS16 | MASK_MICROMIPS;

  if (lookup_attribute ("nomips16", attributes) != NULL)
    flags |= MASK_MIPS16;

  if (lookup_attribute ("nomicromips", attributes) != NULL)
    flags |= MASK_MICROMIPS;

  return flags;
}

/* Return the compression mode that should be used for function DECL.
   Return the ambient setting if DECL is null.  */

static unsigned int
mips_get_compress_mode (tree decl)
{
  unsigned int flags, force_on;

  flags = mips_base_compression_flags;
  if (decl)
    {
      /* Nested functions must use the same frame pointer as their
         parent and must therefore use the same ISA mode.  */
      tree parent = decl_function_context (decl);
      if (parent)
        decl = parent;
      force_on = mips_get_compress_on_flags (DECL_ATTRIBUTES (decl));
      if (force_on)
        return force_on;
      flags &= ~mips_get_compress_off_flags (DECL_ATTRIBUTES (decl));
    }
  return flags;
}
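
/* Illustrative, build-disabled declarations showing how the lookup above
   resolves attributes when the command line passes -mips16:  */
#if 0
void f (void);                     /* -> MASK_MIPS16 (ambient mode) */
void __attribute__ ((nomips16))
g (void);                          /* -> 0 (ambient mode masked off) */
void __attribute__ ((micromips))
h (void);                          /* -> MASK_MICROMIPS ("on" attributes
                                      take precedence) */
/* A function nested inside g would also return 0, because the lookup uses
   the attributes of its decl_function_context.  */
#endif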

/* Return the attribute name associated with MASK_MIPS16 and MASK_MICROMIPS
   flags FLAGS.  */

static const char *
mips_get_compress_on_name (unsigned int flags)
{
  if (flags == MASK_MIPS16)
    return "mips16";
  return "micromips";
}

/* Return the attribute name that forbids MASK_MIPS16 and MASK_MICROMIPS
   flags FLAGS.  */

static const char *
mips_get_compress_off_name (unsigned int flags)
{
  if (flags == MASK_MIPS16)
    return "nomips16";
  if (flags == MASK_MICROMIPS)
    return "nomicromips";
  return "nocompression";
}

/* Implement TARGET_COMP_TYPE_ATTRIBUTES.  */

static int
mips_comp_type_attributes (const_tree type1, const_tree type2)
{
  /* Disallow mixed near/far attributes.  */
  if (mips_far_type_p (type1) && mips_near_type_p (type2))
    return 0;
  if (mips_near_type_p (type1) && mips_far_type_p (type2))
    return 0;
  return 1;
}

/* Implement TARGET_INSERT_ATTRIBUTES.  */

static void
mips_insert_attributes (tree decl, tree *attributes)
{
  const char *name;
  unsigned int compression_flags, nocompression_flags;

  /* Check for "mips16" and "nomips16" attributes.  */
  compression_flags = mips_get_compress_on_flags (*attributes);
  nocompression_flags = mips_get_compress_off_flags (*attributes);

  if (TREE_CODE (decl) != FUNCTION_DECL)
    {
      if (nocompression_flags)
        error ("%qs attribute only applies to functions",
               mips_get_compress_off_name (nocompression_flags));

      if (compression_flags)
        error ("%qs attribute only applies to functions",
               mips_get_compress_on_name (compression_flags));
    }
  else
    {
      compression_flags |= mips_get_compress_on_flags (DECL_ATTRIBUTES (decl));
      nocompression_flags |=
        mips_get_compress_off_flags (DECL_ATTRIBUTES (decl));

      if (compression_flags && nocompression_flags)
        error ("%qE cannot have both %qs and %qs attributes",
               DECL_NAME (decl), mips_get_compress_on_name (compression_flags),
               mips_get_compress_off_name (nocompression_flags));

      if (compression_flags & MASK_MIPS16
          && compression_flags & MASK_MICROMIPS)
        error ("%qE cannot have both %qs and %qs attributes",
               DECL_NAME (decl), "mips16", "micromips");

      if (TARGET_FLIP_MIPS16
          && !DECL_ARTIFICIAL (decl)
          && compression_flags == 0
          && nocompression_flags == 0)
        {
          /* Implement -mflip-mips16.  If DECL has neither a "nomips16" nor a
             "mips16" attribute, arbitrarily pick one.  We must pick the same
             setting for duplicate declarations of a function.  */
          name = mflip_mips16_use_mips16_p (decl) ? "mips16" : "nomips16";
          *attributes = tree_cons (get_identifier (name), NULL, *attributes);
          name = "nomicromips";
          *attributes = tree_cons (get_identifier (name), NULL, *attributes);
        }
    }
}

/* Implement TARGET_MERGE_DECL_ATTRIBUTES.  */

static tree
mips_merge_decl_attributes (tree olddecl, tree newdecl)
{
  unsigned int diff;

  diff = (mips_get_compress_on_flags (DECL_ATTRIBUTES (olddecl))
          ^ mips_get_compress_on_flags (DECL_ATTRIBUTES (newdecl)));
  if (diff)
    error ("%qE redeclared with conflicting %qs attributes",
           DECL_NAME (newdecl), mips_get_compress_on_name (diff));

  diff = (mips_get_compress_off_flags (DECL_ATTRIBUTES (olddecl))
          ^ mips_get_compress_off_flags (DECL_ATTRIBUTES (newdecl)));
  if (diff)
    error ("%qE redeclared with conflicting %qs attributes",
           DECL_NAME (newdecl), mips_get_compress_off_name (diff));

  return merge_attributes (DECL_ATTRIBUTES (olddecl),
                           DECL_ATTRIBUTES (newdecl));
}

/* Implement TARGET_CAN_INLINE_P.  */

static bool
mips_can_inline_p (tree caller, tree callee)
{
  if (mips_get_compress_mode (callee) != mips_get_compress_mode (caller))
    return false;
  return default_target_can_inline_p (caller, callee);
}
\f
/* If X is a PLUS of a CONST_INT, return the two terms in *BASE_PTR
   and *OFFSET_PTR.  Return X in *BASE_PTR and 0 in *OFFSET_PTR otherwise.  */

static void
mips_split_plus (rtx x, rtx *base_ptr, HOST_WIDE_INT *offset_ptr)
{
  if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1)))
    {
      *base_ptr = XEXP (x, 0);
      *offset_ptr = INTVAL (XEXP (x, 1));
    }
  else
    {
      *base_ptr = x;
      *offset_ptr = 0;
    }
}
\f
static unsigned int mips_build_integer (struct mips_integer_op *,
                                        unsigned HOST_WIDE_INT);

/* A subroutine of mips_build_integer, with the same interface.
   Assume that the final action in the sequence should be a left shift.  */

static unsigned int
mips_build_shift (struct mips_integer_op *codes, HOST_WIDE_INT value)
{
  unsigned int i, shift;

  /* Shift VALUE right until its lowest bit is set.  Shift arithmetically
     since signed numbers are easier to load than unsigned ones.  */
  shift = 0;
  while ((value & 1) == 0)
    value /= 2, shift++;

  i = mips_build_integer (codes, value);
  codes[i].code = ASHIFT;
  codes[i].value = shift;
  return i + 1;
}

/* As for mips_build_shift, but assume that the final action will be
   an IOR or PLUS operation.  */

static unsigned int
mips_build_lower (struct mips_integer_op *codes, unsigned HOST_WIDE_INT value)
{
  unsigned HOST_WIDE_INT high;
  unsigned int i;

  high = value & ~(unsigned HOST_WIDE_INT) 0xffff;
  if (!LUI_OPERAND (high) && (value & 0x18000) == 0x18000)
    {
      /* The constant is too complex to load with a simple LUI/ORI pair,
         so we want to give the recursive call as many trailing zeros as
         possible.  In this case, we know bit 16 is set and that the
         low 16 bits form a negative number.  If we subtract that number
         from VALUE, we will clear at least the lowest 17 bits, maybe more.  */
      i = mips_build_integer (codes, CONST_HIGH_PART (value));
      codes[i].code = PLUS;
      codes[i].value = CONST_LOW_PART (value);
    }
  else
    {
      /* Either this is a simple LUI/ORI pair, or clearing the lowest 16
         bits gives a value with at least 17 trailing zeros.  */
      i = mips_build_integer (codes, high);
      codes[i].code = IOR;
      codes[i].value = value & 0xffff;
    }
  return i + 1;
}

/* Fill CODES with a sequence of rtl operations to load VALUE.
   Return the number of operations needed.  */

static unsigned int
mips_build_integer (struct mips_integer_op *codes,
                    unsigned HOST_WIDE_INT value)
{
  if (SMALL_OPERAND (value)
      || SMALL_OPERAND_UNSIGNED (value)
      || LUI_OPERAND (value))
    {
      /* The value can be loaded with a single instruction.  */
      codes[0].code = UNKNOWN;
      codes[0].value = value;
      return 1;
    }
  else if ((value & 1) != 0 || LUI_OPERAND (CONST_HIGH_PART (value)))
    {
      /* Either the constant is a simple LUI/ORI combination or its
         lowest bit is set.  We don't want to shift in this case.  */
      return mips_build_lower (codes, value);
    }
  else if ((value & 0xffff) == 0)
    {
      /* The constant will need at least three actions.  The lowest
         16 bits are clear, so the final action will be a shift.  */
      return mips_build_shift (codes, value);
    }
  else
    {
      /* The final action could be a shift, add or inclusive OR.
         Rather than use a complex condition to select the best
         approach, try both mips_build_shift and mips_build_lower
         and pick the one that gives the shortest sequence.
         Note that this case is only used once per constant.  */
      struct mips_integer_op alt_codes[MIPS_MAX_INTEGER_OPS];
      unsigned int cost, alt_cost;

      cost = mips_build_shift (codes, value);
      alt_cost = mips_build_lower (alt_codes, value);
      if (alt_cost < cost)
        {
          memcpy (codes, alt_codes, alt_cost * sizeof (codes[0]));
          cost = alt_cost;
        }
      return cost;
    }
}
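
/* A worked example, illustrative only, of the routine above.  For
   VALUE == 0x12345678, no single-instruction case applies, but
   LUI_OPERAND (CONST_HIGH_PART (value)) holds, so mips_build_lower
   produces the two-operation sequence

     codes[0] = { UNKNOWN, 0x12340000 }    lui  A,0x1234
     codes[1] = { IOR, 0x5678 }            ori  A,A,0x5678

   and the function returns 2.  The build-disabled check below restates
   this; the function name is hypothetical.  */
#if 0
static void
mips_build_integer_sketch (void)
{
  struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
  unsigned int n = mips_build_integer (codes, 0x12345678);

  gcc_assert (n == 2);
  gcc_assert (codes[0].value == 0x12340000);
  gcc_assert (codes[1].code == IOR && codes[1].value == 0x5678);
}
#endif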
\f
/* Implement TARGET_LEGITIMATE_CONSTANT_P.  */

static bool
mips_legitimate_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
{
  return mips_const_insns (x) > 0;
}
\f
/* Return a SYMBOL_REF for a MIPS16 function called NAME.  */

static rtx
mips16_stub_function (const char *name)
{
  rtx x;

  x = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (name));
  SYMBOL_REF_FLAGS (x) |= (SYMBOL_FLAG_EXTERNAL | SYMBOL_FLAG_FUNCTION);
  return x;
}

/* Return a legitimate call address for STUB, given that STUB is a MIPS16
   support function.  */

static rtx
mips16_stub_call_address (mips_one_only_stub *stub)
{
  rtx fn = mips16_stub_function (stub->get_name ());
  SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_LOCAL;
  if (!call_insn_operand (fn, VOIDmode))
    fn = force_reg (Pmode, fn);
  return fn;
}
\f
/* A stub for moving the thread pointer into TLS_GET_TP_REGNUM.  */

class mips16_rdhwr_one_only_stub : public mips_one_only_stub
{
  virtual const char *get_name ();
  virtual void output_body ();
};

const char *
mips16_rdhwr_one_only_stub::get_name ()
{
  return "__mips16_rdhwr";
}

void
mips16_rdhwr_one_only_stub::output_body ()
{
  fprintf (asm_out_file,
           "\t.set\tpush\n"
           "\t.set\tmips32r2\n"
           "\t.set\tnoreorder\n"
           "\trdhwr\t$3,$29\n"
           "\t.set\tpop\n"
           "\tj\t$31\n");
}

/* A stub for moving the FCSR into GET_FCSR_REGNUM.  */
class mips16_get_fcsr_one_only_stub : public mips_one_only_stub
{
  virtual const char *get_name ();
  virtual void output_body ();
};

const char *
mips16_get_fcsr_one_only_stub::get_name ()
{
  return "__mips16_get_fcsr";
}

void
mips16_get_fcsr_one_only_stub::output_body ()
{
  fprintf (asm_out_file,
           "\tcfc1\t%s,$31\n"
           "\tj\t$31\n", reg_names[GET_FCSR_REGNUM]);
}

/* A stub for moving SET_FCSR_REGNUM into the FCSR.  */
class mips16_set_fcsr_one_only_stub : public mips_one_only_stub
{
  virtual const char *get_name ();
  virtual void output_body ();
};

const char *
mips16_set_fcsr_one_only_stub::get_name ()
{
  return "__mips16_set_fcsr";
}

void
mips16_set_fcsr_one_only_stub::output_body ()
{
  fprintf (asm_out_file,
           "\tctc1\t%s,$31\n"
           "\tj\t$31\n", reg_names[SET_FCSR_REGNUM]);
}
\f
/* Return true if symbols of type TYPE require a GOT access.  */

static bool
mips_got_symbol_type_p (enum mips_symbol_type type)
{
  switch (type)
    {
    case SYMBOL_GOT_PAGE_OFST:
    case SYMBOL_GOT_DISP:
      return true;

    default:
      return false;
    }
}

/* Return true if X is a thread-local symbol.  */

static bool
mips_tls_symbol_p (rtx x)
{
  return GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_TLS_MODEL (x) != 0;
}

/* Return true if SYMBOL_REF X is associated with a global symbol
   (in the STB_GLOBAL sense).  */

static bool
mips_global_symbol_p (const_rtx x)
{
  const_tree decl = SYMBOL_REF_DECL (x);

  if (!decl)
    return !SYMBOL_REF_LOCAL_P (x) || SYMBOL_REF_EXTERNAL_P (x);

  /* Weakref symbols are not TREE_PUBLIC, but their targets are global
     or weak symbols.  Relocations in the object file will be against
     the target symbol, so it's that symbol's binding that matters here.  */
  return DECL_P (decl) && (TREE_PUBLIC (decl) || DECL_WEAK (decl));
}

/* Return true if function X is a libgcc MIPS16 stub function.  */

static bool
mips16_stub_function_p (const_rtx x)
{
  return (GET_CODE (x) == SYMBOL_REF
          && strncmp (XSTR (x, 0), "__mips16_", 9) == 0);
}

/* Return true if function X is a locally-defined and locally-binding
   MIPS16 function.  */

static bool
mips16_local_function_p (const_rtx x)
{
  return (GET_CODE (x) == SYMBOL_REF
          && SYMBOL_REF_LOCAL_P (x)
          && !SYMBOL_REF_EXTERNAL_P (x)
          && (mips_get_compress_mode (SYMBOL_REF_DECL (x)) & MASK_MIPS16));
}

/* Return true if SYMBOL_REF X binds locally.  */

static bool
mips_symbol_binds_local_p (const_rtx x)
{
  return (SYMBOL_REF_DECL (x)
          ? targetm.binds_local_p (SYMBOL_REF_DECL (x))
          : SYMBOL_REF_LOCAL_P (x));
}

/* Return true if rtx constants of mode MODE should be put into a small
   data section.  */

static bool
mips_rtx_constant_in_small_data_p (enum machine_mode mode)
{
  return (!TARGET_EMBEDDED_DATA
          && TARGET_LOCAL_SDATA
1809 && GET_MODE_SIZE (mode) <= mips_small_data_threshold);
1810 }
1811
1812 /* Return true if X should not be moved directly into register $25.
1813 We need this because many versions of GAS will treat "la $25,foo" as
1814 part of a call sequence and so allow a global "foo" to be lazily bound. */
1815
1816 bool
1817 mips_dangerous_for_la25_p (rtx x)
1818 {
1819 return (!TARGET_EXPLICIT_RELOCS
1820 && TARGET_USE_GOT
1821 && GET_CODE (x) == SYMBOL_REF
1822 && mips_global_symbol_p (x));
1823 }
1824
1825 /* Return true if calls to X might need $25 to be valid on entry. */
1826
1827 bool
1828 mips_use_pic_fn_addr_reg_p (const_rtx x)
1829 {
1830 if (!TARGET_USE_PIC_FN_ADDR_REG)
1831 return false;
1832
1833 /* MIPS16 stub functions are guaranteed not to use $25. */
1834 if (mips16_stub_function_p (x))
1835 return false;
1836
1837 if (GET_CODE (x) == SYMBOL_REF)
1838 {
1839 /* If PLTs and copy relocations are available, the static linker
1840 will make sure that $25 is valid on entry to the target function. */
1841 if (TARGET_ABICALLS_PIC0)
1842 return false;
1843
1844 /* Locally-defined functions use absolute accesses to set up
1845 the global pointer. */
1846 if (TARGET_ABSOLUTE_ABICALLS
1847 && mips_symbol_binds_local_p (x)
1848 && !SYMBOL_REF_EXTERNAL_P (x))
1849 return false;
1850 }
1851
1852 return true;
1853 }
1854
1855 /* Return the method that should be used to access SYMBOL_REF or
1856 LABEL_REF X in context CONTEXT. */
1857
1858 static enum mips_symbol_type
1859 mips_classify_symbol (const_rtx x, enum mips_symbol_context context)
1860 {
1861 if (TARGET_RTP_PIC)
1862 return SYMBOL_GOT_DISP;
1863
1864 if (GET_CODE (x) == LABEL_REF)
1865 {
1866 /* Only return SYMBOL_PC_RELATIVE if we are generating MIPS16
1867 code and if we know that the label is in the current function's
1868 text section. LABEL_REFs are used for jump tables as well as
1869 text labels, so we must check whether jump tables live in the
1870 text section. */
1871 if (TARGET_MIPS16_SHORT_JUMP_TABLES
1872 && !LABEL_REF_NONLOCAL_P (x))
1873 return SYMBOL_PC_RELATIVE;
1874
1875 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS)
1876 return SYMBOL_GOT_PAGE_OFST;
1877
1878 return SYMBOL_ABSOLUTE;
1879 }
1880
1881 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1882
1883 if (SYMBOL_REF_TLS_MODEL (x))
1884 return SYMBOL_TLS;
1885
1886 if (CONSTANT_POOL_ADDRESS_P (x))
1887 {
1888 if (TARGET_MIPS16_TEXT_LOADS)
1889 return SYMBOL_PC_RELATIVE;
1890
1891 if (TARGET_MIPS16_PCREL_LOADS && context == SYMBOL_CONTEXT_MEM)
1892 return SYMBOL_PC_RELATIVE;
1893
1894 if (mips_rtx_constant_in_small_data_p (get_pool_mode (x)))
1895 return SYMBOL_GP_RELATIVE;
1896 }
1897
1898 /* Do not use small-data accesses for weak symbols; they may end up
1899 being zero. */
1900 if (TARGET_GPOPT && SYMBOL_REF_SMALL_P (x) && !SYMBOL_REF_WEAK (x))
1901 return SYMBOL_GP_RELATIVE;
1902
1903 /* Don't use GOT accesses for locally-binding symbols when -mno-shared
1904 is in effect. */
1905 if (TARGET_ABICALLS_PIC2
1906 && !(TARGET_ABSOLUTE_ABICALLS && mips_symbol_binds_local_p (x)))
1907 {
1908 /* There are three cases to consider:
1909
1910 - o32 PIC (either with or without explicit relocs)
1911 - n32/n64 PIC without explicit relocs
1912 - n32/n64 PIC with explicit relocs
1913
1914 In the first case, both local and global accesses will use an
1915 R_MIPS_GOT16 relocation. We must correctly predict which of
1916 the two semantics (local or global) the assembler and linker
1917 will apply. The choice depends on the symbol's binding rather
1918 than its visibility.
1919
1920 In the second case, the assembler will not use R_MIPS_GOT16
1921 relocations, but it chooses between local and global accesses
1922 in the same way as for o32 PIC.
1923
1924 In the third case we have more freedom since both forms of
1925 access will work for any kind of symbol. However, there seems
1926 little point in doing things differently. */
1927 if (mips_global_symbol_p (x))
1928 return SYMBOL_GOT_DISP;
1929
1930 return SYMBOL_GOT_PAGE_OFST;
1931 }
1932
1933 return SYMBOL_ABSOLUTE;
1934 }
1935
1936 /* Classify the base of symbolic expression X, given that X appears in
1937 context CONTEXT. */
1938
1939 static enum mips_symbol_type
1940 mips_classify_symbolic_expression (rtx x, enum mips_symbol_context context)
1941 {
1942 rtx offset;
1943
1944 split_const (x, &x, &offset);
1945 if (UNSPEC_ADDRESS_P (x))
1946 return UNSPEC_ADDRESS_TYPE (x);
1947
1948 return mips_classify_symbol (x, context);
1949 }
1950
1951 /* Return true if OFFSET is within the range [0, ALIGN), where ALIGN
1952 is the alignment in bytes of SYMBOL_REF X. */
1953
1954 static bool
1955 mips_offset_within_alignment_p (rtx x, HOST_WIDE_INT offset)
1956 {
1957 HOST_WIDE_INT align;
1958
1959 align = SYMBOL_REF_DECL (x) ? DECL_ALIGN_UNIT (SYMBOL_REF_DECL (x)) : 1;
1960 return IN_RANGE (offset, 0, align - 1);
1961 }
1962
1963 /* Return true if X is a symbolic constant that can be used in context
1964 CONTEXT. If it is, store the type of the symbol in *SYMBOL_TYPE. */
1965
1966 bool
1967 mips_symbolic_constant_p (rtx x, enum mips_symbol_context context,
1968 enum mips_symbol_type *symbol_type)
1969 {
1970 rtx offset;
1971
1972 split_const (x, &x, &offset);
1973 if (UNSPEC_ADDRESS_P (x))
1974 {
1975 *symbol_type = UNSPEC_ADDRESS_TYPE (x);
1976 x = UNSPEC_ADDRESS (x);
1977 }
1978 else if (GET_CODE (x) == SYMBOL_REF || GET_CODE (x) == LABEL_REF)
1979 {
1980 *symbol_type = mips_classify_symbol (x, context);
1981 if (*symbol_type == SYMBOL_TLS)
1982 return false;
1983 }
1984 else
1985 return false;
1986
1987 if (offset == const0_rtx)
1988 return true;
1989
1990 /* Check whether a nonzero offset is valid for the underlying
1991 relocations. */
1992 switch (*symbol_type)
1993 {
1994 case SYMBOL_ABSOLUTE:
1995 case SYMBOL_64_HIGH:
1996 case SYMBOL_64_MID:
1997 case SYMBOL_64_LOW:
1998 /* If the target has 64-bit pointers and the object file only
1999 supports 32-bit symbols, the values of those symbols will be
2000 sign-extended. In this case we can't allow an arbitrary offset
2001 in case the 32-bit value X + OFFSET has a different sign from X. */
2002 if (Pmode == DImode && !ABI_HAS_64BIT_SYMBOLS)
2003 return offset_within_block_p (x, INTVAL (offset));
2004
2005 /* In other cases the relocations can handle any offset. */
2006 return true;
2007
2008 case SYMBOL_PC_RELATIVE:
2009 /* Allow constant pool references to be converted to LABEL+CONSTANT.
2010 In this case, we no longer have access to the underlying constant,
2011 but the original symbol-based access was known to be valid. */
2012 if (GET_CODE (x) == LABEL_REF)
2013 return true;
2014
2015 /* Fall through. */
2016
2017 case SYMBOL_GP_RELATIVE:
2018 /* Make sure that the offset refers to something within the
2019 same object block. This should guarantee that the final
2020 PC- or GP-relative offset is within the 16-bit limit. */
2021 return offset_within_block_p (x, INTVAL (offset));
2022
2023 case SYMBOL_GOT_PAGE_OFST:
2024 case SYMBOL_GOTOFF_PAGE:
2025 /* If the symbol is global, the GOT entry will contain the symbol's
2026 address, and we will apply a 16-bit offset after loading it.
2027 If the symbol is local, the linker should provide enough local
2028 GOT entries for a 16-bit offset, but larger offsets may lead
2029 to GOT overflow. */
2030 return SMALL_INT (offset);
2031
2032 case SYMBOL_TPREL:
2033 case SYMBOL_DTPREL:
2034 /* There is no carry between the HI and LO REL relocations, so the
2035 offset is only valid if we know it won't lead to such a carry. */
2036 return mips_offset_within_alignment_p (x, INTVAL (offset));
2037
2038 case SYMBOL_GOT_DISP:
2039 case SYMBOL_GOTOFF_DISP:
2040 case SYMBOL_GOTOFF_CALL:
2041 case SYMBOL_GOTOFF_LOADGP:
2042 case SYMBOL_TLSGD:
2043 case SYMBOL_TLSLDM:
2044 case SYMBOL_GOTTPREL:
2045 case SYMBOL_TLS:
2046 case SYMBOL_HALF:
2047 return false;
2048 }
2049 gcc_unreachable ();
2050 }
2051 \f
2052 /* Like mips_symbol_insns, but treat extended MIPS16 instructions as a
2053 single instruction. We rely on the fact that, in the worst case,
2054 all instructions involved in a MIPS16 address calculation are
2055 extended ones. */
2056
2057 static int
2058 mips_symbol_insns_1 (enum mips_symbol_type type, enum machine_mode mode)
2059 {
2060 if (mips_use_pcrel_pool_p[(int) type])
2061 {
2062 if (mode == MAX_MACHINE_MODE)
2063 /* LEAs will be converted into constant-pool references by
2064 mips_reorg. */
2065 type = SYMBOL_PC_RELATIVE;
2066 else
2067 /* The constant must be loaded and then dereferenced. */
2068 return 0;
2069 }
2070
2071 switch (type)
2072 {
2073 case SYMBOL_ABSOLUTE:
2074 /* When using 64-bit symbols, we need 5 preparatory instructions,
2075 such as:
2076
2077 lui $at,%highest(symbol)
2078 daddiu $at,$at,%higher(symbol)
2079 dsll $at,$at,16
2080 daddiu $at,$at,%hi(symbol)
2081 dsll $at,$at,16
2082
2083 The final address is then $at + %lo(symbol). With 32-bit
2084 symbols we just need a preparatory LUI for normal mode and
2085 a preparatory LI and SLL for MIPS16. */
2086 return ABI_HAS_64BIT_SYMBOLS ? 6 : TARGET_MIPS16 ? 3 : 2;
2087
2088 case SYMBOL_GP_RELATIVE:
2089 /* Treat GP-relative accesses as taking a single instruction on
2090 MIPS16 too; the copy of $gp can often be shared. */
2091 return 1;
2092
2093 case SYMBOL_PC_RELATIVE:
2094 /* PC-relative constants can only be used with ADDIUPC,
2095 DADDIUPC, LWPC and LDPC. */
2096 if (mode == MAX_MACHINE_MODE
2097 || GET_MODE_SIZE (mode) == 4
2098 || GET_MODE_SIZE (mode) == 8)
2099 return 1;
2100
2101 /* The constant must be loaded using ADDIUPC or DADDIUPC first. */
2102 return 0;
2103
2104 case SYMBOL_GOT_DISP:
2105 /* The constant will have to be loaded from the GOT before it
2106 is used in an address. */
2107 if (mode != MAX_MACHINE_MODE)
2108 return 0;
2109
2110 /* Fall through. */
2111
2112 case SYMBOL_GOT_PAGE_OFST:
2113 /* Unless -funit-at-a-time is in effect, we can't be sure whether the
2114 local/global classification is accurate. The worst cases are:
2115
2116 (1) For local symbols when generating o32 or o64 code. The assembler
2117 will use:
2118
2119 lw $at,%got(symbol)
2120 nop
2121
2122 ...and the final address will be $at + %lo(symbol).
2123
2124 (2) For global symbols when -mxgot. The assembler will use:
2125
2126 lui $at,%got_hi(symbol)
2127 (d)addu $at,$at,$gp
2128
2129 ...and the final address will be $at + %got_lo(symbol). */
2130 return 3;
2131
2132 case SYMBOL_GOTOFF_PAGE:
2133 case SYMBOL_GOTOFF_DISP:
2134 case SYMBOL_GOTOFF_CALL:
2135 case SYMBOL_GOTOFF_LOADGP:
2136 case SYMBOL_64_HIGH:
2137 case SYMBOL_64_MID:
2138 case SYMBOL_64_LOW:
2139 case SYMBOL_TLSGD:
2140 case SYMBOL_TLSLDM:
2141 case SYMBOL_DTPREL:
2142 case SYMBOL_GOTTPREL:
2143 case SYMBOL_TPREL:
2144 case SYMBOL_HALF:
2145 /* A 16-bit constant formed by a single relocation, or a 32-bit
2146 constant formed from a high 16-bit relocation and a low 16-bit
2147 relocation. Use mips_split_p to determine which. 32-bit
2148 constants need an "lui; addiu" sequence for normal mode and
2149 an "li; sll; addiu" sequence for MIPS16 mode. */
2150 return !mips_split_p[type] ? 1 : TARGET_MIPS16 ? 3 : 2;
2151
2152 case SYMBOL_TLS:
2153 /* We don't treat a bare TLS symbol as a constant. */
2154 return 0;
2155 }
2156 gcc_unreachable ();
2157 }
2158
2159 /* If MODE is MAX_MACHINE_MODE, return the number of instructions needed
2160 to load symbols of type TYPE into a register. Return 0 if the given
2161 type of symbol cannot be used as an immediate operand.
2162
2163 Otherwise, return the number of instructions needed to load or store
2164 values of mode MODE to or from addresses of type TYPE. Return 0 if
2165 the given type of symbol is not valid in addresses.
2166
2167 In both cases, instruction counts are based off BASE_INSN_LENGTH. */
2168
2169 static int
2170 mips_symbol_insns (enum mips_symbol_type type, enum machine_mode mode)
2171 {
2172 return mips_symbol_insns_1 (type, mode) * (TARGET_MIPS16 ? 2 : 1);
2173 }
2174 \f
2175 /* Implement TARGET_CANNOT_FORCE_CONST_MEM. */
2176
2177 static bool
2178 mips_cannot_force_const_mem (enum machine_mode mode, rtx x)
2179 {
2180 enum mips_symbol_type type;
2181 rtx base, offset;
2182
2183 /* There is no assembler syntax for expressing an address-sized
2184 high part. */
2185 if (GET_CODE (x) == HIGH)
2186 return true;
2187
2188 /* As an optimization, reject constants that mips_legitimize_move
2189 can expand inline.
2190
2191 Suppose we have a multi-instruction sequence that loads constant C
2192 into register R. If R does not get allocated a hard register, and
2193 R is used in an operand that allows both registers and memory
2194 references, reload will consider forcing C into memory and using
2195 one of the instruction's memory alternatives. Returning false
2196 here will force it to use an input reload instead. */
2197 if (CONST_INT_P (x) && mips_legitimate_constant_p (mode, x))
2198 return true;
2199
2200 split_const (x, &base, &offset);
2201 if (mips_symbolic_constant_p (base, SYMBOL_CONTEXT_LEA, &type))
2202 {
2203 /* See whether we explicitly want these symbols in the pool. */
2204 if (mips_use_pcrel_pool_p[(int) type])
2205 return false;
2206
2207 /* The same optimization as for CONST_INT. */
2208 if (SMALL_INT (offset) && mips_symbol_insns (type, MAX_MACHINE_MODE) > 0)
2209 return true;
2210
2211 /* If MIPS16 constant pools live in the text section, they should
2212 not refer to anything that might need run-time relocation. */
2213 if (TARGET_MIPS16_PCREL_LOADS && mips_got_symbol_type_p (type))
2214 return true;
2215 }
2216
2217 /* TLS symbols must be computed by mips_legitimize_move. */
2218 if (tls_referenced_p (x))
2219 return true;
2220
2221 return false;
2222 }
2223
2224 /* Implement TARGET_USE_BLOCKS_FOR_CONSTANT_P. We can't use blocks for
2225 constants when we're using a per-function constant pool. */
2226
2227 static bool
2228 mips_use_blocks_for_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED,
2229 const_rtx x ATTRIBUTE_UNUSED)
2230 {
2231 return !TARGET_MIPS16_PCREL_LOADS;
2232 }
2233 \f
2234 /* Return true if register REGNO is a valid base register for mode MODE.
2235 STRICT_P is true if REG_OK_STRICT is in effect. */
2236
2237 int
2238 mips_regno_mode_ok_for_base_p (int regno, enum machine_mode mode,
2239 bool strict_p)
2240 {
2241 if (!HARD_REGISTER_NUM_P (regno))
2242 {
2243 if (!strict_p)
2244 return true;
2245 regno = reg_renumber[regno];
2246 }
2247
2248 /* These fake registers will be eliminated to either the stack or
2249 hard frame pointer, both of which are usually valid base registers.
2250 Reload deals with the cases where the eliminated form isn't valid. */
2251 if (regno == ARG_POINTER_REGNUM || regno == FRAME_POINTER_REGNUM)
2252 return true;
2253
2254 /* In MIPS16 mode, the stack pointer can only address word and doubleword
2255 values, nothing smaller. */
2256 if (TARGET_MIPS16 && regno == STACK_POINTER_REGNUM)
2257 return GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8;
2258
2259 return TARGET_MIPS16 ? M16_REG_P (regno) : GP_REG_P (regno);
2260 }
2261
2262 /* Return true if X is a valid base register for mode MODE.
2263 STRICT_P is true if REG_OK_STRICT is in effect. */
2264
2265 static bool
2266 mips_valid_base_register_p (rtx x, enum machine_mode mode, bool strict_p)
2267 {
2268 if (!strict_p && GET_CODE (x) == SUBREG)
2269 x = SUBREG_REG (x);
2270
2271 return (REG_P (x)
2272 && mips_regno_mode_ok_for_base_p (REGNO (x), mode, strict_p));
2273 }
2274
2275 /* Return true if, for every base register BASE_REG, (plus BASE_REG X)
2276 can address a value of mode MODE. */
2277
2278 static bool
2279 mips_valid_offset_p (rtx x, enum machine_mode mode)
2280 {
2281 /* Check that X is a signed 16-bit number. */
2282 if (!const_arith_operand (x, Pmode))
2283 return false;
2284
2285 /* We may need to split multiword moves, so make sure that every word
2286 is accessible. */
2287 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2288 && !SMALL_OPERAND (INTVAL (x) + GET_MODE_SIZE (mode) - UNITS_PER_WORD))
2289 return false;
2290
2291 return true;
2292 }
2293
2294 /* Return true if a LO_SUM can address a value of mode MODE when the
2295 LO_SUM symbol has type SYMBOL_TYPE. */
2296
2297 static bool
2298 mips_valid_lo_sum_p (enum mips_symbol_type symbol_type, enum machine_mode mode)
2299 {
2300 /* Check that symbols of type SYMBOL_TYPE can be used to access values
2301 of mode MODE. */
2302 if (mips_symbol_insns (symbol_type, mode) == 0)
2303 return false;
2304
2305 /* Check that there is a known low-part relocation. */
2306 if (mips_lo_relocs[symbol_type] == NULL)
2307 return false;
2308
2309 /* We may need to split multiword moves, so make sure that each word
2310 can be accessed without inducing a carry. This is mainly needed
2311 for o64, which has historically only guaranteed 64-bit alignment
2312 for 128-bit types. */
2313 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2314 && GET_MODE_BITSIZE (mode) > GET_MODE_ALIGNMENT (mode))
2315 return false;
2316
2317 return true;
2318 }
2319
2320 /* Return true if X is a valid address for machine mode MODE. If it is,
2321 fill in INFO appropriately. STRICT_P is true if REG_OK_STRICT is in
2322 effect. */
2323
2324 static bool
2325 mips_classify_address (struct mips_address_info *info, rtx x,
2326 enum machine_mode mode, bool strict_p)
2327 {
2328 switch (GET_CODE (x))
2329 {
2330 case REG:
2331 case SUBREG:
2332 info->type = ADDRESS_REG;
2333 info->reg = x;
2334 info->offset = const0_rtx;
2335 return mips_valid_base_register_p (info->reg, mode, strict_p);
2336
2337 case PLUS:
2338 info->type = ADDRESS_REG;
2339 info->reg = XEXP (x, 0);
2340 info->offset = XEXP (x, 1);
2341 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2342 && mips_valid_offset_p (info->offset, mode));
2343
2344 case LO_SUM:
2345 info->type = ADDRESS_LO_SUM;
2346 info->reg = XEXP (x, 0);
2347 info->offset = XEXP (x, 1);
2348 /* We have to trust the creator of the LO_SUM to do something vaguely
2349 sane. Target-independent code that creates a LO_SUM should also
2350 create and verify the matching HIGH. Target-independent code that
2351 adds an offset to a LO_SUM must prove that the offset will not
2352 induce a carry. Failure to do either of these things would be
2353 a bug, and we are not required to check for it here. The MIPS
2354 backend itself should only create LO_SUMs for valid symbolic
2355 constants, with the high part being either a HIGH or a copy
2356 of _gp. */
2357 info->symbol_type
2358 = mips_classify_symbolic_expression (info->offset, SYMBOL_CONTEXT_MEM);
2359 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2360 && mips_valid_lo_sum_p (info->symbol_type, mode));
2361
2362 case CONST_INT:
2363 /* Small-integer addresses don't occur very often, but they
2364 are legitimate if $0 is a valid base register. */
2365 info->type = ADDRESS_CONST_INT;
2366 return !TARGET_MIPS16 && SMALL_INT (x);
2367
2368 case CONST:
2369 case LABEL_REF:
2370 case SYMBOL_REF:
2371 info->type = ADDRESS_SYMBOLIC;
2372 return (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_MEM,
2373 &info->symbol_type)
2374 && mips_symbol_insns (info->symbol_type, mode) > 0
2375 && !mips_split_p[info->symbol_type]);
2376
2377 default:
2378 return false;
2379 }
2380 }
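
/* Illustrative examples of the classification above:

	(reg $sp)				ADDRESS_REG, offset 0
	(plus (reg $sp) (const_int 16))		ADDRESS_REG, offset 16
	(lo_sum (reg $at) (symbol_ref "foo"))	ADDRESS_LO_SUM
	(const_int 4)				ADDRESS_CONST_INT (not MIPS16)
	(symbol_ref "foo")			ADDRESS_SYMBOLIC

   Each is legitimate only if the corresponding checks above pass.  */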
2381
2382 /* Implement TARGET_LEGITIMATE_ADDRESS_P. */
2383
2384 static bool
2385 mips_legitimate_address_p (enum machine_mode mode, rtx x, bool strict_p)
2386 {
2387 struct mips_address_info addr;
2388
2389 return mips_classify_address (&addr, x, mode, strict_p);
2390 }
2391
2392 /* Return true if X is a legitimate $sp-based address for mode MODE. */
2393
2394 bool
2395 mips_stack_address_p (rtx x, enum machine_mode mode)
2396 {
2397 struct mips_address_info addr;
2398
2399 return (mips_classify_address (&addr, x, mode, false)
2400 && addr.type == ADDRESS_REG
2401 && addr.reg == stack_pointer_rtx);
2402 }
2403
2404 /* Return true if ADDR matches the pattern for the LWXS load scaled indexed
2405 address instruction. Note that such addresses are not considered
2406 legitimate in the TARGET_LEGITIMATE_ADDRESS_P sense, because their use
2407 is so restricted. */
2408
2409 static bool
2410 mips_lwxs_address_p (rtx addr)
2411 {
2412 if (ISA_HAS_LWXS
2413 && GET_CODE (addr) == PLUS
2414 && REG_P (XEXP (addr, 1)))
2415 {
2416 rtx offset = XEXP (addr, 0);
2417 if (GET_CODE (offset) == MULT
2418 && REG_P (XEXP (offset, 0))
2419 && CONST_INT_P (XEXP (offset, 1))
2420 && INTVAL (XEXP (offset, 1)) == 4)
2421 return true;
2422 }
2423 return false;
2424 }
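
/* The pattern accepted above is (plus (mult index 4) base), which
   matches the effective address BASE + INDEX * 4 computed by
   "lwxs rd,index(base)".  */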
2425
2426 /* Return true if ADDR matches the pattern for the L{B,H,W,D}{,U}X load
2427 indexed address instruction. Note that such addresses are
2428 not considered legitimate in the TARGET_LEGITIMATE_ADDRESS_P
2429 sense, because their use is so restricted. */
2430
2431 static bool
2432 mips_lx_address_p (rtx addr, enum machine_mode mode)
2433 {
2434 if (GET_CODE (addr) != PLUS
2435 || !REG_P (XEXP (addr, 0))
2436 || !REG_P (XEXP (addr, 1)))
2437 return false;
2438 if (ISA_HAS_LBX && mode == QImode)
2439 return true;
2440 if (ISA_HAS_LHX && mode == HImode)
2441 return true;
2442 if (ISA_HAS_LWX && mode == SImode)
2443 return true;
2444 if (ISA_HAS_LDX && mode == DImode)
2445 return true;
2446 return false;
2447 }
2448 \f
2449 /* Return true if a value at OFFSET bytes from base register BASE can be
2450 accessed using an unextended MIPS16 instruction. MODE is the mode of
2451 the value.
2452
2453 Usually the offset in an unextended instruction is a 5-bit field.
2454 The offset is unsigned and shifted left once for LH and SH, twice
2455 for LW and SW, and so on. The exceptions are LWSP and SWSP, which
2456 have an 8-bit immediate field that is shifted left twice. */
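
/* For example (illustrative): with MODE == SImode, an unextended LW
   can reach offsets 0, 4, ..., 124 (a 5-bit field shifted left twice),
   while an unextended LWSP can reach offsets 0, 4, ..., 1020 from $sp
   (an 8-bit field shifted left twice).  */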
2457
2458 static bool
2459 mips16_unextended_reference_p (enum machine_mode mode, rtx base,
2460 unsigned HOST_WIDE_INT offset)
2461 {
2462 if (mode != BLKmode && offset % GET_MODE_SIZE (mode) == 0)
2463 {
2464 if (GET_MODE_SIZE (mode) == 4 && base == stack_pointer_rtx)
2465 return offset < 256U * GET_MODE_SIZE (mode);
2466 return offset < 32U * GET_MODE_SIZE (mode);
2467 }
2468 return false;
2469 }
2470
2471 /* Return the number of instructions needed to load or store a value
2472 of mode MODE at address X, assuming that BASE_INSN_LENGTH is the
2473 length of one instruction. Return 0 if X isn't valid for MODE.
2474 Assume that multiword moves may need to be split into word moves
2475 if MIGHT_SPLIT_P, otherwise assume that a single load or store is
2476 enough. */
2477
2478 int
2479 mips_address_insns (rtx x, enum machine_mode mode, bool might_split_p)
2480 {
2481 struct mips_address_info addr;
2482 int factor;
2483
2484 /* BLKmode is used for single unaligned loads and stores and should
2485 not count as a multiword mode. (GET_MODE_SIZE (BLKmode) is pretty
2486 meaningless, so we have to single it out as a special case one way
2487 or the other.) */
2488 if (mode != BLKmode && might_split_p)
2489 factor = (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
2490 else
2491 factor = 1;
2492
2493 if (mips_classify_address (&addr, x, mode, false))
2494 switch (addr.type)
2495 {
2496 case ADDRESS_REG:
2497 if (TARGET_MIPS16
2498 && !mips16_unextended_reference_p (mode, addr.reg,
2499 UINTVAL (addr.offset)))
2500 return factor * 2;
2501 return factor;
2502
2503 case ADDRESS_LO_SUM:
2504 return TARGET_MIPS16 ? factor * 2 : factor;
2505
2506 case ADDRESS_CONST_INT:
2507 return factor;
2508
2509 case ADDRESS_SYMBOLIC:
2510 return factor * mips_symbol_insns (addr.symbol_type, mode);
2511 }
2512 return 0;
2513 }
2514
2515 /* Return true if X fits within an unsigned field of BITS bits that is
2516 shifted left SHIFT bits before being used. */
2517
2518 bool
2519 mips_unsigned_immediate_p (unsigned HOST_WIDE_INT x, int bits, int shift = 0)
2520 {
2521 return (x & ((1 << shift) - 1)) == 0 && x < ((unsigned) 1 << (shift + bits));
2522 }
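
/* For example (illustrative): mips_unsigned_immediate_p (x, 5, 2)
   accepts exactly the word-aligned values 0, 4, ..., 124 that fit an
   unextended MIPS16 LW offset field.  */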
2523
2524 /* Return true if X fits within a signed field of BITS bits that is
2525 shifted left SHIFT bits before being used. */
2526
2527 bool
2528 mips_signed_immediate_p (unsigned HOST_WIDE_INT x, int bits, int shift = 0)
2529 {
2530 x += 1 << (bits + shift - 1);
2531 return mips_unsigned_immediate_p (x, bits, shift);
2532 }
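
/* For example (illustrative): mips_signed_immediate_p (x, 16) adds
   0x8000 to X, mapping the signed range [-0x8000, 0x7fff] onto the
   unsigned range [0, 0xffff] tested by the function above.  */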
2533
2534 /* Return true if X is legitimate for accessing values of mode MODE,
2535 if it is based on a MIPS16 register, and if the offset satisfies
2536 OFFSET_PREDICATE. */
2537
2538 bool
2539 m16_based_address_p (rtx x, enum machine_mode mode,
2540 insn_operand_predicate_fn offset_predicate)
2541 {
2542 struct mips_address_info addr;
2543
2544 return (mips_classify_address (&addr, x, mode, false)
2545 && addr.type == ADDRESS_REG
2546 && M16_REG_P (REGNO (addr.reg))
2547 && offset_predicate (addr.offset, mode));
2548 }
2549
2550 /* Return true if X is a legitimate address that conforms to the requirements
2551 for a microMIPS LWSP or SWSP insn. */
2552
2553 bool
2554 lwsp_swsp_address_p (rtx x, enum machine_mode mode)
2555 {
2556 struct mips_address_info addr;
2557
2558 return (mips_classify_address (&addr, x, mode, false)
2559 && addr.type == ADDRESS_REG
2560 && REGNO (addr.reg) == STACK_POINTER_REGNUM
2561 && uw5_operand (addr.offset, mode));
2562 }
2563
2564 /* Return true if X is a legitimate address with a 12-bit offset.
2565 MODE is the mode of the value being accessed. */
2566
2567 bool
2568 umips_12bit_offset_address_p (rtx x, enum machine_mode mode)
2569 {
2570 struct mips_address_info addr;
2571
2572 return (mips_classify_address (&addr, x, mode, false)
2573 && addr.type == ADDRESS_REG
2574 && CONST_INT_P (addr.offset)
2575 && UMIPS_12BIT_OFFSET_P (INTVAL (addr.offset)));
2576 }
2577
2578 /* Return the number of instructions needed to load constant X,
2579 assuming that BASE_INSN_LENGTH is the length of one instruction.
2580 Return 0 if X isn't a valid constant. */
2581
2582 int
2583 mips_const_insns (rtx x)
2584 {
2585 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
2586 enum mips_symbol_type symbol_type;
2587 rtx offset;
2588
2589 switch (GET_CODE (x))
2590 {
2591 case HIGH:
2592 if (!mips_symbolic_constant_p (XEXP (x, 0), SYMBOL_CONTEXT_LEA,
2593 &symbol_type)
2594 || !mips_split_p[symbol_type])
2595 return 0;
2596
2597 /* This is simply an LUI for normal mode. It is an extended
2598 LI followed by an extended SLL for MIPS16. */
2599 return TARGET_MIPS16 ? 4 : 1;
2600
2601 case CONST_INT:
2602 if (TARGET_MIPS16)
2603 /* Unsigned 8-bit constants can be loaded using an unextended
2604 LI instruction. Unsigned 16-bit constants can be loaded
2605 using an extended LI. Negative constants must be loaded
2606 using LI and then negated. */
2607 return (IN_RANGE (INTVAL (x), 0, 255) ? 1
2608 : SMALL_OPERAND_UNSIGNED (INTVAL (x)) ? 2
2609 : IN_RANGE (-INTVAL (x), 0, 255) ? 2
2610 : SMALL_OPERAND_UNSIGNED (-INTVAL (x)) ? 3
2611 : 0);
2612
2613 return mips_build_integer (codes, INTVAL (x));
2614
2615 case CONST_DOUBLE:
2616 case CONST_VECTOR:
2617 /* Allow zeros for normal mode, where we can use $0. */
2618 return !TARGET_MIPS16 && x == CONST0_RTX (GET_MODE (x)) ? 1 : 0;
2619
2620 case CONST:
2621 if (CONST_GP_P (x))
2622 return 1;
2623
2624 /* See if we can refer to X directly. */
2625 if (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_LEA, &symbol_type))
2626 return mips_symbol_insns (symbol_type, MAX_MACHINE_MODE);
2627
2628 /* Otherwise try splitting the constant into a base and offset.
2629 If the offset is a 16-bit value, we can load the base address
2630 into a register and then use (D)ADDIU to add in the offset.
2631 If the offset is larger, we can load the base and offset
2632 into separate registers and add them together with (D)ADDU.
2633 However, the latter is only possible before reload; during
2634 and after reload, we must have the option of forcing the
2635 constant into the pool instead. */
2636 split_const (x, &x, &offset);
2637 if (offset != 0)
2638 {
2639 int n = mips_const_insns (x);
2640 if (n != 0)
2641 {
2642 if (SMALL_INT (offset))
2643 return n + 1;
2644 else if (!targetm.cannot_force_const_mem (GET_MODE (x), x))
2645 return n + 1 + mips_build_integer (codes, INTVAL (offset));
2646 }
2647 }
2648 return 0;
2649
2650 case SYMBOL_REF:
2651 case LABEL_REF:
2652 return mips_symbol_insns (mips_classify_symbol (x, SYMBOL_CONTEXT_LEA),
2653 MAX_MACHINE_MODE);
2654
2655 default:
2656 return 0;
2657 }
2658 }
2659
2660 /* X is a doubleword constant that can be handled by splitting it into
2661 two words and loading each word separately. Return the number of
2662 instructions required to do this, assuming that BASE_INSN_LENGTH
2663 is the length of one instruction. */
2664
2665 int
2666 mips_split_const_insns (rtx x)
2667 {
2668 unsigned int low, high;
2669
2670 low = mips_const_insns (mips_subword (x, false));
2671 high = mips_const_insns (mips_subword (x, true));
2672 gcc_assert (low > 0 && high > 0);
2673 return low + high;
2674 }
2675
2676 /* Return the number of instructions needed to implement INSN,
2677 given that it loads from or stores to MEM. Assume that
2678 BASE_INSN_LENGTH is the length of one instruction. */
2679
2680 int
2681 mips_load_store_insns (rtx mem, rtx insn)
2682 {
2683 enum machine_mode mode;
2684 bool might_split_p;
2685 rtx set;
2686
2687 gcc_assert (MEM_P (mem));
2688 mode = GET_MODE (mem);
2689
2690 /* Try to prove that INSN does not need to be split. */
2691 might_split_p = GET_MODE_SIZE (mode) > UNITS_PER_WORD;
2692 if (might_split_p)
2693 {
2694 set = single_set (insn);
2695 if (set && !mips_split_move_insn_p (SET_DEST (set), SET_SRC (set), insn))
2696 might_split_p = false;
2697 }
2698
2699 return mips_address_insns (XEXP (mem, 0), mode, might_split_p);
2700 }
2701
2702 /* Return the number of instructions needed for an integer division,
2703 assuming that BASE_INSN_LENGTH is the length of one instruction. */
2704
2705 int
2706 mips_idiv_insns (void)
2707 {
2708 int count;
2709
2710 count = 1;
2711 if (TARGET_CHECK_ZERO_DIV)
2712 {
2713 if (GENERATE_DIVIDE_TRAPS)
2714 count++;
2715 else
2716 count += 2;
2717 }
2718
2719 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
2720 count++;
2721 return count;
2722 }
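
/* For example (illustrative): with TARGET_CHECK_ZERO_DIV and
   GENERATE_DIVIDE_TRAPS, the count is 2, corresponding to a sequence
   such as:

	div	$0,$4,$5
	teq	$5,$0,7

   Without divide traps, the zero check is a branch plus a break
   (3 instructions in all), and -mfix-r4000 or -mfix-r4400 adds one
   more.  */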
2723 \f
2724 /* Emit a move from SRC to DEST. Assume that the move expanders can
2725 handle all moves if !can_create_pseudo_p (). The distinction is
2726 important because, unlike emit_move_insn, the move expanders know
2727 how to force Pmode objects into the constant pool even when the
2728 constant pool address is not itself legitimate. */
2729
2730 rtx_insn *
2731 mips_emit_move (rtx dest, rtx src)
2732 {
2733 return (can_create_pseudo_p ()
2734 ? emit_move_insn (dest, src)
2735 : emit_move_insn_1 (dest, src));
2736 }
2737
2738 /* Emit a move from SRC to DEST, splitting compound moves into individual
2739 instructions. SPLIT_TYPE is the type of split to perform. */
2740
2741 static void
2742 mips_emit_move_or_split (rtx dest, rtx src, enum mips_split_type split_type)
2743 {
2744 if (mips_split_move_p (dest, src, split_type))
2745 mips_split_move (dest, src, split_type);
2746 else
2747 mips_emit_move (dest, src);
2748 }
2749
2750 /* Emit an instruction of the form (set TARGET (CODE OP0)). */
2751
2752 static void
2753 mips_emit_unary (enum rtx_code code, rtx target, rtx op0)
2754 {
2755 emit_insn (gen_rtx_SET (VOIDmode, target,
2756 gen_rtx_fmt_e (code, GET_MODE (op0), op0)));
2757 }
2758
2759 /* Compute (CODE OP0) and store the result in a new register of mode MODE.
2760 Return that new register. */
2761
2762 static rtx
2763 mips_force_unary (enum machine_mode mode, enum rtx_code code, rtx op0)
2764 {
2765 rtx reg;
2766
2767 reg = gen_reg_rtx (mode);
2768 mips_emit_unary (code, reg, op0);
2769 return reg;
2770 }
2771
2772 /* Emit an instruction of the form (set TARGET (CODE OP0 OP1)). */
2773
2774 void
2775 mips_emit_binary (enum rtx_code code, rtx target, rtx op0, rtx op1)
2776 {
2777 emit_insn (gen_rtx_SET (VOIDmode, target,
2778 gen_rtx_fmt_ee (code, GET_MODE (target), op0, op1)));
2779 }
2780
2781 /* Compute (CODE OP0 OP1) and store the result in a new register
2782 of mode MODE. Return that new register. */
2783
2784 static rtx
2785 mips_force_binary (enum machine_mode mode, enum rtx_code code, rtx op0, rtx op1)
2786 {
2787 rtx reg;
2788
2789 reg = gen_reg_rtx (mode);
2790 mips_emit_binary (code, reg, op0, op1);
2791 return reg;
2792 }
2793
2794 /* Copy VALUE to a register and return that register. If new pseudos
2795 are allowed, copy it into a new register, otherwise use DEST. */
2796
2797 static rtx
2798 mips_force_temporary (rtx dest, rtx value)
2799 {
2800 if (can_create_pseudo_p ())
2801 return force_reg (Pmode, value);
2802 else
2803 {
2804 mips_emit_move (dest, value);
2805 return dest;
2806 }
2807 }
2808
2809 /* Emit a call sequence with call pattern PATTERN and return the call
2810 instruction itself (which is not necessarily the last instruction
2811 emitted). ORIG_ADDR is the original, unlegitimized address,
2812 ADDR is the legitimized form, and LAZY_P is true if the call
2813 address is lazily-bound. */
2814
2815 static rtx_insn *
2816 mips_emit_call_insn (rtx pattern, rtx orig_addr, rtx addr, bool lazy_p)
2817 {
2818 rtx_insn *insn;
2819 rtx reg;
2820
2821 insn = emit_call_insn (pattern);
2822
2823 if (TARGET_MIPS16 && mips_use_pic_fn_addr_reg_p (orig_addr))
2824 {
2825 /* MIPS16 JALRs only take MIPS16 registers. If the target
2826 function requires $25 to be valid on entry, we must copy it
2827 there separately. The move instruction can be put in the
2828 call's delay slot. */
2829 reg = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
2830 emit_insn_before (gen_move_insn (reg, addr), insn);
2831 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), reg);
2832 }
2833
2834 if (lazy_p)
2835 /* Lazy-binding stubs require $gp to be valid on entry. */
2836 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), pic_offset_table_rtx);
2837
2838 if (TARGET_USE_GOT)
2839 {
2840 /* See the comment above load_call<mode> for details. */
2841 use_reg (&CALL_INSN_FUNCTION_USAGE (insn),
2842 gen_rtx_REG (Pmode, GOT_VERSION_REGNUM));
2843 emit_insn (gen_update_got_version ());
2844 }
2845
2846 if (TARGET_MIPS16
2847 && TARGET_EXPLICIT_RELOCS
2848 && TARGET_CALL_CLOBBERED_GP)
2849 {
2850 rtx post_call_tmp_reg = gen_rtx_REG (word_mode, POST_CALL_TMP_REG);
2851 clobber_reg (&CALL_INSN_FUNCTION_USAGE (insn), post_call_tmp_reg);
2852 }
2853
2854 return insn;
2855 }
2856 \f
2857 /* Wrap symbol or label BASE in an UNSPEC address of type SYMBOL_TYPE,
2858 then add CONST_INT OFFSET to the result. */
2859
2860 static rtx
2861 mips_unspec_address_offset (rtx base, rtx offset,
2862 enum mips_symbol_type symbol_type)
2863 {
2864 base = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, base),
2865 UNSPEC_ADDRESS_FIRST + symbol_type);
2866 if (offset != const0_rtx)
2867 base = gen_rtx_PLUS (Pmode, base, offset);
2868 return gen_rtx_CONST (Pmode, base);
2869 }
2870
2871 /* Return an UNSPEC address with underlying address ADDRESS and symbol
2872 type SYMBOL_TYPE. */
2873
2874 rtx
2875 mips_unspec_address (rtx address, enum mips_symbol_type symbol_type)
2876 {
2877 rtx base, offset;
2878
2879 split_const (address, &base, &offset);
2880 return mips_unspec_address_offset (base, offset, symbol_type);
2881 }
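
/* For example (illustrative): wrapping "foo + 4" with type
   SYMBOL_GP_RELATIVE produces

	(const (plus (unspec [(symbol_ref "foo")] UNSPEC_ADDRESS_FIRST
						  + SYMBOL_GP_RELATIVE)
		     (const_int 4)))

   which mips_strip_unspec_address below reduces back to foo + 4.  */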
2882
2883 /* If OP is an UNSPEC address, return the address to which it refers,
2884 otherwise return OP itself. */
2885
2886 rtx
2887 mips_strip_unspec_address (rtx op)
2888 {
2889 rtx base, offset;
2890
2891 split_const (op, &base, &offset);
2892 if (UNSPEC_ADDRESS_P (base))
2893 op = plus_constant (Pmode, UNSPEC_ADDRESS (base), INTVAL (offset));
2894 return op;
2895 }
2896
2897 /* If mips_unspec_address (ADDR, SYMBOL_TYPE) is a 32-bit value, add the
2898 high part to BASE and return the result. Just return BASE otherwise.
2899 TEMP is as for mips_force_temporary.
2900
2901 The returned expression can be used as the first operand to a LO_SUM. */
2902
2903 static rtx
2904 mips_unspec_offset_high (rtx temp, rtx base, rtx addr,
2905 enum mips_symbol_type symbol_type)
2906 {
2907 if (mips_split_p[symbol_type])
2908 {
2909 addr = gen_rtx_HIGH (Pmode, mips_unspec_address (addr, symbol_type));
2910 addr = mips_force_temporary (temp, addr);
2911 base = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, addr, base));
2912 }
2913 return base;
2914 }
2915 \f
2916 /* Return an instruction that copies $gp into register REG. We want
2917 GCC to treat the register's value as constant, so that its value
2918 can be rematerialized on demand. */
2919
2920 static rtx
2921 gen_load_const_gp (rtx reg)
2922 {
2923 return PMODE_INSN (gen_load_const_gp, (reg));
2924 }
2925
2926 /* Return a pseudo register that contains the value of $gp throughout
2927 the current function. Such registers are needed by MIPS16 functions,
2928 for which $gp itself is not a valid base register or addition operand. */
2929
2930 static rtx
2931 mips16_gp_pseudo_reg (void)
2932 {
2933 if (cfun->machine->mips16_gp_pseudo_rtx == NULL_RTX)
2934 {
2935 rtx insn;
2936 rtx_insn *scan;
2937
2938 cfun->machine->mips16_gp_pseudo_rtx = gen_reg_rtx (Pmode);
2939
2940 push_topmost_sequence ();
2941
2942 scan = get_insns ();
2943 while (NEXT_INSN (scan) && !INSN_P (NEXT_INSN (scan)))
2944 scan = NEXT_INSN (scan);
2945
2946 insn = gen_load_const_gp (cfun->machine->mips16_gp_pseudo_rtx);
2947 insn = emit_insn_after (insn, scan);
2948 INSN_LOCATION (insn) = 0;
2949
2950 pop_topmost_sequence ();
2951 }
2952
2953 return cfun->machine->mips16_gp_pseudo_rtx;
2954 }
2955
2956 /* Return a base register that holds pic_offset_table_rtx.
2957 TEMP, if nonnull, is a scratch Pmode base register. */
2958
2959 rtx
2960 mips_pic_base_register (rtx temp)
2961 {
2962 if (!TARGET_MIPS16)
2963 return pic_offset_table_rtx;
2964
2965 if (currently_expanding_to_rtl)
2966 return mips16_gp_pseudo_reg ();
2967
2968 if (can_create_pseudo_p ())
2969 temp = gen_reg_rtx (Pmode);
2970
2971 if (TARGET_USE_GOT)
2972 /* The first post-reload split exposes all references to $gp
2973 (both uses and definitions). All references must remain
2974 explicit after that point.
2975
2976 It is safe to introduce uses of $gp at any time, so for
2977 simplicity, we do that before the split too. */
2978 mips_emit_move (temp, pic_offset_table_rtx);
2979 else
2980 emit_insn (gen_load_const_gp (temp));
2981 return temp;
2982 }
2983
2984 /* Return the RHS of a load_call<mode> insn. */
2985
2986 static rtx
2987 mips_unspec_call (rtx reg, rtx symbol)
2988 {
2989 rtvec vec;
2990
2991 vec = gen_rtvec (3, reg, symbol, gen_rtx_REG (SImode, GOT_VERSION_REGNUM));
2992 return gen_rtx_UNSPEC (Pmode, vec, UNSPEC_LOAD_CALL);
2993 }
2994
2995 /* If SRC is the RHS of a load_call<mode> insn, return the underlying symbol
2996 reference. Return NULL_RTX otherwise. */
2997
2998 static rtx
2999 mips_strip_unspec_call (rtx src)
3000 {
3001 if (GET_CODE (src) == UNSPEC && XINT (src, 1) == UNSPEC_LOAD_CALL)
3002 return mips_strip_unspec_address (XVECEXP (src, 0, 1));
3003 return NULL_RTX;
3004 }
3005
3006 /* Create and return a GOT reference of type TYPE for address ADDR.
3007 TEMP, if nonnull, is a scratch Pmode base register. */
3008
3009 rtx
3010 mips_got_load (rtx temp, rtx addr, enum mips_symbol_type type)
3011 {
3012 rtx base, high, lo_sum_symbol;
3013
3014 base = mips_pic_base_register (temp);
3015
3016 /* If we used the temporary register to load $gp, we can't use
3017 it for the high part as well. */
3018 if (temp != NULL && reg_overlap_mentioned_p (base, temp))
3019 temp = NULL;
3020
3021 high = mips_unspec_offset_high (temp, base, addr, type);
3022 lo_sum_symbol = mips_unspec_address (addr, type);
3023
3024 if (type == SYMBOL_GOTOFF_CALL)
3025 return mips_unspec_call (high, lo_sum_symbol);
3026 else
3027 return PMODE_INSN (gen_unspec_got, (high, lo_sum_symbol));
3028 }
3029
3030 /* If MODE is MAX_MACHINE_MODE, ADDR appears as a move operand, otherwise
3031 it appears in a MEM of that mode. Return true if ADDR is a legitimate
3032 constant in that context and can be split into high and low parts.
3033 If so, and if LOW_OUT is nonnull, emit the high part and store the
3034 low part in *LOW_OUT. Leave *LOW_OUT unchanged otherwise.
3035
3036 TEMP is as for mips_force_temporary and is used to load the high
3037 part into a register.
3038
3039 When MODE is MAX_MACHINE_MODE, the low part is guaranteed to be
3040 a legitimate SET_SRC for an .md pattern, otherwise the low part
3041 is guaranteed to be a legitimate address for mode MODE. */
3042
3043 bool
3044 mips_split_symbol (rtx temp, rtx addr, enum machine_mode mode, rtx *low_out)
3045 {
3046 enum mips_symbol_context context;
3047 enum mips_symbol_type symbol_type;
3048 rtx high;
3049
3050 context = (mode == MAX_MACHINE_MODE
3051 ? SYMBOL_CONTEXT_LEA
3052 : SYMBOL_CONTEXT_MEM);
3053 if (GET_CODE (addr) == HIGH && context == SYMBOL_CONTEXT_LEA)
3054 {
3055 addr = XEXP (addr, 0);
3056 if (mips_symbolic_constant_p (addr, context, &symbol_type)
3057 && mips_symbol_insns (symbol_type, mode) > 0
3058 && mips_split_hi_p[symbol_type])
3059 {
3060 if (low_out)
3061 switch (symbol_type)
3062 {
3063 case SYMBOL_GOT_PAGE_OFST:
3064 /* The high part of a page/ofst pair is loaded from the GOT. */
3065 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_PAGE);
3066 break;
3067
3068 default:
3069 gcc_unreachable ();
3070 }
3071 return true;
3072 }
3073 }
3074 else
3075 {
3076 if (mips_symbolic_constant_p (addr, context, &symbol_type)
3077 && mips_symbol_insns (symbol_type, mode) > 0
3078 && mips_split_p[symbol_type])
3079 {
3080 if (low_out)
3081 switch (symbol_type)
3082 {
3083 case SYMBOL_GOT_DISP:
3084 /* SYMBOL_GOT_DISP symbols are loaded from the GOT. */
3085 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_DISP);
3086 break;
3087
3088 case SYMBOL_GP_RELATIVE:
3089 high = mips_pic_base_register (temp);
3090 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
3091 break;
3092
3093 default:
3094 high = gen_rtx_HIGH (Pmode, copy_rtx (addr));
3095 high = mips_force_temporary (temp, high);
3096 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
3097 break;
3098 }
3099 return true;
3100 }
3101 }
3102 return false;
3103 }
3104
3105 /* Return a legitimate address for REG + OFFSET. TEMP is as for
3106 mips_force_temporary; it is only needed when OFFSET is not a
3107 SMALL_OPERAND. */
3108
3109 static rtx
3110 mips_add_offset (rtx temp, rtx reg, HOST_WIDE_INT offset)
3111 {
3112 if (!SMALL_OPERAND (offset))
3113 {
3114 rtx high;
3115
3116 if (TARGET_MIPS16)
3117 {
3118 /* Load the full offset into a register so that we can use
3119 an unextended instruction for the address itself. */
3120 high = GEN_INT (offset);
3121 offset = 0;
3122 }
3123 else
3124 {
3125 /* Leave OFFSET as a 16-bit offset and put the excess in HIGH.
3126 The addition inside the macro CONST_HIGH_PART may cause an
3127 overflow, so we need to force a sign-extension check. */
3128 high = gen_int_mode (CONST_HIGH_PART (offset), Pmode);
3129 offset = CONST_LOW_PART (offset);
3130 }
3131 high = mips_force_temporary (temp, high);
3132 reg = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, high, reg));
3133 }
3134 return plus_constant (Pmode, reg, offset);
3135 }
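
/* For example (illustrative): in non-MIPS16 mode, REG + 0x18000 has an
   offset that is not a SMALL_OPERAND, so the code above emits

	lui	temp,0x2		# CONST_HIGH_PART (0x18000) == 0x20000
	addu	temp,temp,reg

   and returns the address temp + -0x8000 (the sign-extended
   CONST_LOW_PART).  */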
3136 \f
3137 /* The __tls_get_addr symbol. */
3138 static GTY(()) rtx mips_tls_symbol;
3139
3140 /* Return an instruction sequence that calls __tls_get_addr. SYM is
3141 the TLS symbol we are referencing and TYPE is the symbol type to use
3142 (either global dynamic or local dynamic). V0 is an RTX for the
3143 return value location. */
3144
3145 static rtx
3146 mips_call_tls_get_addr (rtx sym, enum mips_symbol_type type, rtx v0)
3147 {
3148 rtx insn, loc, a0;
3149
3150 a0 = gen_rtx_REG (Pmode, GP_ARG_FIRST);
3151
3152 if (!mips_tls_symbol)
3153 mips_tls_symbol = init_one_libfunc ("__tls_get_addr");
3154
3155 loc = mips_unspec_address (sym, type);
3156
3157 start_sequence ();
3158
3159 emit_insn (gen_rtx_SET (Pmode, a0,
3160 gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, loc)));
3161 insn = mips_expand_call (MIPS_CALL_NORMAL, v0, mips_tls_symbol,
3162 const0_rtx, NULL_RTX, false);
3163 RTL_CONST_CALL_P (insn) = 1;
3164 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), a0);
3165 insn = get_insns ();
3166
3167 end_sequence ();
3168
3169 return insn;
3170 }
3171
3172 /* Return a pseudo register that contains the current thread pointer. */
3173
3174 rtx
3175 mips_expand_thread_pointer (rtx tp)
3176 {
3177 rtx fn;
3178
3179 if (TARGET_MIPS16)
3180 {
3181 if (!mips16_rdhwr_stub)
3182 mips16_rdhwr_stub = new mips16_rdhwr_one_only_stub ();
3183 fn = mips16_stub_call_address (mips16_rdhwr_stub);
3184 emit_insn (PMODE_INSN (gen_tls_get_tp_mips16, (tp, fn)));
3185 }
3186 else
3187 emit_insn (PMODE_INSN (gen_tls_get_tp, (tp)));
3188 return tp;
3189 }
3190
3191 static rtx
3192 mips_get_tp (void)
3193 {
3194 return mips_expand_thread_pointer (gen_reg_rtx (Pmode));
3195 }
3196
3197 /* Generate the code to access LOC, a thread-local SYMBOL_REF, and return
3198 its address. The return value will be both a valid address and a valid
3199 SET_SRC (either a REG or a LO_SUM). */
3200
3201 static rtx
3202 mips_legitimize_tls_address (rtx loc)
3203 {
3204 rtx dest, insn, v0, tp, tmp1, tmp2, eqv, offset;
3205 enum tls_model model;
3206
3207 model = SYMBOL_REF_TLS_MODEL (loc);
3208 /* Only TARGET_ABICALLS code can have more than one module; other
3209 code must be static and should not use a GOT. All TLS models
3210 reduce to local exec in this situation. */
3211 if (!TARGET_ABICALLS)
3212 model = TLS_MODEL_LOCAL_EXEC;
3213
3214 switch (model)
3215 {
3216 case TLS_MODEL_GLOBAL_DYNAMIC:
3217 v0 = gen_rtx_REG (Pmode, GP_RETURN);
3218 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSGD, v0);
3219 dest = gen_reg_rtx (Pmode);
3220 emit_libcall_block (insn, dest, v0, loc);
3221 break;
3222
3223 case TLS_MODEL_LOCAL_DYNAMIC:
3224 v0 = gen_rtx_REG (Pmode, GP_RETURN);
3225 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSLDM, v0);
3226 tmp1 = gen_reg_rtx (Pmode);
3227
3228 /* Attach a unique REG_EQUIV, to allow the RTL optimizers to
3229 share the LDM result with other LD model accesses. */
3230 eqv = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, const0_rtx),
3231 UNSPEC_TLS_LDM);
3232 emit_libcall_block (insn, tmp1, v0, eqv);
3233
3234 offset = mips_unspec_address (loc, SYMBOL_DTPREL);
3235 if (mips_split_p[SYMBOL_DTPREL])
3236 {
3237 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_DTPREL);
3238 dest = gen_rtx_LO_SUM (Pmode, tmp2, offset);
3239 }
3240 else
3241 dest = expand_binop (Pmode, add_optab, tmp1, offset,
3242 0, 0, OPTAB_DIRECT);
3243 break;
3244
3245 case TLS_MODEL_INITIAL_EXEC:
3246 tp = mips_get_tp ();
3247 tmp1 = gen_reg_rtx (Pmode);
3248 tmp2 = mips_unspec_address (loc, SYMBOL_GOTTPREL);
3249 if (Pmode == DImode)
3250 emit_insn (gen_load_gotdi (tmp1, pic_offset_table_rtx, tmp2));
3251 else
3252 emit_insn (gen_load_gotsi (tmp1, pic_offset_table_rtx, tmp2));
3253 dest = gen_reg_rtx (Pmode);
3254 emit_insn (gen_add3_insn (dest, tmp1, tp));
3255 break;
3256
3257 case TLS_MODEL_LOCAL_EXEC:
3258 tmp1 = mips_get_tp ();
3259 offset = mips_unspec_address (loc, SYMBOL_TPREL);
3260 if (mips_split_p[SYMBOL_TPREL])
3261 {
3262 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_TPREL);
3263 dest = gen_rtx_LO_SUM (Pmode, tmp2, offset);
3264 }
3265 else
3266 dest = expand_binop (Pmode, add_optab, tmp1, offset,
3267 0, 0, OPTAB_DIRECT);
3268 break;
3269
3270 default:
3271 gcc_unreachable ();
3272 }
3273 return dest;
3274 }
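
/* For example (illustrative): for the local-exec model with split
   %tprel relocations, the expansion above yields roughly

	rdhwr	$3,$29			# thread pointer (via tls_get_tp)
	lui	$at,%tprel_hi(x)
	addu	$at,$at,$3
	...	%tprel_lo(x)($at)	# the returned LO_SUM

   with the final LO_SUM used directly as an address or SET_SRC.  */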
3275 \f
3276 /* Implement "TARGET = __builtin_mips_get_fcsr ()" for MIPS16,
3277 using a stub. */
3278
3279 void
3280 mips16_expand_get_fcsr (rtx target)
3281 {
3282 if (!mips16_get_fcsr_stub)
3283 mips16_get_fcsr_stub = new mips16_get_fcsr_one_only_stub ();
3284 rtx fn = mips16_stub_call_address (mips16_get_fcsr_stub);
3285 emit_insn (PMODE_INSN (gen_mips_get_fcsr_mips16, (fn)));
3286 emit_move_insn (target, gen_rtx_REG (SImode, GET_FCSR_REGNUM));
3287 }
3288
3289 /* Implement __builtin_mips_set_fcsr (TARGET) for MIPS16, using a stub. */
3290
3291 void
3292 mips16_expand_set_fcsr (rtx newval)
3293 {
3294 if (!mips16_set_fcsr_stub)
3295 mips16_set_fcsr_stub = new mips16_set_fcsr_one_only_stub ();
3296 rtx fn = mips16_stub_call_address (mips16_set_fcsr_stub);
3297 emit_move_insn (gen_rtx_REG (SImode, SET_FCSR_REGNUM), newval);
3298 emit_insn (PMODE_INSN (gen_mips_set_fcsr_mips16, (fn)));
3299 }
3300 \f
3301 /* If X is not a valid address for mode MODE, force it into a register. */
3302
3303 static rtx
3304 mips_force_address (rtx x, enum machine_mode mode)
3305 {
3306 if (!mips_legitimate_address_p (mode, x, false))
3307 x = force_reg (Pmode, x);
3308 return x;
3309 }
3310
3311 /* This function is used to implement LEGITIMIZE_ADDRESS. If X can
3312 be legitimized in a way that the generic machinery might not expect,
3313 return a new address, otherwise return X unchanged. MODE is the
3314 mode of the memory being accessed. */
3315
3316 static rtx
3317 mips_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED,
3318 enum machine_mode mode)
3319 {
3320 rtx base, addr;
3321 HOST_WIDE_INT offset;
3322
3323 if (mips_tls_symbol_p (x))
3324 return mips_legitimize_tls_address (x);
3325
3326 /* See if the address can split into a high part and a LO_SUM. */
3327 if (mips_split_symbol (NULL, x, mode, &addr))
3328 return mips_force_address (addr, mode);
3329
3330 /* Handle BASE + OFFSET using mips_add_offset. */
3331 mips_split_plus (x, &base, &offset);
3332 if (offset != 0)
3333 {
3334 if (!mips_valid_base_register_p (base, mode, false))
3335 base = copy_to_mode_reg (Pmode, base);
3336 addr = mips_add_offset (NULL, base, offset);
3337 return mips_force_address (addr, mode);
3338 }
3339
3340 return x;
3341 }
3342
3343 /* Load VALUE into DEST. TEMP is as for mips_force_temporary. */
3344
3345 void
3346 mips_move_integer (rtx temp, rtx dest, unsigned HOST_WIDE_INT value)
3347 {
3348 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
3349 enum machine_mode mode;
3350 unsigned int i, num_ops;
3351 rtx x;
3352
3353 mode = GET_MODE (dest);
3354 num_ops = mips_build_integer (codes, value);
3355
3356 /* Apply each binary operation to X. Invariant: X is a legitimate
3357 source operand for a SET pattern. */
3358 x = GEN_INT (codes[0].value);
3359 for (i = 1; i < num_ops; i++)
3360 {
3361 if (!can_create_pseudo_p ())
3362 {
3363 emit_insn (gen_rtx_SET (VOIDmode, temp, x));
3364 x = temp;
3365 }
3366 else
3367 x = force_reg (mode, x);
3368 x = gen_rtx_fmt_ee (codes[i].code, mode, x, GEN_INT (codes[i].value));
3369 }
3370
3371 emit_insn (gen_rtx_SET (VOIDmode, dest, x));
3372 }
3373
3374 /* Subroutine of mips_legitimize_move. Move constant SRC into register
3375 DEST given that SRC satisfies immediate_operand but doesn't satisfy
3376 move_operand. */
3377
3378 static void
3379 mips_legitimize_const_move (enum machine_mode mode, rtx dest, rtx src)
3380 {
3381 rtx base, offset;
3382
3383 /* Split moves of big integers into smaller pieces. */
3384 if (splittable_const_int_operand (src, mode))
3385 {
3386 mips_move_integer (dest, dest, INTVAL (src));
3387 return;
3388 }
3389
3390 /* Split moves of symbolic constants into high/low pairs. */
3391 if (mips_split_symbol (dest, src, MAX_MACHINE_MODE, &src))
3392 {
3393 emit_insn (gen_rtx_SET (VOIDmode, dest, src));
3394 return;
3395 }
3396
3397 /* Generate the appropriate access sequences for TLS symbols. */
3398 if (mips_tls_symbol_p (src))
3399 {
3400 mips_emit_move (dest, mips_legitimize_tls_address (src));
3401 return;
3402 }
3403
3404 /* If we have (const (plus symbol offset)), and that expression cannot
3405 be forced into memory, load the symbol first and add in the offset.
3406 In non-MIPS16 mode, prefer to do this even if the constant _can_ be
3407 forced into memory, as it usually produces better code. */
3408 split_const (src, &base, &offset);
3409 if (offset != const0_rtx
3410 && (targetm.cannot_force_const_mem (mode, src)
3411 || (!TARGET_MIPS16 && can_create_pseudo_p ())))
3412 {
3413 base = mips_force_temporary (dest, base);
3414 mips_emit_move (dest, mips_add_offset (NULL, base, INTVAL (offset)));
3415 return;
3416 }
3417
3418 src = force_const_mem (mode, src);
3419
3420 /* When using explicit relocs, constant pool references are sometimes
3421 not legitimate addresses. */
3422 mips_split_symbol (dest, XEXP (src, 0), mode, &XEXP (src, 0));
3423 mips_emit_move (dest, src);
3424 }
3425
3426 /* If (set DEST SRC) is not a valid move instruction, emit an equivalent
3427 sequence that is valid. */
3428
3429 bool
3430 mips_legitimize_move (enum machine_mode mode, rtx dest, rtx src)
3431 {
3432 if (!register_operand (dest, mode) && !reg_or_0_operand (src, mode))
3433 {
3434 mips_emit_move (dest, force_reg (mode, src));
3435 return true;
3436 }
3437
3438 /* We need to deal with constants that would be legitimate
3439 immediate_operands but aren't legitimate move_operands. */
3440 if (CONSTANT_P (src) && !move_operand (src, mode))
3441 {
3442 mips_legitimize_const_move (mode, dest, src);
3443 set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (src));
3444 return true;
3445 }
3446 return false;
3447 }
3448 \f
3449 /* Return true if value X in context CONTEXT is a small-data address
3450 that can be rewritten as a LO_SUM. */
3451
3452 static bool
3453 mips_rewrite_small_data_p (rtx x, enum mips_symbol_context context)
3454 {
3455 enum mips_symbol_type symbol_type;
3456
3457 return (mips_lo_relocs[SYMBOL_GP_RELATIVE]
3458 && !mips_split_p[SYMBOL_GP_RELATIVE]
3459 && mips_symbolic_constant_p (x, context, &symbol_type)
3460 && symbol_type == SYMBOL_GP_RELATIVE);
3461 }
3462
3463 /* A for_each_rtx callback for mips_small_data_pattern_p. DATA is the
3464 containing MEM, or null if none. */
3465
3466 static int
3467 mips_small_data_pattern_1 (rtx *loc, void *data)
3468 {
3469 enum mips_symbol_context context;
3470
3471 /* Ignore things like "g" constraints in asms. We make no particular
3472 guarantee about which symbolic constants are acceptable as asm operands
3473 versus which must be forced into a GPR. */
3474 if (GET_CODE (*loc) == LO_SUM || GET_CODE (*loc) == ASM_OPERANDS)
3475 return -1;
3476
3477 if (MEM_P (*loc))
3478 {
3479 if (for_each_rtx (&XEXP (*loc, 0), mips_small_data_pattern_1, *loc))
3480 return 1;
3481 return -1;
3482 }
3483
3484 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3485 return mips_rewrite_small_data_p (*loc, context);
3486 }
3487
3488 /* Return true if OP refers to small data symbols directly, not through
3489 a LO_SUM. */
3490
3491 bool
3492 mips_small_data_pattern_p (rtx op)
3493 {
3494 return for_each_rtx (&op, mips_small_data_pattern_1, NULL);
3495 }
3496
3497 /* A for_each_rtx callback, used by mips_rewrite_small_data.
3498 DATA is the containing MEM, or null if none. */
3499
3500 static int
3501 mips_rewrite_small_data_1 (rtx *loc, void *data)
3502 {
3503 enum mips_symbol_context context;
3504
3505 if (MEM_P (*loc))
3506 {
3507 for_each_rtx (&XEXP (*loc, 0), mips_rewrite_small_data_1, *loc);
3508 return -1;
3509 }
3510
3511 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3512 if (mips_rewrite_small_data_p (*loc, context))
3513 *loc = gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, *loc);
3514
3515 if (GET_CODE (*loc) == LO_SUM)
3516 return -1;
3517
3518 return 0;
3519 }
3520
3521 /* Rewrite instruction pattern PATTERN so that it refers to small data
3522 using explicit relocations. */
3523
3524 rtx
3525 mips_rewrite_small_data (rtx pattern)
3526 {
3527 pattern = copy_insn (pattern);
3528 for_each_rtx (&pattern, mips_rewrite_small_data_1, NULL);
3529 return pattern;
3530 }
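
/* For example, a reference to a small-data variable "x" is rewritten
   from (mem (symbol_ref "x")) to (mem (lo_sum $28 (symbol_ref "x"))),
   which assembles to a single %gp_rel-relocated load or store.  */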
3531 \f
3532 /* The cost of loading values from the constant pool. It should be
3533 larger than the cost of any constant we want to synthesize inline. */
3534 #define CONSTANT_POOL_COST COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 8)
3535
3536 /* Return the cost of X when used as an operand to the MIPS16 instruction
3537 that implements CODE. Return -1 if there is no such instruction, or if
3538 X is not a valid immediate operand for it. */
3539
3540 static int
3541 mips16_constant_cost (int code, HOST_WIDE_INT x)
3542 {
3543 switch (code)
3544 {
3545 case ASHIFT:
3546 case ASHIFTRT:
3547 case LSHIFTRT:
3548 /* Shifts by between 1 and 8 bits (inclusive) are unextended,
3549 other shifts are extended. The shift patterns truncate the shift
3550 count to the right size, so there are no out-of-range values. */
3551 if (IN_RANGE (x, 1, 8))
3552 return 0;
3553 return COSTS_N_INSNS (1);
3554
3555 case PLUS:
3556 if (IN_RANGE (x, -128, 127))
3557 return 0;
3558 if (SMALL_OPERAND (x))
3559 return COSTS_N_INSNS (1);
3560 return -1;
3561
3562 case LEU:
3563 /* Like LE, but reject the always-true case. */
3564 if (x == -1)
3565 return -1;
3566 case LE:
3567 /* We add 1 to the immediate and use SLT. */
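/* For example, "x <= 100" is implemented as "x < 101", so the
   adjusted immediate is what the range checks below see.  */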
3568 x += 1;
3569 case XOR:
3570 /* We can use CMPI for an xor with an unsigned 16-bit X. */
3571 case LT:
3572 case LTU:
3573 if (IN_RANGE (x, 0, 255))
3574 return 0;
3575 if (SMALL_OPERAND_UNSIGNED (x))
3576 return COSTS_N_INSNS (1);
3577 return -1;
3578
3579 case EQ:
3580 case NE:
3581 /* Equality comparisons with 0 are cheap. */
3582 if (x == 0)
3583 return 0;
3584 return -1;
3585
3586 default:
3587 return -1;
3588 }
3589 }
3590
3591 /* Return true if there is a non-MIPS16 instruction that implements CODE
3592 and if that instruction accepts X as an immediate operand. */
3593
3594 static int
3595 mips_immediate_operand_p (int code, HOST_WIDE_INT x)
3596 {
3597 switch (code)
3598 {
3599 case ASHIFT:
3600 case ASHIFTRT:
3601 case LSHIFTRT:
3602 /* All shift counts are truncated to a valid constant. */
3603 return true;
3604
3605 case ROTATE:
3606 case ROTATERT:
3607 /* Likewise rotates, if the target supports rotates at all. */
3608 return ISA_HAS_ROR;
3609
3610 case AND:
3611 case IOR:
3612 case XOR:
3613 /* These instructions take 16-bit unsigned immediates. */
3614 return SMALL_OPERAND_UNSIGNED (x);
3615
3616 case PLUS:
3617 case LT:
3618 case LTU:
3619 /* These instructions take 16-bit signed immediates. */
3620 return SMALL_OPERAND (x);
3621
3622 case EQ:
3623 case NE:
3624 case GT:
3625 case GTU:
3626 /* The "immediate" forms of these instructions are really
3627 implemented as comparisons with register 0. */
3628 return x == 0;
3629
3630 case GE:
3631 case GEU:
3632 /* Likewise, meaning that the only valid immediate operand is 1. */
3633 return x == 1;
3634
3635 case LE:
3636 /* We add 1 to the immediate and use SLT. */
3637 return SMALL_OPERAND (x + 1);
3638
3639 case LEU:
3640 /* Likewise SLTU, but reject the always-true case. */
3641 return SMALL_OPERAND (x + 1) && x + 1 != 0;
3642
3643 case SIGN_EXTRACT:
3644 case ZERO_EXTRACT:
3645 /* The bit position and size are immediate operands. */
3646 return ISA_HAS_EXT_INS;
3647
3648 default:
3649 /* By default assume that $0 can be used for 0. */
3650 return x == 0;
3651 }
3652 }
3653
3654 /* Return the cost of binary operation X, given that the instruction
3655 sequence for a word-sized or smaller operation has cost SINGLE_COST
3656 and that the sequence of a double-word operation has cost DOUBLE_COST.
3657 If SPEED is true, optimize for speed, otherwise optimize for size. */
3658
3659 static int
3660 mips_binary_cost (rtx x, int single_cost, int double_cost, bool speed)
3661 {
3662 int cost;
3663
3664 if (GET_MODE_SIZE (GET_MODE (x)) == UNITS_PER_WORD * 2)
3665 cost = double_cost;
3666 else
3667 cost = single_cost;
3668 return (cost
3669 + set_src_cost (XEXP (x, 0), speed)
3670 + rtx_cost (XEXP (x, 1), GET_CODE (x), 1, speed));
3671 }
3672
3673 /* Return the cost of floating-point multiplications of mode MODE. */
3674
3675 static int
3676 mips_fp_mult_cost (enum machine_mode mode)
3677 {
3678 return mode == DFmode ? mips_cost->fp_mult_df : mips_cost->fp_mult_sf;
3679 }
3680
3681 /* Return the cost of floating-point divisions of mode MODE. */
3682
3683 static int
3684 mips_fp_div_cost (enum machine_mode mode)
3685 {
3686 return mode == DFmode ? mips_cost->fp_div_df : mips_cost->fp_div_sf;
3687 }
3688
3689 /* Return the cost of sign-extending OP to mode MODE, not including the
3690 cost of OP itself. */
3691
3692 static int
3693 mips_sign_extend_cost (enum machine_mode mode, rtx op)
3694 {
3695 if (MEM_P (op))
3696 /* Extended loads are as cheap as unextended ones. */
3697 return 0;
3698
3699 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3700 /* A sign extension from SImode to DImode in 64-bit mode is free. */
3701 return 0;
3702
3703 if (ISA_HAS_SEB_SEH || GENERATE_MIPS16E)
3704 /* We can use SEB or SEH. */
3705 return COSTS_N_INSNS (1);
3706
3707 /* We need to use a shift left and a shift right. */
3708 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3709 }
3710
3711 /* Return the cost of zero-extending OP to mode MODE, not including the
3712 cost of OP itself. */
3713
3714 static int
3715 mips_zero_extend_cost (enum machine_mode mode, rtx op)
3716 {
3717 if (MEM_P (op))
3718 /* Extended loads are as cheap as unextended ones. */
3719 return 0;
3720
3721 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3722 /* We need a shift left by 32 bits and a shift right by 32 bits. */
3723 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3724
3725 if (GENERATE_MIPS16E)
3726 /* We can use ZEB or ZEH. */
3727 return COSTS_N_INSNS (1);
3728
3729 if (TARGET_MIPS16)
3730 /* We need to load 0xff or 0xffff into a register and use AND. */
3731 return COSTS_N_INSNS (GET_MODE (op) == QImode ? 2 : 3);
3732
3733 /* We can use ANDI. */
3734 return COSTS_N_INSNS (1);
3735 }
3736
3737 /* Return the cost of moving between two registers of mode MODE,
3738 assuming that the move will be in pieces of at most UNITS bytes. */
3739
3740 static int
3741 mips_set_reg_reg_piece_cost (enum machine_mode mode, unsigned int units)
3742 {
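/* Ceiling division: e.g. a 16-byte value moved in 8-byte pieces
   costs COSTS_N_INSNS (2).  */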
3743 return COSTS_N_INSNS ((GET_MODE_SIZE (mode) + units - 1) / units);
3744 }
3745
3746 /* Return the cost of moving between two registers of mode MODE. */
3747
3748 static int
3749 mips_set_reg_reg_cost (enum machine_mode mode)
3750 {
3751 switch (GET_MODE_CLASS (mode))
3752 {
3753 case MODE_CC:
3754 return mips_set_reg_reg_piece_cost (mode, GET_MODE_SIZE (CCmode));
3755
3756 case MODE_FLOAT:
3757 case MODE_COMPLEX_FLOAT:
3758 case MODE_VECTOR_FLOAT:
3759 if (TARGET_HARD_FLOAT)
3760 return mips_set_reg_reg_piece_cost (mode, UNITS_PER_HWFPVALUE);
3761 /* Fall through. */
3762
3763 default:
3764 return mips_set_reg_reg_piece_cost (mode, UNITS_PER_WORD);
3765 }
3766 }
3767
3768 /* Implement TARGET_RTX_COSTS. */
3769
3770 static bool
3771 mips_rtx_costs (rtx x, int code, int outer_code, int opno ATTRIBUTE_UNUSED,
3772 int *total, bool speed)
3773 {
3774 enum machine_mode mode = GET_MODE (x);
3775 bool float_mode_p = FLOAT_MODE_P (mode);
3776 int cost;
3777 rtx addr;
3778
3779 /* The cost of a COMPARE is hard to define for MIPS. COMPAREs don't
3780 appear in the instruction stream, and the cost of a comparison is
3781 really the cost of the branch or scc condition. At the time of
3782 writing, GCC only uses an explicit outer COMPARE code when optabs
3783 is testing whether a constant is expensive enough to force into a
3784 register. We want optabs to pass such constants through the MIPS
3785 expanders instead, so make all constants very cheap here. */
3786 if (outer_code == COMPARE)
3787 {
3788 gcc_assert (CONSTANT_P (x));
3789 *total = 0;
3790 return true;
3791 }
3792
3793 switch (code)
3794 {
3795 case CONST_INT:
3796 /* Treat *clear_upper32-style ANDs as having zero cost in the
3797 second operand. The cost is entirely in the first operand.
3798
3799 ??? This is needed because we would otherwise try to CSE
3800 the constant operand. Although that's the right thing for
3801 instructions that continue to be a register operation throughout
3802 compilation, it is disastrous for instructions that could
3803 later be converted into a memory operation. */
3804 if (TARGET_64BIT
3805 && outer_code == AND
3806 && UINTVAL (x) == 0xffffffff)
3807 {
3808 *total = 0;
3809 return true;
3810 }
3811
3812 if (TARGET_MIPS16)
3813 {
3814 cost = mips16_constant_cost (outer_code, INTVAL (x));
3815 if (cost >= 0)
3816 {
3817 *total = cost;
3818 return true;
3819 }
3820 }
3821 else
3822 {
3823 /* When not optimizing for size, we care more about the cost
3824 of hot code, and hot code is often in a loop. If a constant
3825 operand needs to be forced into a register, we will often be
3826 able to hoist the constant load out of the loop, so the load
3827 should not contribute to the cost. */
3828 if (speed || mips_immediate_operand_p (outer_code, INTVAL (x)))
3829 {
3830 *total = 0;
3831 return true;
3832 }
3833 }
3834 /* Fall through. */
3835
3836 case CONST:
3837 case SYMBOL_REF:
3838 case LABEL_REF:
3839 case CONST_DOUBLE:
3840 if (force_to_mem_operand (x, VOIDmode))
3841 {
3842 *total = COSTS_N_INSNS (1);
3843 return true;
3844 }
3845 cost = mips_const_insns (x);
3846 if (cost > 0)
3847 {
3848 /* If the constant is likely to be stored in a GPR, SETs of
3849 single-insn constants are as cheap as register sets; we
3850 never want to CSE them.
3851
3852 Don't reduce the cost of storing a floating-point zero in
3853 FPRs. If we have a zero in an FPR for other reasons, we
3854 can get better cfg-cleanup and delayed-branch results by
3855 using it consistently, rather than using $0 sometimes and
3856 an FPR at other times. Also, moves between floating-point
3857 registers are sometimes cheaper than (D)MTC1 $0. */
3858 if (cost == 1
3859 && outer_code == SET
3860 && !(float_mode_p && TARGET_HARD_FLOAT))
3861 cost = 0;
3862 /* When non-MIPS16 code loads a constant N>1 times, we rarely
3863 want to CSE the constant itself. It is usually better to
3864 have N copies of the last operation in the sequence and one
3865 shared copy of the other operations. (Note that this is
3866 not true for MIPS16 code, where the final operation in the
3867 sequence is often an extended instruction.)
3868
3869 Also, if we have a CONST_INT, we don't know whether it is
3870 for a word or doubleword operation, so we cannot rely on
3871 the result of mips_build_integer. */
3872 else if (!TARGET_MIPS16
3873 && (outer_code == SET || mode == VOIDmode))
3874 cost = 1;
3875 *total = COSTS_N_INSNS (cost);
3876 return true;
3877 }
3878 /* The value will need to be fetched from the constant pool. */
3879 *total = CONSTANT_POOL_COST;
3880 return true;
3881
3882 case MEM:
3883 /* If the address is legitimate, return the number of
3884 instructions it needs. */
3885 addr = XEXP (x, 0);
3886 cost = mips_address_insns (addr, mode, true);
3887 if (cost > 0)
3888 {
3889 *total = COSTS_N_INSNS (cost + 1);
3890 return true;
3891 }
3892 /* Check for a scaled indexed address. */
3893 if (mips_lwxs_address_p (addr)
3894 || mips_lx_address_p (addr, mode))
3895 {
3896 *total = COSTS_N_INSNS (2);
3897 return true;
3898 }
3899 /* Otherwise use the default handling. */
3900 return false;
3901
3902 case FFS:
3903 *total = COSTS_N_INSNS (6);
3904 return false;
3905
3906 case NOT:
3907 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 2 : 1);
3908 return false;
3909
3910 case AND:
3911 /* Check for a *clear_upper32 pattern and treat it like a zero
3912 extension. See the pattern's comment for details. */
3913 if (TARGET_64BIT
3914 && mode == DImode
3915 && CONST_INT_P (XEXP (x, 1))
3916 && UINTVAL (XEXP (x, 1)) == 0xffffffff)
3917 {
3918 *total = (mips_zero_extend_cost (mode, XEXP (x, 0))
3919 + set_src_cost (XEXP (x, 0), speed));
3920 return true;
3921 }
3922 if (ISA_HAS_CINS && CONST_INT_P (XEXP (x, 1)))
3923 {
3924 rtx op = XEXP (x, 0);
3925 if (GET_CODE (op) == ASHIFT
3926 && CONST_INT_P (XEXP (op, 1))
3927 && mask_low_and_shift_p (mode, XEXP (x, 1), XEXP (op, 1), 32))
3928 {
3929 *total = COSTS_N_INSNS (1) + set_src_cost (XEXP (op, 0), speed);
3930 return true;
3931 }
3932 }
3933 /* (AND (NOT op0) (NOT op1)) is a nor operation that can be done in
3934 a single instruction. */
3935 if (!TARGET_MIPS16
3936 && GET_CODE (XEXP (x, 0)) == NOT
3937 && GET_CODE (XEXP (x, 1)) == NOT)
3938 {
3939 cost = GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 2 : 1;
3940 *total = (COSTS_N_INSNS (cost)
3941 + set_src_cost (XEXP (XEXP (x, 0), 0), speed)
3942 + set_src_cost (XEXP (XEXP (x, 1), 0), speed));
3943 return true;
3944 }
3945
3946 /* Fall through. */
3947
3948 case IOR:
3949 case XOR:
3950 /* Double-word operations use two single-word operations. */
3951 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (2),
3952 speed);
3953 return true;
3954
3955 case ASHIFT:
3956 case ASHIFTRT:
3957 case LSHIFTRT:
3958 case ROTATE:
3959 case ROTATERT:
3960 if (CONSTANT_P (XEXP (x, 1)))
3961 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4),
3962 speed);
3963 else
3964 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (12),
3965 speed);
3966 return true;
3967
3968 case ABS:
3969 if (float_mode_p)
3970 *total = mips_cost->fp_add;
3971 else
3972 *total = COSTS_N_INSNS (4);
3973 return false;
3974
3975 case LO_SUM:
3976 /* Low-part immediates need an extended MIPS16 instruction. */
3977 *total = (COSTS_N_INSNS (TARGET_MIPS16 ? 2 : 1)
3978 + set_src_cost (XEXP (x, 0), speed));
3979 return true;
3980
3981 case LT:
3982 case LTU:
3983 case LE:
3984 case LEU:
3985 case GT:
3986 case GTU:
3987 case GE:
3988 case GEU:
3989 case EQ:
3990 case NE:
3991 case UNORDERED:
3992 case LTGT:
3993 /* Branch comparisons have VOIDmode, so use the first operand's
3994 mode instead. */
3995 mode = GET_MODE (XEXP (x, 0));
3996 if (FLOAT_MODE_P (mode))
3997 {
3998 *total = mips_cost->fp_add;
3999 return false;
4000 }
4001 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4),
4002 speed);
4003 return true;
4004
4005 case MINUS:
4006 if (float_mode_p
4007 && (ISA_HAS_NMADD4_NMSUB4 || ISA_HAS_NMADD3_NMSUB3)
4008 && TARGET_FUSED_MADD
4009 && !HONOR_NANS (mode)
4010 && !HONOR_SIGNED_ZEROS (mode))
4011 {
4012 /* See if we can use NMADD or NMSUB. See mips.md for the
4013 associated patterns. */
4014 rtx op0 = XEXP (x, 0);
4015 rtx op1 = XEXP (x, 1);
4016 if (GET_CODE (op0) == MULT && GET_CODE (XEXP (op0, 0)) == NEG)
4017 {
4018 *total = (mips_fp_mult_cost (mode)
4019 + set_src_cost (XEXP (XEXP (op0, 0), 0), speed)
4020 + set_src_cost (XEXP (op0, 1), speed)
4021 + set_src_cost (op1, speed));
4022 return true;
4023 }
4024 if (GET_CODE (op1) == MULT)
4025 {
4026 *total = (mips_fp_mult_cost (mode)
4027 + set_src_cost (op0, speed)
4028 + set_src_cost (XEXP (op1, 0), speed)
4029 + set_src_cost (XEXP (op1, 1), speed));
4030 return true;
4031 }
4032 }
4033 /* Fall through. */
4034
4035 case PLUS:
4036 if (float_mode_p)
4037 {
4038 /* If this is part of a MADD or MSUB, treat the PLUS as
4039 being free. */
4040 if ((ISA_HAS_FP_MADD4_MSUB4 || ISA_HAS_FP_MADD3_MSUB3)
4041 && TARGET_FUSED_MADD
4042 && GET_CODE (XEXP (x, 0)) == MULT)
4043 *total = 0;
4044 else
4045 *total = mips_cost->fp_add;
4046 return false;
4047 }
4048
4049 /* Double-word operations require three single-word operations and
4050 an SLTU. The MIPS16 version then needs to move the result of
4051 the SLTU from $24 to a MIPS16 register. */
4052 *total = mips_binary_cost (x, COSTS_N_INSNS (1),
4053 COSTS_N_INSNS (TARGET_MIPS16 ? 5 : 4),
4054 speed);
4055 return true;
4056
4057 case NEG:
4058 if (float_mode_p
4059 && (ISA_HAS_NMADD4_NMSUB4 || ISA_HAS_NMADD3_NMSUB3)
4060 && TARGET_FUSED_MADD
4061 && !HONOR_NANS (mode)
4062 && !HONOR_SIGNED_ZEROS (mode))
4063 {
4064 /* See if we can use NMADD or NMSUB. See mips.md for the
4065 associated patterns. */
4066 rtx op = XEXP (x, 0);
4067 if ((GET_CODE (op) == PLUS || GET_CODE (op) == MINUS)
4068 && GET_CODE (XEXP (op, 0)) == MULT)
4069 {
4070 *total = (mips_fp_mult_cost (mode)
4071 + set_src_cost (XEXP (XEXP (op, 0), 0), speed)
4072 + set_src_cost (XEXP (XEXP (op, 0), 1), speed)
4073 + set_src_cost (XEXP (op, 1), speed));
4074 return true;
4075 }
4076 }
4077
4078 if (float_mode_p)
4079 *total = mips_cost->fp_add;
4080 else
4081 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 4 : 1);
4082 return false;
4083
4084 case MULT:
4085 if (float_mode_p)
4086 *total = mips_fp_mult_cost (mode);
4087 else if (mode == DImode && !TARGET_64BIT)
4088 /* Synthesized from 2 mulsi3s, 1 mulsidi3 and two additions,
4089 where the mulsidi3 always includes an MFHI and an MFLO. */
4090 *total = (speed
4091 ? mips_cost->int_mult_si * 3 + 6
4092 : COSTS_N_INSNS (ISA_HAS_MUL3 ? 7 : 9));
4093 else if (!speed)
4094 *total = COSTS_N_INSNS (ISA_HAS_MUL3 ? 1 : 2) + 1;
4095 else if (mode == DImode)
4096 *total = mips_cost->int_mult_di;
4097 else
4098 *total = mips_cost->int_mult_si;
4099 return false;
4100
4101 case DIV:
4102 /* Check for a reciprocal. */
4103 if (float_mode_p
4104 && ISA_HAS_FP_RECIP_RSQRT (mode)
4105 && flag_unsafe_math_optimizations
4106 && XEXP (x, 0) == CONST1_RTX (mode))
4107 {
4108 if (outer_code == SQRT || GET_CODE (XEXP (x, 1)) == SQRT)
4109 /* An rsqrt<mode>a or rsqrt<mode>b pattern. Count the
4110 division as being free. */
4111 *total = set_src_cost (XEXP (x, 1), speed);
4112 else
4113 *total = (mips_fp_div_cost (mode)
4114 + set_src_cost (XEXP (x, 1), speed));
4115 return true;
4116 }
4117 /* Fall through. */
4118
4119 case SQRT:
4120 case MOD:
4121 if (float_mode_p)
4122 {
4123 *total = mips_fp_div_cost (mode);
4124 return false;
4125 }
4126 /* Fall through. */
4127
4128 case UDIV:
4129 case UMOD:
4130 if (!speed)
4131 {
4132 /* It is our responsibility to make division by a power of 2
4133 as cheap as 2 register additions if we want the division
4134 expanders to be used for such operations; see the setting
4135 of sdiv_pow2_cheap in optabs.c. Using (D)DIV for MIPS16
4136 should always produce shorter code than using
4137 expand_sdiv2_pow2. */
4138 if (TARGET_MIPS16
4139 && CONST_INT_P (XEXP (x, 1))
4140 && exact_log2 (INTVAL (XEXP (x, 1))) >= 0)
4141 {
4142 *total = COSTS_N_INSNS (2) + set_src_cost (XEXP (x, 0), speed);
4143 return true;
4144 }
4145 *total = COSTS_N_INSNS (mips_idiv_insns ());
4146 }
4147 else if (mode == DImode)
4148 *total = mips_cost->int_div_di;
4149 else
4150 *total = mips_cost->int_div_si;
4151 return false;
4152
4153 case SIGN_EXTEND:
4154 *total = mips_sign_extend_cost (mode, XEXP (x, 0));
4155 return false;
4156
4157 case ZERO_EXTEND:
4158 if (outer_code == SET
4159 && ISA_HAS_BADDU
4160 && (GET_CODE (XEXP (x, 0)) == TRUNCATE
4161 || GET_CODE (XEXP (x, 0)) == SUBREG)
4162 && GET_MODE (XEXP (x, 0)) == QImode
4163 && GET_CODE (XEXP (XEXP (x, 0), 0)) == PLUS)
4164 {
4165 *total = set_src_cost (XEXP (XEXP (x, 0), 0), speed);
4166 return true;
4167 }
4168 *total = mips_zero_extend_cost (mode, XEXP (x, 0));
4169 return false;
4170
4171 case FLOAT:
4172 case UNSIGNED_FLOAT:
4173 case FIX:
4174 case FLOAT_EXTEND:
4175 case FLOAT_TRUNCATE:
4176 *total = mips_cost->fp_add;
4177 return false;
4178
4179 case SET:
4180 if (register_operand (SET_DEST (x), VOIDmode)
4181 && reg_or_0_operand (SET_SRC (x), VOIDmode))
4182 {
4183 *total = mips_set_reg_reg_cost (GET_MODE (SET_DEST (x)));
4184 return true;
4185 }
4186 return false;
4187
4188 default:
4189 return false;
4190 }
4191 }
4192
4193 /* Implement TARGET_ADDRESS_COST. */
4194
4195 static int
4196 mips_address_cost (rtx addr, enum machine_mode mode,
4197 addr_space_t as ATTRIBUTE_UNUSED,
4198 bool speed ATTRIBUTE_UNUSED)
4199 {
4200 return mips_address_insns (addr, mode, false);
4201 }
4202 \f
4203 /* Information about a single instruction in a multi-instruction
4204 asm sequence. */
4205 struct mips_multi_member {
4206 /* True if this is a label, false if it is code. */
4207 bool is_label_p;
4208
4209 /* The output_asm_insn format of the instruction. */
4210 const char *format;
4211
4212 /* The operands to the instruction. */
4213 rtx operands[MAX_RECOG_OPERANDS];
4214 };
4215 typedef struct mips_multi_member mips_multi_member;
4216
4217 /* The instructions that make up the current multi-insn sequence. */
4218 static vec<mips_multi_member> mips_multi_members;
4219
4220 /* How many instructions (as opposed to labels) are in the current
4221 multi-insn sequence. */
4222 static unsigned int mips_multi_num_insns;
4223
4224 /* Start a new multi-insn sequence. */
4225
4226 static void
4227 mips_multi_start (void)
4228 {
4229 mips_multi_members.truncate (0);
4230 mips_multi_num_insns = 0;
4231 }
4232
4233 /* Add a new, uninitialized member to the current multi-insn sequence. */
4234
4235 static struct mips_multi_member *
4236 mips_multi_add (void)
4237 {
4238 mips_multi_member empty;
4239 return mips_multi_members.safe_push (empty);
4240 }
4241
4242 /* Add a normal insn with the given asm format to the current multi-insn
4243 sequence. The other arguments are a null-terminated list of operands. */
4244
4245 static void
4246 mips_multi_add_insn (const char *format, ...)
4247 {
4248 struct mips_multi_member *member;
4249 va_list ap;
4250 unsigned int i;
4251 rtx op;
4252
4253 member = mips_multi_add ();
4254 member->is_label_p = false;
4255 member->format = format;
4256 va_start (ap, format);
4257 i = 0;
4258 while ((op = va_arg (ap, rtx)))
4259 member->operands[i++] = op;
4260 va_end (ap);
4261 mips_multi_num_insns++;
4262 }
4263
4264 /* Add the given label definition to the current multi-insn sequence.
4265 The definition should include the colon. */
4266
4267 static void
4268 mips_multi_add_label (const char *label)
4269 {
4270 struct mips_multi_member *member;
4271
4272 member = mips_multi_add ();
4273 member->is_label_p = true;
4274 member->format = label;
4275 }
4276
4277 /* Return the index of the last member of the current multi-insn sequence. */
4278
4279 static unsigned int
4280 mips_multi_last_index (void)
4281 {
4282 return mips_multi_members.length () - 1;
4283 }
4284
4285 /* Add a copy of an existing instruction to the current multi-insn
4286 sequence. I is the index of the instruction that should be copied. */
4287
4288 static void
4289 mips_multi_copy_insn (unsigned int i)
4290 {
4291 struct mips_multi_member *member;
4292
4293 member = mips_multi_add ();
4294 memcpy (member, &mips_multi_members[i], sizeof (*member));
4295 gcc_assert (!member->is_label_p);
4296 }
4297
4298 /* Change the operand of an existing instruction in the current
4299 multi-insn sequence. I is the index of the instruction,
4300 OP is the index of the operand, and X is the new value. */
4301
4302 static void
4303 mips_multi_set_operand (unsigned int i, unsigned int op, rtx x)
4304 {
4305 mips_multi_members[i].operands[op] = x;
4306 }
4307
4308 /* Write out the asm code for the current multi-insn sequence. */
4309
4310 static void
4311 mips_multi_write (void)
4312 {
4313 struct mips_multi_member *member;
4314 unsigned int i;
4315
4316 FOR_EACH_VEC_ELT (mips_multi_members, i, member)
4317 if (member->is_label_p)
4318 fprintf (asm_out_file, "%s\n", member->format);
4319 else
4320 output_asm_insn (member->format, member->operands);
4321 }
4322 \f
4323 /* Return one word of double-word value OP, taking into account the fixed
4324 endianness of certain registers. HIGH_P is true to select the high part,
4325 false to select the low part. */
4326
4327 rtx
4328 mips_subword (rtx op, bool high_p)
4329 {
4330 unsigned int byte, offset;
4331 enum machine_mode mode;
4332
4333 mode = GET_MODE (op);
4334 if (mode == VOIDmode)
4335 mode = TARGET_64BIT ? TImode : DImode;
4336
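/* For example, on a big-endian 32-bit target the high word of a
   doubleword value is at byte offset 0, so HIGH_P selects byte 0
   there and byte UNITS_PER_WORD on a little-endian target.  */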
4337 if (TARGET_BIG_ENDIAN ? !high_p : high_p)
4338 byte = UNITS_PER_WORD;
4339 else
4340 byte = 0;
4341
4342 if (FP_REG_RTX_P (op))
4343 {
4344 /* Paired FPRs are always ordered little-endian. */
4345 offset = (UNITS_PER_WORD < UNITS_PER_HWFPVALUE ? high_p : byte != 0);
4346 return gen_rtx_REG (word_mode, REGNO (op) + offset);
4347 }
4348
4349 if (MEM_P (op))
4350 return mips_rewrite_small_data (adjust_address (op, word_mode, byte));
4351
4352 return simplify_gen_subreg (word_mode, op, mode, byte);
4353 }
4354
4355 /* Return true if SRC should be moved into DEST using "MULT $0, $0".
4356 SPLIT_TYPE is the condition under which moves should be split. */
4357
4358 static bool
4359 mips_mult_move_p (rtx dest, rtx src, enum mips_split_type split_type)
4360 {
4361 return ((split_type != SPLIT_FOR_SPEED
4362 || mips_tuning_info.fast_mult_zero_zero_p)
4363 && src == const0_rtx
4364 && REG_P (dest)
4365 && GET_MODE_SIZE (GET_MODE (dest)) == 2 * UNITS_PER_WORD
4366 && (ISA_HAS_DSP_MULT
4367 ? ACC_REG_P (REGNO (dest))
4368 : MD_REG_P (REGNO (dest))));
4369 }
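
/* Such a move zeroes the whole HI/LO or DSP accumulator pair in one
   instruction; see the "mult\t%.,%." templates in mips_output_move
   below.  */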
4370
4371 /* Return true if a move from SRC to DEST should be split into two.
4372 SPLIT_TYPE describes the split condition. */
4373
4374 bool
4375 mips_split_move_p (rtx dest, rtx src, enum mips_split_type split_type)
4376 {
4377 /* Check whether the move can be done using some variant of MULT $0,$0. */
4378 if (mips_mult_move_p (dest, src, split_type))
4379 return false;
4380
4381 /* FPR-to-FPR moves can be done in a single instruction, if they're
4382 allowed at all. */
4383 unsigned int size = GET_MODE_SIZE (GET_MODE (dest));
4384 if (size == 8 && FP_REG_RTX_P (src) && FP_REG_RTX_P (dest))
4385 return false;
4386
4387 /* Check for floating-point loads and stores. */
4388 if (size == 8 && ISA_HAS_LDC1_SDC1)
4389 {
4390 if (FP_REG_RTX_P (dest) && MEM_P (src))
4391 return false;
4392 if (FP_REG_RTX_P (src) && MEM_P (dest))
4393 return false;
4394 }
4395
4396 /* Otherwise split all multiword moves. */
4397 return size > UNITS_PER_WORD;
4398 }
4399
4400 /* Split a move from SRC to DEST, given that mips_split_move_p holds.
4401 SPLIT_TYPE describes the split condition. */
4402
4403 void
4404 mips_split_move (rtx dest, rtx src, enum mips_split_type split_type)
4405 {
4406 rtx low_dest;
4407
4408 gcc_checking_assert (mips_split_move_p (dest, src, split_type));
4409 if (FP_REG_RTX_P (dest) || FP_REG_RTX_P (src))
4410 {
4411 if (!TARGET_64BIT && GET_MODE (dest) == DImode)
4412 emit_insn (gen_move_doubleword_fprdi (dest, src));
4413 else if (!TARGET_64BIT && GET_MODE (dest) == DFmode)
4414 emit_insn (gen_move_doubleword_fprdf (dest, src));
4415 else if (!TARGET_64BIT && GET_MODE (dest) == V2SFmode)
4416 emit_insn (gen_move_doubleword_fprv2sf (dest, src));
4417 else if (!TARGET_64BIT && GET_MODE (dest) == V2SImode)
4418 emit_insn (gen_move_doubleword_fprv2si (dest, src));
4419 else if (!TARGET_64BIT && GET_MODE (dest) == V4HImode)
4420 emit_insn (gen_move_doubleword_fprv4hi (dest, src));
4421 else if (!TARGET_64BIT && GET_MODE (dest) == V8QImode)
4422 emit_insn (gen_move_doubleword_fprv8qi (dest, src));
4423 else if (TARGET_64BIT && GET_MODE (dest) == TFmode)
4424 emit_insn (gen_move_doubleword_fprtf (dest, src));
4425 else
4426 gcc_unreachable ();
4427 }
4428 else if (REG_P (dest) && REGNO (dest) == MD_REG_FIRST)
4429 {
4430 low_dest = mips_subword (dest, false);
4431 mips_emit_move (low_dest, mips_subword (src, false));
4432 if (TARGET_64BIT)
4433 emit_insn (gen_mthidi_ti (dest, mips_subword (src, true), low_dest));
4434 else
4435 emit_insn (gen_mthisi_di (dest, mips_subword (src, true), low_dest));
4436 }
4437 else if (REG_P (src) && REGNO (src) == MD_REG_FIRST)
4438 {
4439 mips_emit_move (mips_subword (dest, false), mips_subword (src, false));
4440 if (TARGET_64BIT)
4441 emit_insn (gen_mfhidi_ti (mips_subword (dest, true), src));
4442 else
4443 emit_insn (gen_mfhisi_di (mips_subword (dest, true), src));
4444 }
4445 else
4446 {
4447 /* The operation can be split into two normal moves. Decide in
4448 which order to do them. */
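/* If the low half of DEST is also one of SRC's registers, moving
   the low part first would clobber SRC before its high part had
   been read, so the high part must be moved first.  */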
4449 low_dest = mips_subword (dest, false);
4450 if (REG_P (low_dest)
4451 && reg_overlap_mentioned_p (low_dest, src))
4452 {
4453 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
4454 mips_emit_move (low_dest, mips_subword (src, false));
4455 }
4456 else
4457 {
4458 mips_emit_move (low_dest, mips_subword (src, false));
4459 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
4460 }
4461 }
4462 }
4463
4464 /* Return the split type for instruction INSN. */
4465
4466 static enum mips_split_type
4467 mips_insn_split_type (rtx insn)
4468 {
4469 basic_block bb = BLOCK_FOR_INSN (insn);
4470 if (bb)
4471 {
4472 if (optimize_bb_for_speed_p (bb))
4473 return SPLIT_FOR_SPEED;
4474 else
4475 return SPLIT_FOR_SIZE;
4476 }
4477 /* Once CFG information has been removed, we should trust the optimization
4478 decisions made by previous passes and only split where necessary. */
4479 return SPLIT_IF_NECESSARY;
4480 }
4481
4482 /* Return true if a move from SRC to DEST in INSN should be split. */
4483
4484 bool
4485 mips_split_move_insn_p (rtx dest, rtx src, rtx insn)
4486 {
4487 return mips_split_move_p (dest, src, mips_insn_split_type (insn));
4488 }
4489
4490 /* Split a move from SRC to DEST in INSN, given that mips_split_move_insn_p
4491 holds. */
4492
4493 void
4494 mips_split_move_insn (rtx dest, rtx src, rtx insn)
4495 {
4496 mips_split_move (dest, src, mips_insn_split_type (insn));
4497 }
4498 \f
4499 /* Return the appropriate instructions to move SRC into DEST. Assume
4500 that SRC is operand 1 and DEST is operand 0. */
4501
4502 const char *
4503 mips_output_move (rtx dest, rtx src)
4504 {
4505 enum rtx_code dest_code, src_code;
4506 enum machine_mode mode;
4507 enum mips_symbol_type symbol_type;
4508 bool dbl_p;
4509
4510 dest_code = GET_CODE (dest);
4511 src_code = GET_CODE (src);
4512 mode = GET_MODE (dest);
4513 dbl_p = (GET_MODE_SIZE (mode) == 8);
4514
4515 if (mips_split_move_p (dest, src, SPLIT_IF_NECESSARY))
4516 return "#";
4517
4518 if ((src_code == REG && GP_REG_P (REGNO (src)))
4519 || (!TARGET_MIPS16 && src == CONST0_RTX (mode)))
4520 {
4521 if (dest_code == REG)
4522 {
4523 if (GP_REG_P (REGNO (dest)))
4524 return "move\t%0,%z1";
4525
4526 if (mips_mult_move_p (dest, src, SPLIT_IF_NECESSARY))
4527 {
4528 if (ISA_HAS_DSP_MULT)
4529 return "mult\t%q0,%.,%.";
4530 else
4531 return "mult\t%.,%.";
4532 }
4533
4534 /* Moves to HI are handled by special .md insns. */
4535 if (REGNO (dest) == LO_REGNUM)
4536 return "mtlo\t%z1";
4537
4538 if (DSP_ACC_REG_P (REGNO (dest)))
4539 {
4540 static char retval[] = "mt__\t%z1,%q0";
4541
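/* Patch the "hi"/"lo" suffix in from the register name;
   e.g. a move to $ac1hi becomes "mthi\t%z1,%q0".  */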
4542 retval[2] = reg_names[REGNO (dest)][4];
4543 retval[3] = reg_names[REGNO (dest)][5];
4544 return retval;
4545 }
4546
4547 if (FP_REG_P (REGNO (dest)))
4548 return dbl_p ? "dmtc1\t%z1,%0" : "mtc1\t%z1,%0";
4549
4550 if (ALL_COP_REG_P (REGNO (dest)))
4551 {
4552 static char retval[] = "dmtc_\t%z1,%0";
4553
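/* Dropping the leading 'd' turns "dmtcN" into "mtcN" for
   single-word moves.  */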
4554 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
4555 return dbl_p ? retval : retval + 1;
4556 }
4557 }
4558 if (dest_code == MEM)
4559 switch (GET_MODE_SIZE (mode))
4560 {
4561 case 1: return "sb\t%z1,%0";
4562 case 2: return "sh\t%z1,%0";
4563 case 4: return "sw\t%z1,%0";
4564 case 8: return "sd\t%z1,%0";
4565 }
4566 }
4567 if (dest_code == REG && GP_REG_P (REGNO (dest)))
4568 {
4569 if (src_code == REG)
4570 {
4571 /* Moves from HI are handled by special .md insns. */
4572 if (REGNO (src) == LO_REGNUM)
4573 {
4574 /* When generating VR4120 or VR4130 code, we use MACC and
4575 DMACC instead of MFLO. This avoids both the normal
4576 MIPS III HI/LO hazards and the errata related to
4577 -mfix-vr4130. */
4578 if (ISA_HAS_MACCHI)
4579 return dbl_p ? "dmacc\t%0,%.,%." : "macc\t%0,%.,%.";
4580 return "mflo\t%0";
4581 }
4582
4583 if (DSP_ACC_REG_P (REGNO (src)))
4584 {
4585 static char retval[] = "mf__\t%0,%q1";
4586
4587 retval[2] = reg_names[REGNO (src)][4];
4588 retval[3] = reg_names[REGNO (src)][5];
4589 return retval;
4590 }
4591
4592 if (FP_REG_P (REGNO (src)))
4593 return dbl_p ? "dmfc1\t%0,%1" : "mfc1\t%0,%1";
4594
4595 if (ALL_COP_REG_P (REGNO (src)))
4596 {
4597 static char retval[] = "dmfc_\t%0,%1";
4598
4599 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
4600 return dbl_p ? retval : retval + 1;
4601 }
4602 }
4603
4604 if (src_code == MEM)
4605 switch (GET_MODE_SIZE (mode))
4606 {
4607 case 1: return "lbu\t%0,%1";
4608 case 2: return "lhu\t%0,%1";
4609 case 4: return "lw\t%0,%1";
4610 case 8: return "ld\t%0,%1";
4611 }
4612
4613 if (src_code == CONST_INT)
4614 {
4615 /* Don't use the X format for the operand itself, because that
4616 will give out-of-range numbers for 64-bit hosts and 32-bit
4617 targets. */
4618 if (!TARGET_MIPS16)
4619 return "li\t%0,%1\t\t\t# %X1";
4620
4621 if (SMALL_OPERAND_UNSIGNED (INTVAL (src)))
4622 return "li\t%0,%1";
4623
4624 if (SMALL_OPERAND_UNSIGNED (-INTVAL (src)))
4625 return "#";
4626 }
4627
4628 if (src_code == HIGH)
4629 return TARGET_MIPS16 ? "#" : "lui\t%0,%h1";
4630
4631 if (CONST_GP_P (src))
4632 return "move\t%0,%1";
4633
4634 if (mips_symbolic_constant_p (src, SYMBOL_CONTEXT_LEA, &symbol_type)
4635 && mips_lo_relocs[symbol_type] != 0)
4636 {
4637 /* A signed 16-bit constant formed by applying a relocation
4638 operator to a symbolic address. */
4639 gcc_assert (!mips_split_p[symbol_type]);
4640 return "li\t%0,%R1";
4641 }
4642
4643 if (symbolic_operand (src, VOIDmode))
4644 {
4645 gcc_assert (TARGET_MIPS16
4646 ? TARGET_MIPS16_TEXT_LOADS
4647 : !TARGET_EXPLICIT_RELOCS);
4648 return dbl_p ? "dla\t%0,%1" : "la\t%0,%1";
4649 }
4650 }
4651 if (src_code == REG && FP_REG_P (REGNO (src)))
4652 {
4653 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4654 {
4655 if (GET_MODE (dest) == V2SFmode)
4656 return "mov.ps\t%0,%1";
4657 else
4658 return dbl_p ? "mov.d\t%0,%1" : "mov.s\t%0,%1";
4659 }
4660
4661 if (dest_code == MEM)
4662 return dbl_p ? "sdc1\t%1,%0" : "swc1\t%1,%0";
4663 }
4664 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4665 {
4666 if (src_code == MEM)
4667 return dbl_p ? "ldc1\t%0,%1" : "lwc1\t%0,%1";
4668 }
4669 if (dest_code == REG && ALL_COP_REG_P (REGNO (dest)) && src_code == MEM)
4670 {
4671 static char retval[] = "l_c_\t%0,%1";
4672
4673 retval[1] = (dbl_p ? 'd' : 'w');
4674 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
4675 return retval;
4676 }
4677 if (dest_code == MEM && src_code == REG && ALL_COP_REG_P (REGNO (src)))
4678 {
4679 static char retval[] = "s_c_\t%1,%0";
4680
4681 retval[1] = (dbl_p ? 'd' : 'w');
4682 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
4683 return retval;
4684 }
4685 gcc_unreachable ();
4686 }
4687 \f
4688 /* Return true if CMP1 is a suitable second operand for integer ordering
4689 test CODE. See also the *sCC patterns in mips.md. */
4690
4691 static bool
4692 mips_int_order_operand_ok_p (enum rtx_code code, rtx cmp1)
4693 {
4694 switch (code)
4695 {
4696 case GT:
4697 case GTU:
4698 return reg_or_0_operand (cmp1, VOIDmode);
4699
4700 case GE:
4701 case GEU:
4702 return !TARGET_MIPS16 && cmp1 == const1_rtx;
4703
4704 case LT:
4705 case LTU:
4706 return arith_operand (cmp1, VOIDmode);
4707
4708 case LE:
4709 return sle_operand (cmp1, VOIDmode);
4710
4711 case LEU:
4712 return sleu_operand (cmp1, VOIDmode);
4713
4714 default:
4715 gcc_unreachable ();
4716 }
4717 }
4718
4719 /* Return true if *CMP1 (of mode MODE) is a valid second operand for
4720 integer ordering test *CODE, or if an equivalent combination can
4721 be formed by adjusting *CODE and *CMP1. When returning true, update
4722 *CODE and *CMP1 with the chosen code and operand, otherwise leave
4723 them alone. */
4724
4725 static bool
4726 mips_canonicalize_int_order_test (enum rtx_code *code, rtx *cmp1,
4727 enum machine_mode mode)
4728 {
4729 HOST_WIDE_INT plus_one;
4730
4731 if (mips_int_order_operand_ok_p (*code, *cmp1))
4732 return true;
4733
4734 if (CONST_INT_P (*cmp1))
4735 switch (*code)
4736 {
4737 case LE:
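/* For example, "x <= 5" can be tested as "x < 6", provided that
   the incremented value does not wrap around in MODE.  */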
4738 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4739 if (INTVAL (*cmp1) < plus_one)
4740 {
4741 *code = LT;
4742 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4743 return true;
4744 }
4745 break;
4746
4747 case LEU:
4748 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4749 if (plus_one != 0)
4750 {
4751 *code = LTU;
4752 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4753 return true;
4754 }
4755 break;
4756
4757 default:
4758 break;
4759 }
4760 return false;
4761 }
4762
4763 /* Compare CMP0 and CMP1 using ordering test CODE and store the result
4764 in TARGET. CMP0 and TARGET are register_operands. If INVERT_PTR
4765 is nonnull, it's OK to set TARGET to the inverse of the result and
4766 flip *INVERT_PTR instead. */
4767
4768 static void
4769 mips_emit_int_order_test (enum rtx_code code, bool *invert_ptr,
4770 rtx target, rtx cmp0, rtx cmp1)
4771 {
4772 enum machine_mode mode;
4773
4774 /* First see if there is a MIPS instruction that can do this operation.
4775 If not, try doing the same for the inverse operation. If that also
4776 fails, force CMP1 into a register and try again. */
4777 mode = GET_MODE (cmp0);
4778 if (mips_canonicalize_int_order_test (&code, &cmp1, mode))
4779 mips_emit_binary (code, target, cmp0, cmp1);
4780 else
4781 {
4782 enum rtx_code inv_code = reverse_condition (code);
4783 if (!mips_canonicalize_int_order_test (&inv_code, &cmp1, mode))
4784 {
4785 cmp1 = force_reg (mode, cmp1);
4786 mips_emit_int_order_test (code, invert_ptr, target, cmp0, cmp1);
4787 }
4788 else if (invert_ptr == 0)
4789 {
4790 rtx inv_target;
4791
4792 inv_target = mips_force_binary (GET_MODE (target),
4793 inv_code, cmp0, cmp1);
4794 mips_emit_binary (XOR, target, inv_target, const1_rtx);
4795 }
4796 else
4797 {
4798 *invert_ptr = !*invert_ptr;
4799 mips_emit_binary (inv_code, target, cmp0, cmp1);
4800 }
4801 }
4802 }
4803
4804 /* Return a register that is zero iff CMP0 and CMP1 are equal.
4805 The register will have the same mode as CMP0. */
4806
4807 static rtx
4808 mips_zero_if_equal (rtx cmp0, rtx cmp1)
4809 {
4810 if (cmp1 == const0_rtx)
4811 return cmp0;
4812
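/* An XOR is zero iff its operands are equal, and XORI accepts the
   same unsigned 16-bit immediates as the other logical instructions,
   so use it when CMP1 fits; otherwise fall back to a subtraction.  */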
4813 if (uns_arith_operand (cmp1, VOIDmode))
4814 return expand_binop (GET_MODE (cmp0), xor_optab,
4815 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4816
4817 return expand_binop (GET_MODE (cmp0), sub_optab,
4818 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4819 }
4820
4821 /* Convert *CODE into a code that can be used in a floating-point
4822 scc instruction (C.cond.fmt). Return true if the values of
4823 the condition code registers will be inverted, with 0 indicating
4824 that the condition holds. */
4825
4826 static bool
4827 mips_reversed_fp_cond (enum rtx_code *code)
4828 {
4829 switch (*code)
4830 {
4831 case NE:
4832 case LTGT:
4833 case ORDERED:
4834 *code = reverse_condition_maybe_unordered (*code);
4835 return true;
4836
4837 default:
4838 return false;
4839 }
4840 }
4841
4842 /* Allocate a floating-point condition-code register of mode MODE.
4843
4844 These condition code registers are used for certain kinds
4845 of compound operation, such as compares and branches, vconds,
4846 and built-in functions. At expand time, their use is entirely
4847 controlled by MIPS-specific code and is entirely internal
4848 to these compound operations.
4849
4850 We could (and did in the past) expose condition-code values
4851 as pseudo registers and leave the register allocator to pick
4852 appropriate registers. The problem is that it is not practically
4853 possible for the rtl optimizers to guarantee that no spills will
4854 be needed, even when AVOID_CCMODE_COPIES is defined. We would
4855 therefore need spill and reload sequences to handle the worst case.
4856
4857 Although such sequences do exist, they are very expensive and are
4858 not something we'd want to use. This is especially true of CCV2 and
4859 CCV4, where all the shuffling would greatly outweigh whatever benefit
4860 the vectorization itself provides.
4861
4862 The main benefit of having more than one condition-code register
4863 is to allow the pipelining of operations, especially those involving
4864 comparisons and conditional moves. We don't really expect the
4865 registers to be live for long periods, and certainly never want
4866 them to be live across calls.
4867
4868 Also, there should be no penalty attached to using all the available
4869 registers. They are simply bits in the same underlying FPU control
4870 register.
4871
4872 We therefore expose the hardware registers from the outset and use
4873 a simple round-robin allocation scheme. */
4874
4875 static rtx
4876 mips_allocate_fcc (enum machine_mode mode)
4877 {
4878 unsigned int regno, count;
4879
4880 gcc_assert (TARGET_HARD_FLOAT && ISA_HAS_8CC);
4881
4882 if (mode == CCmode)
4883 count = 1;
4884 else if (mode == CCV2mode)
4885 count = 2;
4886 else if (mode == CCV4mode)
4887 count = 4;
4888 else
4889 gcc_unreachable ();
4890
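/* Round NEXT_FCC up to a multiple of COUNT, which is a power of 2.
   For example, with next_fcc == 3 and count == 2, -3 & 1 == 1 and
   the CCV2 value is allocated at offset 4.  */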
4891 cfun->machine->next_fcc += -cfun->machine->next_fcc & (count - 1);
4892 if (cfun->machine->next_fcc > ST_REG_LAST - ST_REG_FIRST)
4893 cfun->machine->next_fcc = 0;
4894 regno = ST_REG_FIRST + cfun->machine->next_fcc;
4895 cfun->machine->next_fcc += count;
4896 return gen_rtx_REG (mode, regno);
4897 }
4898
4899 /* Convert a comparison into something that can be used in a branch or
4900 conditional move. On entry, *OP0 and *OP1 are the values being
4901 compared and *CODE is the code used to compare them.
4902
4903 Update *CODE, *OP0 and *OP1 so that they describe the final comparison.
4904 If NEED_EQ_NE_P, then only EQ or NE comparisons against zero are possible,
4905 otherwise any standard branch condition can be used. The standard branch
4906 conditions are:
4907
4908 - EQ or NE between two registers.
4909 - any comparison between a register and zero. */
4910
4911 static void
4912 mips_emit_compare (enum rtx_code *code, rtx *op0, rtx *op1, bool need_eq_ne_p)
4913 {
4914 rtx cmp_op0 = *op0;
4915 rtx cmp_op1 = *op1;
4916
4917 if (GET_MODE_CLASS (GET_MODE (*op0)) == MODE_INT)
4918 {
4919 if (!need_eq_ne_p && *op1 == const0_rtx)
4920 ;
4921 else if (*code == EQ || *code == NE)
4922 {
4923 if (need_eq_ne_p)
4924 {
4925 *op0 = mips_zero_if_equal (cmp_op0, cmp_op1);
4926 *op1 = const0_rtx;
4927 }
4928 else
4929 *op1 = force_reg (GET_MODE (cmp_op0), cmp_op1);
4930 }
4931 else
4932 {
4933 /* The comparison needs a separate scc instruction. Store the
4934 result of the scc in *OP0 and compare it against zero. */
4935 bool invert = false;
4936 *op0 = gen_reg_rtx (GET_MODE (cmp_op0));
4937 mips_emit_int_order_test (*code, &invert, *op0, cmp_op0, cmp_op1);
4938 *code = (invert ? EQ : NE);
4939 *op1 = const0_rtx;
4940 }
4941 }
4942 else if (ALL_FIXED_POINT_MODE_P (GET_MODE (cmp_op0)))
4943 {
4944 *op0 = gen_rtx_REG (CCDSPmode, CCDSP_CC_REGNUM);
4945 mips_emit_binary (*code, *op0, cmp_op0, cmp_op1);
4946 *code = NE;
4947 *op1 = const0_rtx;
4948 }
4949 else
4950 {
4951 enum rtx_code cmp_code;
4952
4953 /* Floating-point tests use a separate C.cond.fmt comparison to
4954 set a condition code register. The branch or conditional move
4955 will then compare that register against zero.
4956
4957 Set CMP_CODE to the code of the comparison instruction and
4958 *CODE to the code that the branch or move should use. */
4959 cmp_code = *code;
4960 *code = mips_reversed_fp_cond (&cmp_code) ? EQ : NE;
4961 *op0 = (ISA_HAS_8CC
4962 ? mips_allocate_fcc (CCmode)
4963 : gen_rtx_REG (CCmode, FPSW_REGNUM));
4964 *op1 = const0_rtx;
4965 mips_emit_binary (cmp_code, *op0, cmp_op0, cmp_op1);
4966 }
4967 }
4968 \f
4969 /* Try performing the comparison in OPERANDS[1], whose arms are OPERANDS[2]
4970 and OPERANDS[3]. Store the result in OPERANDS[0].
4971
4972 On 64-bit targets, the mode of the comparison and target will always be
4973 SImode, thus possibly narrower than that of the comparison's operands. */
4974
4975 void
4976 mips_expand_scc (rtx operands[])
4977 {
4978 rtx target = operands[0];
4979 enum rtx_code code = GET_CODE (operands[1]);
4980 rtx op0 = operands[2];
4981 rtx op1 = operands[3];
4982
4983 gcc_assert (GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT);
4984
4985 if (code == EQ || code == NE)
4986 {
4987 if (ISA_HAS_SEQ_SNE
4988 && reg_imm10_operand (op1, GET_MODE (op1)))
4989 mips_emit_binary (code, target, op0, op1);
4990 else
4991 {
4992 rtx zie = mips_zero_if_equal (op0, op1);
4993 mips_emit_binary (code, target, zie, const0_rtx);
4994 }
4995 }
4996 else
4997 mips_emit_int_order_test (code, 0, target, op0, op1);
4998 }
4999
5000 /* Compare OPERANDS[1] with OPERANDS[2] using comparison code
5001 CODE and jump to OPERANDS[3] if the condition holds. */
5002
5003 void
5004 mips_expand_conditional_branch (rtx *operands)
5005 {
5006 enum rtx_code code = GET_CODE (operands[0]);
5007 rtx op0 = operands[1];
5008 rtx op1 = operands[2];
5009 rtx condition;
5010
5011 mips_emit_compare (&code, &op0, &op1, TARGET_MIPS16);
5012 condition = gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
5013 emit_jump_insn (gen_condjump (condition, operands[3]));
5014 }
5015
5016 /* Implement:
5017
5018 (set temp (COND:CCV2 CMP_OP0 CMP_OP1))
5019 (set DEST (unspec [TRUE_SRC FALSE_SRC temp] UNSPEC_MOVE_TF_PS)) */
5020
5021 void
5022 mips_expand_vcondv2sf (rtx dest, rtx true_src, rtx false_src,
5023 enum rtx_code cond, rtx cmp_op0, rtx cmp_op1)
5024 {
5025 rtx cmp_result;
5026 bool reversed_p;
5027
5028 reversed_p = mips_reversed_fp_cond (&cond);
5029 cmp_result = mips_allocate_fcc (CCV2mode);
5030 emit_insn (gen_scc_ps (cmp_result,
5031 gen_rtx_fmt_ee (cond, VOIDmode, cmp_op0, cmp_op1)));
5032 if (reversed_p)
5033 emit_insn (gen_mips_cond_move_tf_ps (dest, false_src, true_src,
5034 cmp_result));
5035 else
5036 emit_insn (gen_mips_cond_move_tf_ps (dest, true_src, false_src,
5037 cmp_result));
5038 }
5039
5040 /* Perform the comparison in OPERANDS[1]. Move OPERANDS[2] into OPERANDS[0]
5041 if the condition holds, otherwise move OPERANDS[3] into OPERANDS[0]. */
5042
5043 void
5044 mips_expand_conditional_move (rtx *operands)
5045 {
5046 rtx cond;
5047 enum rtx_code code = GET_CODE (operands[1]);
5048 rtx op0 = XEXP (operands[1], 0);
5049 rtx op1 = XEXP (operands[1], 1);
5050
5051 mips_emit_compare (&code, &op0, &op1, true);
5052 cond = gen_rtx_fmt_ee (code, GET_MODE (op0), op0, op1);
5053 emit_insn (gen_rtx_SET (VOIDmode, operands[0],
5054 gen_rtx_IF_THEN_ELSE (GET_MODE (operands[0]), cond,
5055 operands[2], operands[3])));
5056 }
5057
5058 /* Perform the comparison in COMPARISON, then trap if the condition holds. */
5059
5060 void
5061 mips_expand_conditional_trap (rtx comparison)
5062 {
5063 rtx op0, op1;
5064 enum machine_mode mode;
5065 enum rtx_code code;
5066
5067 /* MIPS conditional trap instructions don't have GT or LE flavors,
5068 so we must swap the operands and convert to LT and GE respectively. */
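/* For example, "trap if (gt $4,$5)" is rewritten as
   "trap if (lt $5,$4)", which maps onto the TLT instruction.  */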
5069 code = GET_CODE (comparison);
5070 switch (code)
5071 {
5072 case GT:
5073 case LE:
5074 case GTU:
5075 case LEU:
5076 code = swap_condition (code);
5077 op0 = XEXP (comparison, 1);
5078 op1 = XEXP (comparison, 0);
5079 break;
5080
5081 default:
5082 op0 = XEXP (comparison, 0);
5083 op1 = XEXP (comparison, 1);
5084 break;
5085 }
5086
5087 mode = GET_MODE (XEXP (comparison, 0));
5088 op0 = force_reg (mode, op0);
5089 if (!arith_operand (op1, mode))
5090 op1 = force_reg (mode, op1);
5091
5092 emit_insn (gen_rtx_TRAP_IF (VOIDmode,
5093 gen_rtx_fmt_ee (code, mode, op0, op1),
5094 const0_rtx));
5095 }
5096 \f
5097 /* Initialize *CUM for a call to a function of type FNTYPE. */
5098
5099 void
5100 mips_init_cumulative_args (CUMULATIVE_ARGS *cum, tree fntype)
5101 {
5102 memset (cum, 0, sizeof (*cum));
5103 cum->prototype = (fntype && prototype_p (fntype));
5104 cum->gp_reg_found = (cum->prototype && stdarg_p (fntype));
5105 }
5106
5107 /* Fill INFO with information about a single argument. CUM is the
5108 cumulative state for earlier arguments. MODE is the mode of this
5109 argument and TYPE is its type (if known). NAMED is true if this
5110 is a named (fixed) argument rather than a variable one. */
5111
5112 static void
5113 mips_get_arg_info (struct mips_arg_info *info, const CUMULATIVE_ARGS *cum,
5114 enum machine_mode mode, const_tree type, bool named)
5115 {
5116 bool doubleword_aligned_p;
5117 unsigned int num_bytes, num_words, max_regs;
5118
5119 /* Work out the size of the argument. */
5120 num_bytes = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
5121 num_words = (num_bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
5122
5123 /* Decide whether it should go in a floating-point register, assuming
5124 one is free. Later code checks for availability.
5125
5126 The checks against UNITS_PER_FPVALUE handle the soft-float and
5127 single-float cases. */
5128 switch (mips_abi)
5129 {
5130 case ABI_EABI:
5131 /* The EABI conventions have traditionally been defined in terms
5132 of TYPE_MODE, regardless of the actual type. */
5133 info->fpr_p = ((GET_MODE_CLASS (mode) == MODE_FLOAT
5134 || mode == V2SFmode)
5135 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
5136 break;
5137
5138 case ABI_32:
5139 case ABI_O64:
5140 /* Only leading floating-point scalars are passed in
5141 floating-point registers. We also handle vector floats the same
5142 way, which is OK because they are not covered by the standard ABI. */
5143 info->fpr_p = (!cum->gp_reg_found
5144 && cum->arg_number < 2
5145 && (type == 0
5146 || SCALAR_FLOAT_TYPE_P (type)
5147 || VECTOR_FLOAT_TYPE_P (type))
5148 && (GET_MODE_CLASS (mode) == MODE_FLOAT
5149 || mode == V2SFmode)
5150 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
5151 break;
5152
5153 case ABI_N32:
5154 case ABI_64:
5155 /* Scalar, complex and vector floating-point types are passed in
5156 floating-point registers, as long as this is a named rather
5157 than a variable argument. */
5158 info->fpr_p = (named
5159 && (type == 0 || FLOAT_TYPE_P (type))
5160 && (GET_MODE_CLASS (mode) == MODE_FLOAT
5161 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
5162 || mode == V2SFmode)
5163 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_FPVALUE);
5164
5165 /* ??? According to the ABI documentation, the real and imaginary
5166 parts of complex floats should be passed in individual registers.
5167 The real and imaginary parts of stack arguments are supposed
5168 to be contiguous and there should be an extra word of padding
5169 at the end.
5170
5171 This has two problems. First, it makes it impossible to use a
5172 single "void *" va_list type, since register and stack arguments
5173 are passed differently. (At the time of writing, MIPSpro cannot
5174 handle complex float varargs correctly.) Second, it's unclear
5175 what should happen when there is only one register free.
5176
5177 For now, we assume that named complex floats should go into FPRs
5178 if there are two FPRs free, otherwise they should be passed in the
5179 same way as a struct containing two floats. */
5180 if (info->fpr_p
5181 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
5182 && GET_MODE_UNIT_SIZE (mode) < UNITS_PER_FPVALUE)
5183 {
5184 if (cum->num_gprs >= MAX_ARGS_IN_REGISTERS - 1)
5185 info->fpr_p = false;
5186 else
5187 num_words = 2;
5188 }
5189 break;
5190
5191 default:
5192 gcc_unreachable ();
5193 }
5194
5195 /* See whether the argument has doubleword alignment. */
5196 doubleword_aligned_p = (mips_function_arg_boundary (mode, type)
5197 > BITS_PER_WORD);
5198
5199 /* Set REG_OFFSET to the register count we're interested in.
5200 The EABI allocates the floating-point registers separately,
5201 but the other ABIs allocate them like integer registers. */
5202 info->reg_offset = (mips_abi == ABI_EABI && info->fpr_p
5203 ? cum->num_fprs
5204 : cum->num_gprs);
5205
5206 /* Advance to an even register if the argument is doubleword-aligned. */
5207 if (doubleword_aligned_p)
5208 info->reg_offset += info->reg_offset & 1;
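/* E.g. in o32, a doubleword argument that follows a single "int"
   skips $5 and starts in the even-numbered register $6.  */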
5209
5210 /* Work out the offset of a stack argument. */
5211 info->stack_offset = cum->stack_words;
5212 if (doubleword_aligned_p)
5213 info->stack_offset += info->stack_offset & 1;
5214
5215 max_regs = MAX_ARGS_IN_REGISTERS - info->reg_offset;
5216
5217 /* Partition the argument between registers and stack. */
5218 info->reg_words = MIN (num_words, max_regs);
5219 info->stack_words = num_words - info->reg_words;
5220 }
5221
5222 /* INFO describes a register argument that has the normal format for the
5223 argument's mode. Return the register it uses, assuming that FPRs are
5224 available if HARD_FLOAT_P. */
5225
5226 static unsigned int
5227 mips_arg_regno (const struct mips_arg_info *info, bool hard_float_p)
5228 {
5229 if (!info->fpr_p || !hard_float_p)
5230 return GP_ARG_FIRST + info->reg_offset;
5231 else if (mips_abi == ABI_32 && TARGET_DOUBLE_FLOAT && info->reg_offset > 0)
5232 /* In o32, the second argument is always passed in $f14
5233 for TARGET_DOUBLE_FLOAT, regardless of whether the
5234 first argument was a word or doubleword. */
5235 return FP_ARG_FIRST + 2;
5236 else
5237 return FP_ARG_FIRST + info->reg_offset;
5238 }
5239
5240 /* Implement TARGET_STRICT_ARGUMENT_NAMING. */
5241
5242 static bool
5243 mips_strict_argument_naming (cumulative_args_t ca ATTRIBUTE_UNUSED)
5244 {
5245 return !TARGET_OLDABI;
5246 }
5247
5248 /* Implement TARGET_FUNCTION_ARG. */
5249
5250 static rtx
5251 mips_function_arg (cumulative_args_t cum_v, enum machine_mode mode,
5252 const_tree type, bool named)
5253 {
5254 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
5255 struct mips_arg_info info;
5256
5257 /* We will be called with a mode of VOIDmode after the last argument
5258 has been seen. Whatever we return will be passed to the call expander.
5259 If we need a MIPS16 fp_code, return a REG with the code stored as
5260 the mode. */
5261 if (mode == VOIDmode)
5262 {
5263 if (TARGET_MIPS16 && cum->fp_code != 0)
5264 return gen_rtx_REG ((enum machine_mode) cum->fp_code, 0);
5265 else
5266 return NULL;
5267 }
5268
5269 mips_get_arg_info (&info, cum, mode, type, named);
5270
5271 /* Return straight away if the whole argument is passed on the stack. */
5272 if (info.reg_offset == MAX_ARGS_IN_REGISTERS)
5273 return NULL;
5274
5275 /* The n32 and n64 ABIs say that if any 64-bit chunk of the structure
5276 contains a double in its entirety, then that 64-bit chunk is passed
5277 in a floating-point register. */
5278 if (TARGET_NEWABI
5279 && TARGET_HARD_FLOAT
5280 && named
5281 && type != 0
5282 && TREE_CODE (type) == RECORD_TYPE
5283 && TYPE_SIZE_UNIT (type)
5284 && tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
5285 {
5286 tree field;
5287
5288 /* First check to see if there is any such field. */
5289 for (field = TYPE_FIELDS (type); field; field = DECL_CHAIN (field))
5290 if (TREE_CODE (field) == FIELD_DECL
5291 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
5292 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD
5293 && tree_fits_shwi_p (bit_position (field))
5294 && int_bit_position (field) % BITS_PER_WORD == 0)
5295 break;
5296
5297 if (field != 0)
5298 {
5299 /* Now handle the special case by returning a PARALLEL
5300 indicating where each 64-bit chunk goes. INFO.REG_WORDS
5301 chunks are passed in registers. */
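/* For example, under n64 a named "struct { double d; long l; }"
   argument starting at register offset 0 would be described as

	(parallel [(expr_list (reg:DF $f12) (const_int 0))
		   (expr_list (reg:DI $5) (const_int 8))])

   with the double in an FPR and the long in a GPR.  */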
5302 unsigned int i;
5303 HOST_WIDE_INT bitpos;
5304 rtx ret;
5305
5306 /* assign_parms checks the mode of ENTRY_PARM, so we must
5307 use the actual mode here. */
5308 ret = gen_rtx_PARALLEL (mode, rtvec_alloc (info.reg_words));
5309
5310 bitpos = 0;
5311 field = TYPE_FIELDS (type);
5312 for (i = 0; i < info.reg_words; i++)
5313 {
5314 rtx reg;
5315
5316 for (; field; field = DECL_CHAIN (field))
5317 if (TREE_CODE (field) == FIELD_DECL
5318 && int_bit_position (field) >= bitpos)
5319 break;
5320
5321 if (field
5322 && int_bit_position (field) == bitpos
5323 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
5324 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD)
5325 reg = gen_rtx_REG (DFmode, FP_ARG_FIRST + info.reg_offset + i);
5326 else
5327 reg = gen_rtx_REG (DImode, GP_ARG_FIRST + info.reg_offset + i);
5328
5329 XVECEXP (ret, 0, i)
5330 = gen_rtx_EXPR_LIST (VOIDmode, reg,
5331 GEN_INT (bitpos / BITS_PER_UNIT));
5332
5333 bitpos += BITS_PER_WORD;
5334 }
5335 return ret;
5336 }
5337 }
5338
5339 /* Handle the n32/n64 conventions for passing complex floating-point
5340 arguments in FPR pairs. The real part goes in the lower register
5341 and the imaginary part goes in the upper register. */
5342 if (TARGET_NEWABI
5343 && info.fpr_p
5344 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5345 {
5346 rtx real, imag;
5347 enum machine_mode inner;
5348 unsigned int regno;
5349
5350 inner = GET_MODE_INNER (mode);
5351 regno = FP_ARG_FIRST + info.reg_offset;
5352 if (info.reg_words * UNITS_PER_WORD == GET_MODE_SIZE (inner))
5353 {
5354 /* Real part in registers, imaginary part on stack. */
5355 gcc_assert (info.stack_words == info.reg_words);
5356 return gen_rtx_REG (inner, regno);
5357 }
5358 else
5359 {
5360 gcc_assert (info.stack_words == 0);
5361 real = gen_rtx_EXPR_LIST (VOIDmode,
5362 gen_rtx_REG (inner, regno),
5363 const0_rtx);
5364 imag = gen_rtx_EXPR_LIST (VOIDmode,
5365 gen_rtx_REG (inner,
5366 regno + info.reg_words / 2),
5367 GEN_INT (GET_MODE_SIZE (inner)));
5368 return gen_rtx_PARALLEL (mode, gen_rtvec (2, real, imag));
5369 }
5370 }
5371
5372 return gen_rtx_REG (mode, mips_arg_regno (&info, TARGET_HARD_FLOAT));
5373 }
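
/* A worked example of the PARALLEL case above (illustrative only):
   under n64 with hard float, a named argument of type

     struct s { double d; long l; };

   occupies two 64-bit chunks.  The loop above returns a PARALLEL whose
   first entry is a DFmode FPR (for D, a doubleword-aligned double) and
   whose second entry is a DImode GPR (for L). */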
5374
5375 /* Implement TARGET_FUNCTION_ARG_ADVANCE. */
5376
5377 static void
5378 mips_function_arg_advance (cumulative_args_t cum_v, enum machine_mode mode,
5379 const_tree type, bool named)
5380 {
5381 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
5382 struct mips_arg_info info;
5383
5384 mips_get_arg_info (&info, cum, mode, type, named);
5385
5386 if (!info.fpr_p)
5387 cum->gp_reg_found = true;
5388
5389 /* See the comment above the CUMULATIVE_ARGS structure in mips.h for
5390 an explanation of what this code does. It assumes that we're using
5391 either the o32 or the o64 ABI, both of which pass at most 2 arguments
5392 in FPRs. */
5393 if (cum->arg_number < 2 && info.fpr_p)
5394 cum->fp_code += (mode == SFmode ? 1 : 2) << (cum->arg_number * 2);
5395
5396 /* Advance the register count. This has the effect of setting
5397 num_gprs to MAX_ARGS_IN_REGISTERS if a doubleword-aligned
5398 argument required us to skip the final GPR and pass the whole
5399 argument on the stack. */
5400 if (mips_abi != ABI_EABI || !info.fpr_p)
5401 cum->num_gprs = info.reg_offset + info.reg_words;
5402 else if (info.reg_words > 0)
5403 cum->num_fprs += MAX_FPRS_PER_FMT;
5404
5405 /* Advance the stack word count. */
5406 if (info.stack_words > 0)
5407 cum->stack_words = info.stack_offset + info.stack_words;
5408
5409 cum->arg_number++;
5410 }
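
/* A worked example of the FP_CODE encoding above (illustrative only):
   for a prototype

     void f (float a, double b);

   argument 0 contributes 1 << 0 and argument 1 contributes 2 << 2,
   so CUM->FP_CODE ends up as 0x9.  mips_output_args_xfer later decodes
   this two bits at a time: 01 means float, 10 means double. */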
5411
5412 /* Implement TARGET_ARG_PARTIAL_BYTES. */
5413
5414 static int
5415 mips_arg_partial_bytes (cumulative_args_t cum,
5416 enum machine_mode mode, tree type, bool named)
5417 {
5418 struct mips_arg_info info;
5419
5420 mips_get_arg_info (&info, get_cumulative_args (cum), mode, type, named);
5421 return info.stack_words > 0 ? info.reg_words * UNITS_PER_WORD : 0;
5422 }
5423
5424 /* Implement TARGET_FUNCTION_ARG_BOUNDARY. Every parameter gets at
5425 least PARM_BOUNDARY bits of alignment, but will be given anything up
5426 to STACK_BOUNDARY bits if the type requires it. */
5427
5428 static unsigned int
5429 mips_function_arg_boundary (enum machine_mode mode, const_tree type)
5430 {
5431 unsigned int alignment;
5432
5433 alignment = type ? TYPE_ALIGN (type) : GET_MODE_ALIGNMENT (mode);
5434 if (alignment < PARM_BOUNDARY)
5435 alignment = PARM_BOUNDARY;
5436 if (alignment > STACK_BOUNDARY)
5437 alignment = STACK_BOUNDARY;
5438 return alignment;
5439 }
5440
5441 /* Return true if FUNCTION_ARG_PADDING (MODE, TYPE) should return
5442 upward rather than downward. In other words, return true if the
5443 first byte of the stack slot has useful data, false if the last
5444 byte does. */
5445
5446 bool
5447 mips_pad_arg_upward (enum machine_mode mode, const_tree type)
5448 {
5449 /* On little-endian targets, the first byte of every stack argument
5450 is passed in the first byte of the stack slot. */
5451 if (!BYTES_BIG_ENDIAN)
5452 return true;
5453
5454 /* Otherwise, integral types are padded downward: the last byte of a
5455 stack argument is passed in the last byte of the stack slot. */
5456 if (type != 0
5457 ? (INTEGRAL_TYPE_P (type)
5458 || POINTER_TYPE_P (type)
5459 || FIXED_POINT_TYPE_P (type))
5460 : (SCALAR_INT_MODE_P (mode)
5461 || ALL_SCALAR_FIXED_POINT_MODE_P (mode)))
5462 return false;
5463
5464 /* Big-endian o64 pads floating-point arguments downward. */
5465 if (mips_abi == ABI_O64)
5466 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
5467 return false;
5468
5469 /* Other types are padded upward for o32, o64, n32 and n64. */
5470 if (mips_abi != ABI_EABI)
5471 return true;
5472
5473 /* Arguments smaller than a stack slot are padded downward. */
5474 if (mode != BLKmode)
5475 return GET_MODE_BITSIZE (mode) >= PARM_BOUNDARY;
5476 else
5477 return int_size_in_bytes (type) >= (PARM_BOUNDARY / BITS_PER_UNIT);
5478 }
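
/* For example, on a big-endian o32 target a "char" argument is padded
   downward and so occupies the last byte of its 4-byte stack slot,
   whereas a small structure is padded upward and occupies the first
   bytes.  This is only an illustration of the rules above. */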
5479
5480 /* Likewise BLOCK_REG_PADDING (MODE, TYPE, ...). Return !BYTES_BIG_ENDIAN
5481 if the least significant byte of the register has useful data. Return
5482 the opposite if the most significant byte does. */
5483
5484 bool
5485 mips_pad_reg_upward (enum machine_mode mode, tree type)
5486 {
5487 /* No shifting is required for floating-point arguments. */
5488 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
5489 return !BYTES_BIG_ENDIAN;
5490
5491 /* Otherwise, apply the same padding to register arguments as we do
5492 to stack arguments. */
5493 return mips_pad_arg_upward (mode, type);
5494 }
5495
5496 /* Return true when an argument must be passed by reference. */
5497
5498 static bool
5499 mips_pass_by_reference (cumulative_args_t cum ATTRIBUTE_UNUSED,
5500 enum machine_mode mode, const_tree type,
5501 bool named ATTRIBUTE_UNUSED)
5502 {
5503 if (mips_abi == ABI_EABI)
5504 {
5505 int size;
5506
5507 /* ??? How should SCmode be handled? */
5508 if (mode == DImode || mode == DFmode
5509 || mode == DQmode || mode == UDQmode
5510 || mode == DAmode || mode == UDAmode)
5511 return false;
5512
5513 size = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
5514 return size == -1 || size > UNITS_PER_WORD;
5515 }
5516 else
5517 {
5518 /* If we have a variable-sized parameter, we have no choice. */
5519 return targetm.calls.must_pass_in_stack (mode, type);
5520 }
5521 }
5522
5523 /* Implement TARGET_CALLEE_COPIES. */
5524
5525 static bool
5526 mips_callee_copies (cumulative_args_t cum ATTRIBUTE_UNUSED,
5527 enum machine_mode mode ATTRIBUTE_UNUSED,
5528 const_tree type ATTRIBUTE_UNUSED, bool named)
5529 {
5530 return mips_abi == ABI_EABI && named;
5531 }
5532 \f
5533 /* See whether VALTYPE is a record whose fields should be returned in
5534 floating-point registers. If so, return the number of fields and
5535 list them in FIELDS (which should have two elements). Return 0
5536 otherwise.
5537
5538 For n32 & n64, a structure with one or two fields is returned in
5539 floating-point registers as long as every field has a floating-point
5540 type. */
5541
5542 static int
5543 mips_fpr_return_fields (const_tree valtype, tree *fields)
5544 {
5545 tree field;
5546 int i;
5547
5548 if (!TARGET_NEWABI)
5549 return 0;
5550
5551 if (TREE_CODE (valtype) != RECORD_TYPE)
5552 return 0;
5553
5554 i = 0;
5555 for (field = TYPE_FIELDS (valtype); field != 0; field = DECL_CHAIN (field))
5556 {
5557 if (TREE_CODE (field) != FIELD_DECL)
5558 continue;
5559
5560 if (!SCALAR_FLOAT_TYPE_P (TREE_TYPE (field)))
5561 return 0;
5562
5563 if (i == 2)
5564 return 0;
5565
5566 fields[i++] = field;
5567 }
5568 return i;
5569 }
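
/* For illustration: under n32/n64,

     struct s1 { float f; double d; };

   meets the conditions above (at most two fields, all floating-point)
   and so is returned in $f0 and $f2, whereas

     struct s2 { float f; int i; };

   fails the SCALAR_FLOAT_TYPE_P check and is returned in GPRs. */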
5570
5571 /* Implement TARGET_RETURN_IN_MSB. For n32 & n64, we should return
5572 a value in the most significant part of $2/$3 if:
5573
5574 - the target is big-endian;
5575
5576 - the value has a structure or union type (we generalize this to
5577 cover aggregates from other languages too); and
5578
5579 - the structure is not returned in floating-point registers. */
5580
5581 static bool
5582 mips_return_in_msb (const_tree valtype)
5583 {
5584 tree fields[2];
5585
5586 return (TARGET_NEWABI
5587 && TARGET_BIG_ENDIAN
5588 && AGGREGATE_TYPE_P (valtype)
5589 && mips_fpr_return_fields (valtype, fields) == 0);
5590 }
5591
5592 /* Return true if the function return value MODE will get returned in a
5593 floating-point register. */
5594
5595 static bool
5596 mips_return_mode_in_fpr_p (enum machine_mode mode)
5597 {
5598 return ((GET_MODE_CLASS (mode) == MODE_FLOAT
5599 || mode == V2SFmode
5600 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5601 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_HWFPVALUE);
5602 }
5603
5604 /* Return the representation of an FPR return register when the
5605 value being returned in FP_RETURN has mode VALUE_MODE and the
5606 return type itself has mode TYPE_MODE. On NewABI targets,
5607 the two modes may be different for structures like:
5608
5609 struct __attribute__((packed)) foo { float f; }
5610
5611 where we return the SFmode value of "f" in FP_RETURN, but where
5612 the structure itself has mode BLKmode. */
5613
5614 static rtx
5615 mips_return_fpr_single (enum machine_mode type_mode,
5616 enum machine_mode value_mode)
5617 {
5618 rtx x;
5619
5620 x = gen_rtx_REG (value_mode, FP_RETURN);
5621 if (type_mode != value_mode)
5622 {
5623 x = gen_rtx_EXPR_LIST (VOIDmode, x, const0_rtx);
5624 x = gen_rtx_PARALLEL (type_mode, gen_rtvec (1, x));
5625 }
5626 return x;
5627 }
5628
5629 /* Return a composite value in a pair of floating-point registers.
5630 MODE1 and OFFSET1 are the mode and byte offset for the first value,
5631 likewise MODE2 and OFFSET2 for the second. MODE is the mode of the
5632 complete value.
5633
5634 For n32 & n64, $f0 always holds the first value and $f2 the second.
5635 Otherwise the values are packed together as closely as possible. */
5636
5637 static rtx
5638 mips_return_fpr_pair (enum machine_mode mode,
5639 enum machine_mode mode1, HOST_WIDE_INT offset1,
5640 enum machine_mode mode2, HOST_WIDE_INT offset2)
5641 {
5642 int inc;
5643
5644 inc = (TARGET_NEWABI ? 2 : MAX_FPRS_PER_FMT);
5645 return gen_rtx_PARALLEL
5646 (mode,
5647 gen_rtvec (2,
5648 gen_rtx_EXPR_LIST (VOIDmode,
5649 gen_rtx_REG (mode1, FP_RETURN),
5650 GEN_INT (offset1)),
5651 gen_rtx_EXPR_LIST (VOIDmode,
5652 gen_rtx_REG (mode2, FP_RETURN + inc),
5653 GEN_INT (offset2))));
5654
5655 }
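
/* For example, a "_Complex double" return value under n32/n64 becomes
   a PARALLEL of (DFmode, $f0, offset 0) and (DFmode, $f2, offset 8).
   Under o32 -mfp32 the second register is also $f2, since
   MAX_FPRS_PER_FMT is 2 there.  Illustrative only. */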
5656
5657 /* Implement TARGET_FUNCTION_VALUE and TARGET_LIBCALL_VALUE.
5658 For normal calls, VALTYPE is the return type and MODE is VOIDmode.
5659 For libcalls, VALTYPE is null and MODE is the mode of the return value. */
5660
5661 static rtx
5662 mips_function_value_1 (const_tree valtype, const_tree fn_decl_or_type,
5663 enum machine_mode mode)
5664 {
5665 if (valtype)
5666 {
5667 tree fields[2];
5668 int unsigned_p;
5669 const_tree func;
5670
5671 if (fn_decl_or_type && DECL_P (fn_decl_or_type))
5672 func = fn_decl_or_type;
5673 else
5674 func = NULL;
5675
5676 mode = TYPE_MODE (valtype);
5677 unsigned_p = TYPE_UNSIGNED (valtype);
5678
5679 /* Since TARGET_PROMOTE_FUNCTION_MODE unconditionally promotes
5680 return values, promote the mode here too. */
5681 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1);
5682
5683 /* Handle structures whose fields are returned in $f0/$f2. */
5684 switch (mips_fpr_return_fields (valtype, fields))
5685 {
5686 case 1:
5687 return mips_return_fpr_single (mode,
5688 TYPE_MODE (TREE_TYPE (fields[0])));
5689
5690 case 2:
5691 return mips_return_fpr_pair (mode,
5692 TYPE_MODE (TREE_TYPE (fields[0])),
5693 int_byte_position (fields[0]),
5694 TYPE_MODE (TREE_TYPE (fields[1])),
5695 int_byte_position (fields[1]));
5696 }
5697
5698 /* If a value is passed in the most significant part of a register, see
5699 whether we have to round the mode up to a whole number of words. */
5700 if (mips_return_in_msb (valtype))
5701 {
5702 HOST_WIDE_INT size = int_size_in_bytes (valtype);
5703 if (size % UNITS_PER_WORD != 0)
5704 {
5705 size += UNITS_PER_WORD - size % UNITS_PER_WORD;
5706 mode = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0);
5707 }
5708 }
5709
5710 /* For EABI, the class of return register depends entirely on MODE.
5711 For example, "struct { some_type x; }" and "union { some_type x; }"
5712 are returned in the same way as a bare "some_type" would be.
5713 Other ABIs only use FPRs for scalar, complex or vector types. */
5714 if (mips_abi != ABI_EABI && !FLOAT_TYPE_P (valtype))
5715 return gen_rtx_REG (mode, GP_RETURN);
5716 }
5717
5718 if (!TARGET_MIPS16)
5719 {
5720 /* Handle long doubles for n32 & n64. */
5721 if (mode == TFmode)
5722 return mips_return_fpr_pair (mode,
5723 DImode, 0,
5724 DImode, GET_MODE_SIZE (mode) / 2);
5725
5726 if (mips_return_mode_in_fpr_p (mode))
5727 {
5728 if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5729 return mips_return_fpr_pair (mode,
5730 GET_MODE_INNER (mode), 0,
5731 GET_MODE_INNER (mode),
5732 GET_MODE_SIZE (mode) / 2);
5733 else
5734 return gen_rtx_REG (mode, FP_RETURN);
5735 }
5736 }
5737
5738 return gen_rtx_REG (mode, GP_RETURN);
5739 }
5740
5741 /* Implement TARGET_FUNCTION_VALUE. */
5742
5743 static rtx
5744 mips_function_value (const_tree valtype, const_tree fn_decl_or_type,
5745 bool outgoing ATTRIBUTE_UNUSED)
5746 {
5747 return mips_function_value_1 (valtype, fn_decl_or_type, VOIDmode);
5748 }
5749
5750 /* Implement TARGET_LIBCALL_VALUE. */
5751
5752 static rtx
5753 mips_libcall_value (enum machine_mode mode, const_rtx fun ATTRIBUTE_UNUSED)
5754 {
5755 return mips_function_value_1 (NULL_TREE, NULL_TREE, mode);
5756 }
5757
5758 /* Implement TARGET_FUNCTION_VALUE_REGNO_P.
5759
5760 On the MIPS, R2, R3, F0 and F2 are the only registers used this way;
5761 this hook recognizes R2, F0 and, for 128-bit long doubles, F2. */
5762
5763 static bool
5764 mips_function_value_regno_p (const unsigned int regno)
5765 {
5766 if (regno == GP_RETURN
5767 || regno == FP_RETURN
5768 || (LONG_DOUBLE_TYPE_SIZE == 128
5769 && FP_RETURN != GP_RETURN
5770 && regno == FP_RETURN + 2))
5771 return true;
5772
5773 return false;
5774 }
5775
5776 /* Implement TARGET_RETURN_IN_MEMORY. Under the o32 and o64 ABIs,
5777 all BLKmode objects are returned in memory. Under the n32, n64
5778 and embedded ABIs, small structures are returned in a register.
5779 Objects with varying size must still be returned in memory, of
5780 course. */
5781
5782 static bool
5783 mips_return_in_memory (const_tree type, const_tree fndecl ATTRIBUTE_UNUSED)
5784 {
5785 return (TARGET_OLDABI
5786 ? TYPE_MODE (type) == BLKmode
5787 : !IN_RANGE (int_size_in_bytes (type), 0, 2 * UNITS_PER_WORD));
5788 }
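
/* For example, under n64 (UNITS_PER_WORD == 8) a 16-byte structure is
   returned in registers while a 17-byte one is returned in memory;
   under o32 every BLKmode aggregate is returned in memory.  This is
   just an illustration of the rule above. */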
5789 \f
5790 /* Implement TARGET_SETUP_INCOMING_VARARGS. */
5791
5792 static void
5793 mips_setup_incoming_varargs (cumulative_args_t cum, enum machine_mode mode,
5794 tree type, int *pretend_size ATTRIBUTE_UNUSED,
5795 int no_rtl)
5796 {
5797 CUMULATIVE_ARGS local_cum;
5798 int gp_saved, fp_saved;
5799
5800 /* The caller has advanced CUM up to, but not beyond, the last named
5801 argument. Advance a local copy of CUM past the last "real" named
5802 argument, to find out how many registers are left over. */
5803 local_cum = *get_cumulative_args (cum);
5804 mips_function_arg_advance (pack_cumulative_args (&local_cum), mode, type,
5805 true);
5806
5807 /* Find out how many registers we need to save. */
5808 gp_saved = MAX_ARGS_IN_REGISTERS - local_cum.num_gprs;
5809 fp_saved = (EABI_FLOAT_VARARGS_P
5810 ? MAX_ARGS_IN_REGISTERS - local_cum.num_fprs
5811 : 0);
5812
5813 if (!no_rtl)
5814 {
5815 if (gp_saved > 0)
5816 {
5817 rtx ptr, mem;
5818
5819 ptr = plus_constant (Pmode, virtual_incoming_args_rtx,
5820 REG_PARM_STACK_SPACE (cfun->decl)
5821 - gp_saved * UNITS_PER_WORD);
5822 mem = gen_frame_mem (BLKmode, ptr);
5823 set_mem_alias_set (mem, get_varargs_alias_set ());
5824
5825 move_block_from_reg (local_cum.num_gprs + GP_ARG_FIRST,
5826 mem, gp_saved);
5827 }
5828 if (fp_saved > 0)
5829 {
5830 /* We can't use move_block_from_reg, because it will use
5831 the wrong mode. */
5832 enum machine_mode mode;
5833 int off, i;
5834
5835 /* Set OFF to the offset from virtual_incoming_args_rtx of
5836 the first float register. The FP save area lies below
5837 the integer one, and is aligned to UNITS_PER_FPVALUE bytes. */
5838 off = (-gp_saved * UNITS_PER_WORD) & -UNITS_PER_FPVALUE;
5839 off -= fp_saved * UNITS_PER_FPREG;
5840
5841 mode = TARGET_SINGLE_FLOAT ? SFmode : DFmode;
5842
5843 for (i = local_cum.num_fprs; i < MAX_ARGS_IN_REGISTERS;
5844 i += MAX_FPRS_PER_FMT)
5845 {
5846 rtx ptr, mem;
5847
5848 ptr = plus_constant (Pmode, virtual_incoming_args_rtx, off);
5849 mem = gen_frame_mem (mode, ptr);
5850 set_mem_alias_set (mem, get_varargs_alias_set ());
5851 mips_emit_move (mem, gen_rtx_REG (mode, FP_ARG_FIRST + i));
5852 off += UNITS_PER_HWFPVALUE;
5853 }
5854 }
5855 }
5856 if (REG_PARM_STACK_SPACE (cfun->decl) == 0)
5857 cfun->machine->varargs_size = (gp_saved * UNITS_PER_WORD
5858 + fp_saved * UNITS_PER_FPREG);
5859 }
5860
5861 /* Implement TARGET_BUILTIN_VA_LIST. */
5862
5863 static tree
5864 mips_build_builtin_va_list (void)
5865 {
5866 if (EABI_FLOAT_VARARGS_P)
5867 {
5868 /* We keep three pointers and two offsets.
5869
5870 Two pointers are to the overflow area, which starts at the CFA.
5871 One of these is constant, for addressing into the GPR save area
5872 below it. The other is advanced up the stack through the
5873 overflow region.
5874
5875 The third pointer is to the bottom of the GPR save area.
5876 Since the FPR save area is just below it, we can address
5877 FPR slots off this pointer.
5878
5879 We also keep two one-byte offsets, which are to be subtracted
5880 from the constant pointers to yield addresses in the GPR and
5881 FPR save areas. These are downcounted as float or non-float
5882 arguments are used, and when they get to zero, the argument
5883 must be obtained from the overflow region. */
5884 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff, f_res, record;
5885 tree array, index;
5886
5887 record = lang_hooks.types.make_type (RECORD_TYPE);
5888
5889 f_ovfl = build_decl (BUILTINS_LOCATION,
5890 FIELD_DECL, get_identifier ("__overflow_argptr"),
5891 ptr_type_node);
5892 f_gtop = build_decl (BUILTINS_LOCATION,
5893 FIELD_DECL, get_identifier ("__gpr_top"),
5894 ptr_type_node);
5895 f_ftop = build_decl (BUILTINS_LOCATION,
5896 FIELD_DECL, get_identifier ("__fpr_top"),
5897 ptr_type_node);
5898 f_goff = build_decl (BUILTINS_LOCATION,
5899 FIELD_DECL, get_identifier ("__gpr_offset"),
5900 unsigned_char_type_node);
5901 f_foff = build_decl (BUILTINS_LOCATION,
5902 FIELD_DECL, get_identifier ("__fpr_offset"),
5903 unsigned_char_type_node);
5904 /* Explicitly pad to the size of a pointer, so that -Wpadded won't
5905 warn on every user file. */
5906 index = build_int_cst (NULL_TREE, GET_MODE_SIZE (ptr_mode) - 2 - 1);
5907 array = build_array_type (unsigned_char_type_node,
5908 build_index_type (index));
5909 f_res = build_decl (BUILTINS_LOCATION,
5910 FIELD_DECL, get_identifier ("__reserved"), array);
5911
5912 DECL_FIELD_CONTEXT (f_ovfl) = record;
5913 DECL_FIELD_CONTEXT (f_gtop) = record;
5914 DECL_FIELD_CONTEXT (f_ftop) = record;
5915 DECL_FIELD_CONTEXT (f_goff) = record;
5916 DECL_FIELD_CONTEXT (f_foff) = record;
5917 DECL_FIELD_CONTEXT (f_res) = record;
5918
5919 TYPE_FIELDS (record) = f_ovfl;
5920 DECL_CHAIN (f_ovfl) = f_gtop;
5921 DECL_CHAIN (f_gtop) = f_ftop;
5922 DECL_CHAIN (f_ftop) = f_goff;
5923 DECL_CHAIN (f_goff) = f_foff;
5924 DECL_CHAIN (f_foff) = f_res;
5925
5926 layout_type (record);
5927 return record;
5928 }
5929 else
5930 /* Otherwise, we use 'void *'. */
5931 return ptr_type_node;
5932 }
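
/* A rough C equivalent of the EABI va_list record built above (a
   sketch only; the tag name is hypothetical and the real type is
   constructed directly as trees):

     struct __mips_eabi_va_list {
       void *__overflow_argptr;
       void *__gpr_top;
       void *__fpr_top;
       unsigned char __gpr_offset;
       unsigned char __fpr_offset;
       unsigned char __reserved[sizeof (void *) - 2];
     };

   The reserved array pads the record to a multiple of the pointer
   size, as noted above. */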
5933
5934 /* Implement TARGET_EXPAND_BUILTIN_VA_START. */
5935
5936 static void
5937 mips_va_start (tree valist, rtx nextarg)
5938 {
5939 if (EABI_FLOAT_VARARGS_P)
5940 {
5941 const CUMULATIVE_ARGS *cum;
5942 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
5943 tree ovfl, gtop, ftop, goff, foff;
5944 tree t;
5945 int gpr_save_area_size;
5946 int fpr_save_area_size;
5947 int fpr_offset;
5948
5949 cum = &crtl->args.info;
5950 gpr_save_area_size
5951 = (MAX_ARGS_IN_REGISTERS - cum->num_gprs) * UNITS_PER_WORD;
5952 fpr_save_area_size
5953 = (MAX_ARGS_IN_REGISTERS - cum->num_fprs) * UNITS_PER_FPREG;
5954
5955 f_ovfl = TYPE_FIELDS (va_list_type_node);
5956 f_gtop = DECL_CHAIN (f_ovfl);
5957 f_ftop = DECL_CHAIN (f_gtop);
5958 f_goff = DECL_CHAIN (f_ftop);
5959 f_foff = DECL_CHAIN (f_goff);
5960
5961 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
5962 NULL_TREE);
5963 gtop = build3 (COMPONENT_REF, TREE_TYPE (f_gtop), valist, f_gtop,
5964 NULL_TREE);
5965 ftop = build3 (COMPONENT_REF, TREE_TYPE (f_ftop), valist, f_ftop,
5966 NULL_TREE);
5967 goff = build3 (COMPONENT_REF, TREE_TYPE (f_goff), valist, f_goff,
5968 NULL_TREE);
5969 foff = build3 (COMPONENT_REF, TREE_TYPE (f_foff), valist, f_foff,
5970 NULL_TREE);
5971
5972 /* Emit code to initialize OVFL, which points to the next varargs
5973 stack argument. CUM->STACK_WORDS gives the number of stack
5974 words used by named arguments. */
5975 t = make_tree (TREE_TYPE (ovfl), virtual_incoming_args_rtx);
5976 if (cum->stack_words > 0)
5977 t = fold_build_pointer_plus_hwi (t, cum->stack_words * UNITS_PER_WORD);
5978 t = build2 (MODIFY_EXPR, TREE_TYPE (ovfl), ovfl, t);
5979 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5980
5981 /* Emit code to initialize GTOP, the top of the GPR save area. */
5982 t = make_tree (TREE_TYPE (gtop), virtual_incoming_args_rtx);
5983 t = build2 (MODIFY_EXPR, TREE_TYPE (gtop), gtop, t);
5984 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5985
5986 /* Emit code to initialize FTOP, the top of the FPR save area.
5987 This address is gpr_save_area_bytes below GTOP, rounded
5988 down to the next fp-aligned boundary. */
5989 t = make_tree (TREE_TYPE (ftop), virtual_incoming_args_rtx);
5990 fpr_offset = gpr_save_area_size + UNITS_PER_FPVALUE - 1;
5991 fpr_offset &= -UNITS_PER_FPVALUE;
5992 if (fpr_offset)
5993 t = fold_build_pointer_plus_hwi (t, -fpr_offset);
5994 t = build2 (MODIFY_EXPR, TREE_TYPE (ftop), ftop, t);
5995 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5996
5997 /* Emit code to initialize GOFF, the offset from GTOP of the
5998 next GPR argument. */
5999 t = build2 (MODIFY_EXPR, TREE_TYPE (goff), goff,
6000 build_int_cst (TREE_TYPE (goff), gpr_save_area_size));
6001 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
6002
6003 /* Likewise emit code to initialize FOFF, the offset from FTOP
6004 of the next FPR argument. */
6005 t = build2 (MODIFY_EXPR, TREE_TYPE (foff), foff,
6006 build_int_cst (TREE_TYPE (foff), fpr_save_area_size));
6007 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
6008 }
6009 else
6010 {
6011 nextarg = plus_constant (Pmode, nextarg, -cfun->machine->varargs_size);
6012 std_expand_builtin_va_start (valist, nextarg);
6013 }
6014 }
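
/* A sketch of the EABI layout set up above (illustrative; exact sizes
   depend on how many named arguments were seen):

          | overflow args |  <- ovfl (advanced as va_arg consumes them)
     CFA: +---------------+  <- gtop
          | GPR save area |  gpr_save_area_size bytes
          +---------------+  <- ftop (rounded down to fp alignment)
          | FPR save area |  fpr_save_area_size bytes
          +---------------+

   GOFF and FOFF count down from GTOP and FTOP respectively. */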
6015
6016 /* Like std_gimplify_va_arg_expr, but apply alignment to zero-sized
6017 types as well. */
6018
6019 static tree
6020 mips_std_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p,
6021 gimple_seq *post_p)
6022 {
6023 tree addr, t, type_size, rounded_size, valist_tmp;
6024 unsigned HOST_WIDE_INT align, boundary;
6025 bool indirect;
6026
6027 indirect = pass_by_reference (NULL, TYPE_MODE (type), type, false);
6028 if (indirect)
6029 type = build_pointer_type (type);
6030
6031 align = PARM_BOUNDARY / BITS_PER_UNIT;
6032 boundary = targetm.calls.function_arg_boundary (TYPE_MODE (type), type);
6033
6034 /* When the caller aligns a parameter on the stack, any alignment
6035 beyond MAX_SUPPORTED_STACK_ALIGNMENT is capped at
6036 MAX_SUPPORTED_STACK_ALIGNMENT.  Match the caller's behavior
6037 here in the callee. */
6038 if (boundary > MAX_SUPPORTED_STACK_ALIGNMENT)
6039 boundary = MAX_SUPPORTED_STACK_ALIGNMENT;
6040
6041 boundary /= BITS_PER_UNIT;
6042
6043 /* Hoist the valist value into a temporary for the moment. */
6044 valist_tmp = get_initialized_tmp_var (valist, pre_p, NULL);
6045
6046 /* va_list pointer is aligned to PARM_BOUNDARY. If argument actually
6047 requires greater alignment, we must perform dynamic alignment. */
6048 if (boundary > align)
6049 {
6050 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist_tmp,
6051 fold_build_pointer_plus_hwi (valist_tmp, boundary - 1));
6052 gimplify_and_add (t, pre_p);
6053
6054 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist_tmp,
6055 fold_build2 (BIT_AND_EXPR, TREE_TYPE (valist),
6056 valist_tmp,
6057 build_int_cst (TREE_TYPE (valist), -boundary)));
6058 gimplify_and_add (t, pre_p);
6059 }
6060 else
6061 boundary = align;
6062
6063 /* If the actual alignment is less than the alignment of the type,
6064 adjust the type accordingly so that we don't assume strict alignment
6065 when dereferencing the pointer. */
6066 boundary *= BITS_PER_UNIT;
6067 if (boundary < TYPE_ALIGN (type))
6068 {
6069 type = build_variant_type_copy (type);
6070 TYPE_ALIGN (type) = boundary;
6071 }
6072
6073 /* Compute the rounded size of the type. */
6074 type_size = size_in_bytes (type);
6075 rounded_size = round_up (type_size, align);
6076
6077 /* Reduce rounded_size so it's sharable with the postqueue. */
6078 gimplify_expr (&rounded_size, pre_p, post_p, is_gimple_val, fb_rvalue);
6079
6080 /* Get AP. */
6081 addr = valist_tmp;
6082 if (PAD_VARARGS_DOWN && !integer_zerop (rounded_size))
6083 {
6084 /* Small args are padded downward. */
6085 t = fold_build2_loc (input_location, GT_EXPR, sizetype,
6086 rounded_size, size_int (align));
6087 t = fold_build3 (COND_EXPR, sizetype, t, size_zero_node,
6088 size_binop (MINUS_EXPR, rounded_size, type_size));
6089 addr = fold_build_pointer_plus (addr, t);
6090 }
6091
6092 /* Compute new value for AP. */
6093 t = fold_build_pointer_plus (valist_tmp, rounded_size);
6094 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist, t);
6095 gimplify_and_add (t, pre_p);
6096
6097 addr = fold_convert (build_pointer_type (type), addr);
6098
6099 if (indirect)
6100 addr = build_va_arg_indirect_ref (addr);
6101
6102 return build_va_arg_indirect_ref (addr);
6103 }
6104
6105 /* Implement TARGET_GIMPLIFY_VA_ARG_EXPR. */
6106
6107 static tree
6108 mips_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p,
6109 gimple_seq *post_p)
6110 {
6111 tree addr;
6112 bool indirect_p;
6113
6114 indirect_p = pass_by_reference (NULL, TYPE_MODE (type), type, 0);
6115 if (indirect_p)
6116 type = build_pointer_type (type);
6117
6118 if (!EABI_FLOAT_VARARGS_P)
6119 addr = mips_std_gimplify_va_arg_expr (valist, type, pre_p, post_p);
6120 else
6121 {
6122 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
6123 tree ovfl, top, off, align;
6124 HOST_WIDE_INT size, rsize, osize;
6125 tree t, u;
6126
6127 f_ovfl = TYPE_FIELDS (va_list_type_node);
6128 f_gtop = DECL_CHAIN (f_ovfl);
6129 f_ftop = DECL_CHAIN (f_gtop);
6130 f_goff = DECL_CHAIN (f_ftop);
6131 f_foff = DECL_CHAIN (f_goff);
6132
6133 /* Let:
6134
6135 TOP be the top of the GPR or FPR save area;
6136 OFF be the offset from TOP of the next register;
6137 ADDR_RTX be the address of the argument;
6138 SIZE be the number of bytes in the argument type;
6139 RSIZE be the number of bytes used to store the argument
6140 when it's in the register save area; and
6141 OSIZE be the number of bytes used to store it when it's
6142 in the stack overflow area.
6143
6144 The code we want is:
6145
6146 1: off &= -rsize; // round down
6147 2: if (off != 0)
6148 3: {
6149 4: addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0);
6150 5: off -= rsize;
6151 6: }
6152 7: else
6153 8: {
6154 9: ovfl = ((intptr_t) ovfl + osize - 1) & -osize;
6155 10: addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0);
6156 11: ovfl += osize;
6157 12: }
6158
6159 [1] and [9] can sometimes be optimized away. */
6160
6161 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
6162 NULL_TREE);
6163 size = int_size_in_bytes (type);
6164
6165 if (GET_MODE_CLASS (TYPE_MODE (type)) == MODE_FLOAT
6166 && GET_MODE_SIZE (TYPE_MODE (type)) <= UNITS_PER_FPVALUE)
6167 {
6168 top = build3 (COMPONENT_REF, TREE_TYPE (f_ftop),
6169 unshare_expr (valist), f_ftop, NULL_TREE);
6170 off = build3 (COMPONENT_REF, TREE_TYPE (f_foff),
6171 unshare_expr (valist), f_foff, NULL_TREE);
6172
6173 /* When va_start saves FPR arguments to the stack, each slot
6174 takes up UNITS_PER_HWFPVALUE bytes, regardless of the
6175 argument's precision. */
6176 rsize = UNITS_PER_HWFPVALUE;
6177
6178 /* Overflow arguments are padded to UNITS_PER_WORD bytes
6179 (= PARM_BOUNDARY bits). This can be different from RSIZE
6180 in two cases:
6181
6182 (1) On 32-bit targets when TYPE is a structure such as:
6183
6184 struct s { float f; };
6185
6186 Such structures are passed in paired FPRs, so RSIZE
6187 will be 8 bytes. However, the structure only takes
6188 up 4 bytes of memory, so OSIZE will only be 4.
6189
6190 (2) In combinations such as -mgp64 -msingle-float
6191 -fshort-double. Doubles passed in registers will then take
6192 up 4 (UNITS_PER_HWFPVALUE) bytes, but those passed on the
6193 stack take up UNITS_PER_WORD bytes. */
6194 osize = MAX (GET_MODE_SIZE (TYPE_MODE (type)), UNITS_PER_WORD);
6195 }
6196 else
6197 {
6198 top = build3 (COMPONENT_REF, TREE_TYPE (f_gtop),
6199 unshare_expr (valist), f_gtop, NULL_TREE);
6200 off = build3 (COMPONENT_REF, TREE_TYPE (f_goff),
6201 unshare_expr (valist), f_goff, NULL_TREE);
6202 rsize = (size + UNITS_PER_WORD - 1) & -UNITS_PER_WORD;
6203 if (rsize > UNITS_PER_WORD)
6204 {
6205 /* [1] Emit code for: off &= -rsize. */
6206 t = build2 (BIT_AND_EXPR, TREE_TYPE (off), unshare_expr (off),
6207 build_int_cst (TREE_TYPE (off), -rsize));
6208 gimplify_assign (unshare_expr (off), t, pre_p);
6209 }
6210 osize = rsize;
6211 }
6212
6213 /* [2] Emit code to branch if off == 0. */
6214 t = build2 (NE_EXPR, boolean_type_node, unshare_expr (off),
6215 build_int_cst (TREE_TYPE (off), 0));
6216 addr = build3 (COND_EXPR, ptr_type_node, t, NULL_TREE, NULL_TREE);
6217
6218 /* [5] Emit code for: off -= rsize. We do this as a form of
6219 post-decrement not available to C. */
6220 t = fold_convert (TREE_TYPE (off), build_int_cst (NULL_TREE, rsize));
6221 t = build2 (POSTDECREMENT_EXPR, TREE_TYPE (off), off, t);
6222
6223 /* [4] Emit code for:
6224 addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0). */
6225 t = fold_convert (sizetype, t);
6226 t = fold_build1 (NEGATE_EXPR, sizetype, t);
6227 t = fold_build_pointer_plus (top, t);
6228 if (BYTES_BIG_ENDIAN && rsize > size)
6229 t = fold_build_pointer_plus_hwi (t, rsize - size);
6230 COND_EXPR_THEN (addr) = t;
6231
6232 if (osize > UNITS_PER_WORD)
6233 {
6234 /* [9] Emit: ovfl = ((intptr_t) ovfl + osize - 1) & -osize. */
6235 t = fold_build_pointer_plus_hwi (unshare_expr (ovfl), osize - 1);
6236 u = build_int_cst (TREE_TYPE (t), -osize);
6237 t = build2 (BIT_AND_EXPR, TREE_TYPE (t), t, u);
6238 align = build2 (MODIFY_EXPR, TREE_TYPE (ovfl),
6239 unshare_expr (ovfl), t);
6240 }
6241 else
6242 align = NULL;
6243
6244 /* [10, 11] Emit code for:
6245 addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0)
6246 ovfl += osize. */
6247 u = fold_convert (TREE_TYPE (ovfl), build_int_cst (NULL_TREE, osize));
6248 t = build2 (POSTINCREMENT_EXPR, TREE_TYPE (ovfl), ovfl, u);
6249 if (BYTES_BIG_ENDIAN && osize > size)
6250 t = fold_build_pointer_plus_hwi (t, osize - size);
6251
6252 /* String [9] and [10, 11] together. */
6253 if (align)
6254 t = build2 (COMPOUND_EXPR, TREE_TYPE (t), align, t);
6255 COND_EXPR_ELSE (addr) = t;
6256
6257 addr = fold_convert (build_pointer_type (type), addr);
6258 addr = build_va_arg_indirect_ref (addr);
6259 }
6260
6261 if (indirect_p)
6262 addr = build_va_arg_indirect_ref (addr);
6263
6264 return addr;
6265 }
6266 \f
6267 /* Declare a unique, locally-binding function called NAME, then start
6268 its definition. */
6269
6270 static void
6271 mips_start_unique_function (const char *name)
6272 {
6273 tree decl;
6274
6275 decl = build_decl (BUILTINS_LOCATION, FUNCTION_DECL,
6276 get_identifier (name),
6277 build_function_type_list (void_type_node, NULL_TREE));
6278 DECL_RESULT (decl) = build_decl (BUILTINS_LOCATION, RESULT_DECL,
6279 NULL_TREE, void_type_node);
6280 TREE_PUBLIC (decl) = 1;
6281 TREE_STATIC (decl) = 1;
6282
6283 cgraph_node::create (decl)->set_comdat_group (DECL_ASSEMBLER_NAME (decl));
6284
6285 targetm.asm_out.unique_section (decl, 0);
6286 switch_to_section (get_named_section (decl, NULL, 0));
6287
6288 targetm.asm_out.globalize_label (asm_out_file, name);
6289 fputs ("\t.hidden\t", asm_out_file);
6290 assemble_name (asm_out_file, name);
6291 putc ('\n', asm_out_file);
6292 }
6293
6294 /* Start a definition of function NAME. MIPS16_P indicates whether the
6295 function contains MIPS16 code. */
6296
6297 static void
6298 mips_start_function_definition (const char *name, bool mips16_p)
6299 {
6300 if (mips16_p)
6301 fprintf (asm_out_file, "\t.set\tmips16\n");
6302 else
6303 fprintf (asm_out_file, "\t.set\tnomips16\n");
6304
6305 if (TARGET_MICROMIPS)
6306 fprintf (asm_out_file, "\t.set\tmicromips\n");
6307 #ifdef HAVE_GAS_MICROMIPS
6308 else
6309 fprintf (asm_out_file, "\t.set\tnomicromips\n");
6310 #endif
6311
6312 if (!flag_inhibit_size_directive)
6313 {
6314 fputs ("\t.ent\t", asm_out_file);
6315 assemble_name (asm_out_file, name);
6316 fputs ("\n", asm_out_file);
6317 }
6318
6319 ASM_OUTPUT_TYPE_DIRECTIVE (asm_out_file, name, "function");
6320
6321 /* Start the definition proper. */
6322 assemble_name (asm_out_file, name);
6323 fputs (":\n", asm_out_file);
6324 }
6325
6326 /* End a function definition started by mips_start_function_definition. */
6327
6328 static void
6329 mips_end_function_definition (const char *name)
6330 {
6331 if (!flag_inhibit_size_directive)
6332 {
6333 fputs ("\t.end\t", asm_out_file);
6334 assemble_name (asm_out_file, name);
6335 fputs ("\n", asm_out_file);
6336 }
6337 }
6338
6339 /* If *STUB_PTR points to a stub, output a comdat-style definition for it,
6340 then free *STUB_PTR. */
6341
6342 static void
6343 mips_finish_stub (mips_one_only_stub **stub_ptr)
6344 {
6345 mips_one_only_stub *stub = *stub_ptr;
6346 if (!stub)
6347 return;
6348
6349 const char *name = stub->get_name ();
6350 mips_start_unique_function (name);
6351 mips_start_function_definition (name, false);
6352 stub->output_body ();
6353 mips_end_function_definition (name);
6354 delete stub;
6355 *stub_ptr = 0;
6356 }
6357 \f
6358 /* Return true if calls to X can use R_MIPS_CALL* relocations. */
6359
6360 static bool
6361 mips_ok_for_lazy_binding_p (rtx x)
6362 {
6363 return (TARGET_USE_GOT
6364 && GET_CODE (x) == SYMBOL_REF
6365 && !SYMBOL_REF_BIND_NOW_P (x)
6366 && !mips_symbol_binds_local_p (x));
6367 }
6368
6369 /* Load function address ADDR into register DEST. TYPE is as for
6370 mips_expand_call. Return true if we used an explicit lazy-binding
6371 sequence. */
6372
6373 static bool
6374 mips_load_call_address (enum mips_call_type type, rtx dest, rtx addr)
6375 {
6376 /* If we're generating PIC, and this call is to a global function,
6377 try to allow its address to be resolved lazily. This isn't
6378 possible for sibcalls when $gp is call-saved because the value
6379 of $gp on entry to the stub would be our caller's gp, not ours. */
6380 if (TARGET_EXPLICIT_RELOCS
6381 && !(type == MIPS_CALL_SIBCALL && TARGET_CALL_SAVED_GP)
6382 && mips_ok_for_lazy_binding_p (addr))
6383 {
6384 addr = mips_got_load (dest, addr, SYMBOL_GOTOFF_CALL);
6385 emit_insn (gen_rtx_SET (VOIDmode, dest, addr));
6386 return true;
6387 }
6388 else
6389 {
6390 mips_emit_move (dest, addr);
6391 return false;
6392 }
6393 }
6394 \f
6395 /* Each locally-defined hard-float MIPS16 function has a local symbol
6396 associated with it. This hash table maps the function symbol (FUNC)
6397 to the local symbol (LOCAL). */
6398 struct GTY(()) mips16_local_alias {
6399 rtx func;
6400 rtx local;
6401 };
6402 static GTY ((param_is (struct mips16_local_alias))) htab_t mips16_local_aliases;
6403
6404 /* Hash table callbacks for mips16_local_aliases. */
6405
6406 static hashval_t
6407 mips16_local_aliases_hash (const void *entry)
6408 {
6409 const struct mips16_local_alias *alias;
6410
6411 alias = (const struct mips16_local_alias *) entry;
6412 return htab_hash_string (XSTR (alias->func, 0));
6413 }
6414
6415 static int
6416 mips16_local_aliases_eq (const void *entry1, const void *entry2)
6417 {
6418 const struct mips16_local_alias *alias1, *alias2;
6419
6420 alias1 = (const struct mips16_local_alias *) entry1;
6421 alias2 = (const struct mips16_local_alias *) entry2;
6422 return rtx_equal_p (alias1->func, alias2->func);
6423 }
6424
6425 /* FUNC is the symbol for a locally-defined hard-float MIPS16 function.
6426 Return a local alias for it, creating a new one if necessary. */
6427
6428 static rtx
6429 mips16_local_alias (rtx func)
6430 {
6431 struct mips16_local_alias *alias, tmp_alias;
6432 void **slot;
6433
6434 /* Create the hash table if this is the first call. */
6435 if (mips16_local_aliases == NULL)
6436 mips16_local_aliases = htab_create_ggc (37, mips16_local_aliases_hash,
6437 mips16_local_aliases_eq, NULL);
6438
6439 /* Look up the function symbol, creating a new entry if need be. */
6440 tmp_alias.func = func;
6441 slot = htab_find_slot (mips16_local_aliases, &tmp_alias, INSERT);
6442 gcc_assert (slot != NULL);
6443
6444 alias = (struct mips16_local_alias *) *slot;
6445 if (alias == NULL)
6446 {
6447 const char *func_name, *local_name;
6448 rtx local;
6449
6450 /* Create a new SYMBOL_REF for the local symbol. The choice of
6451 __fn_local_* is based on the __fn_stub_* names that we've
6452 traditionally used for the non-MIPS16 stub. */
6453 func_name = targetm.strip_name_encoding (XSTR (func, 0));
6454 local_name = ACONCAT (("__fn_local_", func_name, NULL));
6455 local = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (local_name));
6456 SYMBOL_REF_FLAGS (local) = SYMBOL_REF_FLAGS (func) | SYMBOL_FLAG_LOCAL;
6457
6458 /* Create a new structure to represent the mapping. */
6459 alias = ggc_alloc<struct mips16_local_alias> ();
6460 alias->func = func;
6461 alias->local = local;
6462 *slot = alias;
6463 }
6464 return alias->local;
6465 }
6466 \f
6467 /* A chained list of functions for which mips16_build_call_stub has already
6468 generated a stub. NAME is the name of the function and FP_RET_P is true
6469 if the function returns a value in floating-point registers. */
6470 struct mips16_stub {
6471 struct mips16_stub *next;
6472 char *name;
6473 bool fp_ret_p;
6474 };
6475 static struct mips16_stub *mips16_stubs;
6476
6477 /* Return the two-character string that identifies floating-point
6478 return mode MODE in the name of a MIPS16 function stub. */
6479
6480 static const char *
6481 mips16_call_stub_mode_suffix (enum machine_mode mode)
6482 {
6483 if (mode == SFmode)
6484 return "sf";
6485 else if (mode == DFmode)
6486 return "df";
6487 else if (mode == SCmode)
6488 return "sc";
6489 else if (mode == DCmode)
6490 return "dc";
6491 else if (mode == V2SFmode)
6492 return "df";
6493 else
6494 gcc_unreachable ();
6495 }
6496
6497 /* Write instructions to move a 32-bit value between general register
6498 GPREG and floating-point register FPREG. DIRECTION is 't' to move
6499 from GPREG to FPREG and 'f' to move in the opposite direction. */
6500
6501 static void
6502 mips_output_32bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
6503 {
6504 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6505 reg_names[gpreg], reg_names[fpreg]);
6506 }
6507
6508 /* Likewise for 64-bit values. */
6509
6510 static void
6511 mips_output_64bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
6512 {
6513 if (TARGET_64BIT)
6514 fprintf (asm_out_file, "\tdm%cc1\t%s,%s\n", direction,
6515 reg_names[gpreg], reg_names[fpreg]);
6516 else if (TARGET_FLOAT64)
6517 {
6518 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6519 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
6520 fprintf (asm_out_file, "\tm%chc1\t%s,%s\n", direction,
6521 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg]);
6522 }
6523 else
6524 {
6525 /* Move the least-significant word. */
6526 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6527 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
6528 /* ...then the most significant word. */
6529 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6530 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg + 1]);
6531 }
6532 }
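
/* For example, with DIRECTION 'f', moving $f12 into the $4/$5 pair on
   a big-endian -mfp32 target emits (a sketch, not verbatim output):

        mfc1    $5,$f12         # least-significant word
        mfc1    $4,$f13         # most-significant word

   A TARGET_FLOAT64 target instead uses mfc1/mfhc1 on $f12 alone, and
   a TARGET_64BIT target uses a single dmfc1. */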
6533
6534 /* Write out code to move floating-point arguments into or out of
6535 general registers. FP_CODE is the code describing which arguments
6536 are present (see the comment above the definition of CUMULATIVE_ARGS
6537 in mips.h). DIRECTION is as for mips_output_32bit_xfer. */
6538
6539 static void
6540 mips_output_args_xfer (int fp_code, char direction)
6541 {
6542 unsigned int gparg, fparg, f;
6543 CUMULATIVE_ARGS cum;
6544
6545 /* This code only works for o32 and o64. */
6546 gcc_assert (TARGET_OLDABI);
6547
6548 mips_init_cumulative_args (&cum, NULL);
6549
6550 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
6551 {
6552 enum machine_mode mode;
6553 struct mips_arg_info info;
6554
6555 if ((f & 3) == 1)
6556 mode = SFmode;
6557 else if ((f & 3) == 2)
6558 mode = DFmode;
6559 else
6560 gcc_unreachable ();
6561
6562 mips_get_arg_info (&info, &cum, mode, NULL, true);
6563 gparg = mips_arg_regno (&info, false);
6564 fparg = mips_arg_regno (&info, true);
6565
6566 if (mode == SFmode)
6567 mips_output_32bit_xfer (direction, gparg, fparg);
6568 else
6569 mips_output_64bit_xfer (direction, gparg, fparg);
6570
6571 mips_function_arg_advance (pack_cumulative_args (&cum), mode, NULL, true);
6572 }
6573 }
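
/* Continuing the FP_CODE example: for fp_code 0x9, i.e. (float, double)
   under o32, DIRECTION 'f' emits roughly

        mfc1    $4,$f12         # the float
        mfc1    $6,$f14         # low word of the double (little-endian
        mfc1    $7,$f15         # -mfp32; the pair skips $5 for alignment)

   Illustrative only; exact registers depend on endianness and the
   floating-point mode. */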
6574
6575 /* Write a MIPS16 stub for the current function. This stub is used
6576 for functions which take arguments in the floating-point registers.
6577 It is normal-mode code that moves the floating-point arguments
6578 into the general registers and then jumps to the MIPS16 code. */
6579
6580 static void
6581 mips16_build_function_stub (void)
6582 {
6583 const char *fnname, *alias_name, *separator;
6584 char *secname, *stubname;
6585 tree stubdecl;
6586 unsigned int f;
6587 rtx symbol, alias;
6588
6589 /* Create the name of the stub, and its unique section. */
6590 symbol = XEXP (DECL_RTL (current_function_decl), 0);
6591 alias = mips16_local_alias (symbol);
6592
6593 fnname = targetm.strip_name_encoding (XSTR (symbol, 0));
6594 alias_name = targetm.strip_name_encoding (XSTR (alias, 0));
6595 secname = ACONCAT ((".mips16.fn.", fnname, NULL));
6596 stubname = ACONCAT (("__fn_stub_", fnname, NULL));
6597
6598 /* Build a decl for the stub. */
6599 stubdecl = build_decl (BUILTINS_LOCATION,
6600 FUNCTION_DECL, get_identifier (stubname),
6601 build_function_type_list (void_type_node, NULL_TREE));
6602 set_decl_section_name (stubdecl, secname);
6603 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION,
6604 RESULT_DECL, NULL_TREE, void_type_node);
6605
6606 /* Output a comment. */
6607 fprintf (asm_out_file, "\t# Stub function for %s (",
6608 current_function_name ());
6609 separator = "";
6610 for (f = (unsigned int) crtl->args.info.fp_code; f != 0; f >>= 2)
6611 {
6612 fprintf (asm_out_file, "%s%s", separator,
6613 (f & 3) == 1 ? "float" : "double");
6614 separator = ", ";
6615 }
6616 fprintf (asm_out_file, ")\n");
6617
6618 /* Start the function definition. */
6619 assemble_start_function (stubdecl, stubname);
6620 mips_start_function_definition (stubname, false);
6621
6622 /* If generating pic2 code, either set up the global pointer or
6623 switch to pic0. */
6624 if (TARGET_ABICALLS_PIC2)
6625 {
6626 if (TARGET_ABSOLUTE_ABICALLS)
6627 fprintf (asm_out_file, "\t.option\tpic0\n");
6628 else
6629 {
6630 output_asm_insn ("%(.cpload\t%^%)", NULL);
6631 /* Emit an R_MIPS_NONE relocation to tell the linker what the
6632 target function is. Use a local GOT access when loading the
6633 symbol, to avoid creating GOT entries for stubs that are
6634 never needed. */
6635 output_asm_insn (".reloc\t0,R_MIPS_NONE,%0", &symbol);
6636 symbol = alias;
6637 }
6638 }
6639
6640 /* Load the address of the MIPS16 function into $25. Do this first so
6641 that targets with coprocessor interlocks can use an MFC1 to fill the
6642 delay slot. */
6643 output_asm_insn ("la\t%^,%0", &symbol);
6644
6645 /* Move the arguments from floating-point registers to general registers. */
6646 mips_output_args_xfer (crtl->args.info.fp_code, 'f');
6647
6648 /* Jump to the MIPS16 function. */
6649 output_asm_insn ("jr\t%^", NULL);
6650
6651 if (TARGET_ABICALLS_PIC2 && TARGET_ABSOLUTE_ABICALLS)
6652 fprintf (asm_out_file, "\t.option\tpic2\n");
6653
6654 mips_end_function_definition (stubname);
6655
6656 /* If the linker needs to create a dynamic symbol for the target
6657 function, it will associate the symbol with the stub (which,
6658 unlike the target function, follows the proper calling conventions).
6659 It is therefore useful to have a local alias for the target function,
6660 so that it can still be identified as MIPS16 code. As an optimization,
6661 this symbol can also be used for indirect MIPS16 references from
6662 within this file. */
6663 ASM_OUTPUT_DEF (asm_out_file, alias_name, fnname);
6664
6665 switch_to_section (function_section (current_function_decl));
6666 }
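
/* A sketch of the stub emitted above for a MIPS16 function
   "double f (double);" on a non-PIC little-endian o32 -mfp32 target
   (assembly shown for illustration; actual output varies with options):

        .section .mips16.fn.f
        .set    nomips16
   __fn_stub_f:
        la      $25,f
        mfc1    $4,$f12         # move the double into $4/$5
        mfc1    $5,$f13
        jr      $25

   followed by a local alias definition equivalent to
   "__fn_local_f = f". */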
6667
6668 /* The current function is a MIPS16 function that returns a value in an FPR.
6669 Copy the return value from its soft-float to its hard-float location.
6670 libgcc2 has special non-MIPS16 helper functions for each case. */
6671
6672 static void
6673 mips16_copy_fpr_return_value (void)
6674 {
6675 rtx fn, insn, retval;
6676 tree return_type;
6677 enum machine_mode return_mode;
6678 const char *name;
6679
6680 return_type = DECL_RESULT (current_function_decl);
6681 return_mode = DECL_MODE (return_type);
6682
6683 name = ACONCAT (("__mips16_ret_",
6684 mips16_call_stub_mode_suffix (return_mode),
6685 NULL));
6686 fn = mips16_stub_function (name);
6687
6688 /* The function takes arguments in $2 (and possibly $3), so calls
6689 to it cannot be lazily bound. */
6690 SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_BIND_NOW;
6691
6692 /* Model the call as something that takes the GPR return value as
6693 argument and returns an "updated" value. */
6694 retval = gen_rtx_REG (return_mode, GP_RETURN);
6695 insn = mips_expand_call (MIPS_CALL_EPILOGUE, retval, fn,
6696 const0_rtx, NULL_RTX, false);
6697 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), retval);
6698 }
6699
6700 /* Consider building a stub for a MIPS16 call to function *FN_PTR.
6701 RETVAL is the location of the return value, or null if this is
6702 a "call" rather than a "call_value". ARGS_SIZE is the size of the
6703 arguments and FP_CODE is the code built by mips_function_arg;
6704 see the comment before the fp_code field in CUMULATIVE_ARGS for details.
6705
6706 There are three alternatives:
6707
6708 - If a stub was needed, emit the call and return the call insn itself.
6709
6710 - If we can avoid using a stub by redirecting the call, set *FN_PTR
6711 to the new target and return null.
6712
6713 - If *FN_PTR doesn't need a stub, return null and leave *FN_PTR
6714 unmodified.
6715
6716 A stub is needed for calls to functions that, in normal mode,
6717 receive arguments in FPRs or return values in FPRs. The stub
6718 copies the arguments from their soft-float positions to their
6719 hard-float positions, calls the real function, then copies the
6720 return value from its hard-float position to its soft-float
6721 position.
6722
6723 We can emit a JAL to *FN_PTR even when *FN_PTR might need a stub.
6724 If *FN_PTR turns out to be a non-MIPS16 function, the linker
6725 automatically redirects the JAL to the stub; otherwise the JAL
6726 continues to call FN directly. */
6727
6728 static rtx_insn *
6729 mips16_build_call_stub (rtx retval, rtx *fn_ptr, rtx args_size, int fp_code)
6730 {
6731 const char *fnname;
6732 bool fp_ret_p;
6733 struct mips16_stub *l;
6734 rtx_insn *insn;
6735 rtx pattern, fn;
6736
6737 /* We don't need to do anything if we aren't in MIPS16 mode, or if
6738 we were invoked with the -msoft-float option. */
6739 if (!TARGET_MIPS16 || TARGET_SOFT_FLOAT_ABI)
6740 return NULL;
6741
6742 /* Figure out whether the value might come back in a floating-point
6743 register. */
6744 fp_ret_p = retval && mips_return_mode_in_fpr_p (GET_MODE (retval));
6745
6746 /* We don't need to do anything if there were no floating-point
6747 arguments and the value will not be returned in a floating-point
6748 register. */
6749 if (fp_code == 0 && !fp_ret_p)
6750 return NULL;
6751
6752 /* We don't need to do anything if this is a call to a special
6753 MIPS16 support function. */
6754 fn = *fn_ptr;
6755 if (mips16_stub_function_p (fn))
6756 return NULL;
6757
6758 /* If we're calling a locally-defined MIPS16 function, we know that
6759 it will return values in both the "soft-float" and "hard-float"
6760 registers. There is no need to use a stub to move the latter
6761 to the former. */
6762 if (fp_code == 0 && mips16_local_function_p (fn))
6763 return NULL;
6764
6765 /* This code will only work for the o32 and o64 ABIs.  The other ABIs
6766 require more sophisticated support. */
6767 gcc_assert (TARGET_OLDABI);
6768
6769 /* If we're calling via a function pointer, use one of the magic
6770 libgcc.a stubs provided for each (FP_CODE, FP_RET_P) combination.
6771 Each stub expects the function address to arrive in register $2. */
6772 if (GET_CODE (fn) != SYMBOL_REF
6773 || !call_insn_operand (fn, VOIDmode))
6774 {
6775 char buf[30];
6776 rtx stub_fn, addr;
6777 rtx_insn *insn;
6778 bool lazy_p;
6779
6780 /* If this is a locally-defined and locally-binding function,
6781 avoid the stub by calling the local alias directly. */
6782 if (mips16_local_function_p (fn))
6783 {
6784 *fn_ptr = mips16_local_alias (fn);
6785 return NULL;
6786 }
6787
6788 /* Create a SYMBOL_REF for the libgcc.a function. */
6789 if (fp_ret_p)
6790 sprintf (buf, "__mips16_call_stub_%s_%d",
6791 mips16_call_stub_mode_suffix (GET_MODE (retval)),
6792 fp_code);
6793 else
6794 sprintf (buf, "__mips16_call_stub_%d", fp_code);
6795 stub_fn = mips16_stub_function (buf);
6796
6797 /* The function uses $2 as an argument, so calls to it
6798 cannot be lazily bound. */
6799 SYMBOL_REF_FLAGS (stub_fn) |= SYMBOL_FLAG_BIND_NOW;
6800
6801 /* Load the target function into $2. */
6802 addr = gen_rtx_REG (Pmode, GP_REG_FIRST + 2);
6803 lazy_p = mips_load_call_address (MIPS_CALL_NORMAL, addr, fn);
6804
6805 /* Emit the call. */
6806 insn = mips_expand_call (MIPS_CALL_NORMAL, retval, stub_fn,
6807 args_size, NULL_RTX, lazy_p);
6808
6809 /* Tell GCC that this call does indeed use the value of $2. */
6810 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), addr);
6811
6812 /* If we are handling a floating-point return value, we need to
6813 save $18 in the function prologue. Putting a note on the
6814 call will mean that df_regs_ever_live_p ($18) will be true if the
6815 call is not eliminated, and we can check that in the prologue
6816 code. */
6817 if (fp_ret_p)
6818 CALL_INSN_FUNCTION_USAGE (insn) =
6819 gen_rtx_EXPR_LIST (VOIDmode,
6820 gen_rtx_CLOBBER (VOIDmode,
6821 gen_rtx_REG (word_mode, 18)),
6822 CALL_INSN_FUNCTION_USAGE (insn));
6823
6824 return insn;
6825 }
6826
6827 /* We know the function we are going to call. If we have already
6828 built a stub, we don't need to do anything further. */
6829 fnname = targetm.strip_name_encoding (XSTR (fn, 0));
6830 for (l = mips16_stubs; l != NULL; l = l->next)
6831 if (strcmp (l->name, fnname) == 0)
6832 break;
6833
6834 if (l == NULL)
6835 {
6836 const char *separator;
6837 char *secname, *stubname;
6838 tree stubid, stubdecl;
6839 unsigned int f;
6840
6841 /* If the function does not return in FPRs, the special stub
6842 section is named
6843 .mips16.call.FNNAME
6844
6845 If the function does return in FPRs, the stub section is named
6846 .mips16.call.fp.FNNAME
6847
6848 Build a decl for the stub. */
6849 secname = ACONCAT ((".mips16.call.", fp_ret_p ? "fp." : "",
6850 fnname, NULL));
6851 stubname = ACONCAT (("__call_stub_", fp_ret_p ? "fp_" : "",
6852 fnname, NULL));
6853 stubid = get_identifier (stubname);
6854 stubdecl = build_decl (BUILTINS_LOCATION,
6855 FUNCTION_DECL, stubid,
6856 build_function_type_list (void_type_node,
6857 NULL_TREE));
6858 set_decl_section_name (stubdecl, secname);
6859 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION,
6860 RESULT_DECL, NULL_TREE,
6861 void_type_node);
6862
6863 /* Output a comment. */
6864 fprintf (asm_out_file, "\t# Stub function to call %s%s (",
6865 (fp_ret_p
6866 ? (GET_MODE (retval) == SFmode ? "float " : "double ")
6867 : ""),
6868 fnname);
6869 separator = "";
6870 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
6871 {
6872 fprintf (asm_out_file, "%s%s", separator,
6873 (f & 3) == 1 ? "float" : "double");
6874 separator = ", ";
6875 }
6876 fprintf (asm_out_file, ")\n");
6877
6878 /* Start the function definition. */
6879 assemble_start_function (stubdecl, stubname);
6880 mips_start_function_definition (stubname, false);
6881
6882 if (fp_ret_p)
6883 {
6884 fprintf (asm_out_file, "\t.cfi_startproc\n");
6885
6886 /* Create a fake CFA 4 bytes below the stack pointer.
6887 This works around unwinders (like libgcc's) that expect
6888 the CFA for non-signal frames to be unique. */
6889 fprintf (asm_out_file, "\t.cfi_def_cfa 29,-4\n");
6890
6891 /* "Save" $sp in itself so we don't use the fake CFA.
6892 This is: DW_CFA_val_expression r29, { DW_OP_reg29 }. */
6893 fprintf (asm_out_file, "\t.cfi_escape 0x16,29,1,0x6d\n");
6894 }
6895 else
6896 {
6897 /* Load the address of the MIPS16 function into $25. Do this
6898 first so that targets with coprocessor interlocks can use
6899 an MFC1 to fill the delay slot. */
6900 if (TARGET_EXPLICIT_RELOCS)
6901 {
6902 output_asm_insn ("lui\t%^,%%hi(%0)", &fn);
6903 output_asm_insn ("addiu\t%^,%^,%%lo(%0)", &fn);
6904 }
6905 else
6906 output_asm_insn ("la\t%^,%0", &fn);
6907 }
6908
6909 /* Move the arguments from general registers to floating-point
6910 registers. */
6911 mips_output_args_xfer (fp_code, 't');
6912
6913 if (fp_ret_p)
6914 {
6915 /* Save the return address in $18 and call the non-MIPS16 function.
6916 The stub's caller knows that $18 might be clobbered, even though
6917 $18 is usually a call-saved register. */
6918 fprintf (asm_out_file, "\tmove\t%s,%s\n",
6919 reg_names[GP_REG_FIRST + 18], reg_names[RETURN_ADDR_REGNUM]);
6920 output_asm_insn (MIPS_CALL ("jal", &fn, 0, -1), &fn);
6921 fprintf (asm_out_file, "\t.cfi_register 31,18\n");
6922
6923 /* Move the result from floating-point registers to
6924 general registers. */
6925 switch (GET_MODE (retval))
6926 {
6927 case SCmode:
6928 mips_output_32bit_xfer ('f', GP_RETURN + TARGET_BIG_ENDIAN,
6929 TARGET_BIG_ENDIAN
6930 ? FP_REG_FIRST + MAX_FPRS_PER_FMT
6931 : FP_REG_FIRST);
6932 mips_output_32bit_xfer ('f', GP_RETURN + TARGET_LITTLE_ENDIAN,
6933 TARGET_LITTLE_ENDIAN
6934 ? FP_REG_FIRST + MAX_FPRS_PER_FMT
6935 : FP_REG_FIRST);
6936 if (GET_MODE (retval) == SCmode && TARGET_64BIT)
6937 {
6938 /* On 64-bit targets, complex floats are returned in
6939 a single GPR, such that "sd" on a suitably-aligned
6940 target would store the value correctly. */
6941 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n",
6942 reg_names[GP_RETURN + TARGET_BIG_ENDIAN],
6943 reg_names[GP_RETURN + TARGET_BIG_ENDIAN]);
6944 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n",
6945 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN],
6946 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN]);
6947 fprintf (asm_out_file, "\tdsrl\t%s,%s,32\n",
6948 reg_names[GP_RETURN + TARGET_BIG_ENDIAN],
6949 reg_names[GP_RETURN + TARGET_BIG_ENDIAN]);
6950 fprintf (asm_out_file, "\tor\t%s,%s,%s\n",
6951 reg_names[GP_RETURN],
6952 reg_names[GP_RETURN],
6953 reg_names[GP_RETURN + 1]);
6954 }
6955 break;
6956
6957 case SFmode:
6958 mips_output_32bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6959 break;
6960
6961 case DCmode:
6962 mips_output_64bit_xfer ('f', GP_RETURN + (8 / UNITS_PER_WORD),
6963 FP_REG_FIRST + MAX_FPRS_PER_FMT);
6964 /* Fall through. */
6965 case DFmode:
6966 case V2SFmode:
6967 mips_output_64bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6968 break;
6969
6970 default:
6971 gcc_unreachable ();
6972 }
6973 fprintf (asm_out_file, "\tjr\t%s\n", reg_names[GP_REG_FIRST + 18]);
6974 fprintf (asm_out_file, "\t.cfi_endproc\n");
6975 }
6976 else
6977 {
6978 /* Jump to the previously-loaded address. */
6979 output_asm_insn ("jr\t%^", NULL);
6980 }
6981
6982 #ifdef ASM_DECLARE_FUNCTION_SIZE
6983 ASM_DECLARE_FUNCTION_SIZE (asm_out_file, stubname, stubdecl);
6984 #endif
6985
6986 mips_end_function_definition (stubname);
6987
6988 /* Record this stub. */
6989 l = XNEW (struct mips16_stub);
6990 l->name = xstrdup (fnname);
6991 l->fp_ret_p = fp_ret_p;
6992 l->next = mips16_stubs;
6993 mips16_stubs = l;
6994 }
6995
6996 /* If we expect a floating-point return value, but we've built a
6997 stub which does not expect one, then we're in trouble. We can't
6998 use the existing stub, because it won't handle the floating-point
6999 value. We can't build a new stub, because the linker won't know
7000 which stub to use for the various calls in this object file.
7001 Fortunately, this case is illegal, since it means that a function
7002 was declared in two different ways in a single compilation. */
7003 if (fp_ret_p && !l->fp_ret_p)
7004 error ("cannot handle inconsistent calls to %qs", fnname);
7005
7006 if (retval == NULL_RTX)
7007 pattern = gen_call_internal_direct (fn, args_size);
7008 else
7009 pattern = gen_call_value_internal_direct (retval, fn, args_size);
7010 insn = mips_emit_call_insn (pattern, fn, fn, false);
7011
7012 /* If we are calling a stub which handles a floating-point return
7013 value, we need to arrange to save $18 in the prologue. We do this
7014 by marking the function call as using the register. The prologue
7015 will later see that it is used, and emit code to save it. */
7016 if (fp_ret_p)
7017 CALL_INSN_FUNCTION_USAGE (insn) =
7018 gen_rtx_EXPR_LIST (VOIDmode,
7019 gen_rtx_CLOBBER (VOIDmode,
7020 gen_rtx_REG (word_mode, 18)),
7021 CALL_INSN_FUNCTION_USAGE (insn));
7022
7023 return insn;
7024 }
7025 \f
7026 /* Expand a call of type TYPE. RESULT is where the result will go (null
7027 for "call"s and "sibcall"s), ADDR is the address of the function,
7028 ARGS_SIZE is the size of the arguments and AUX is the value passed
7029 to us by mips_function_arg. LAZY_P is true if this call already
7030 involves a lazily-bound function address (such as when calling
7031 functions through a MIPS16 hard-float stub).
7032
7033 Return the call itself. */
7034
7035 rtx_insn *
7036 mips_expand_call (enum mips_call_type type, rtx result, rtx addr,
7037 rtx args_size, rtx aux, bool lazy_p)
7038 {
7039 rtx orig_addr, pattern;
7040 rtx_insn *insn;
7041 int fp_code;
7042
7043 fp_code = aux == 0 ? 0 : (int) GET_MODE (aux);
7044 insn = mips16_build_call_stub (result, &addr, args_size, fp_code);
7045 if (insn)
7046 {
7047 gcc_assert (!lazy_p && type == MIPS_CALL_NORMAL);
7048 return insn;
7049 }
7050
7051 orig_addr = addr;
7052 if (!call_insn_operand (addr, VOIDmode))
7053 {
7054 if (type == MIPS_CALL_EPILOGUE)
7055 addr = MIPS_EPILOGUE_TEMP (Pmode);
7056 else
7057 addr = gen_reg_rtx (Pmode);
7058 lazy_p |= mips_load_call_address (type, addr, orig_addr);
7059 }
7060
7061 if (result == 0)
7062 {
7063 rtx (*fn) (rtx, rtx);
7064
7065 if (type == MIPS_CALL_SIBCALL)
7066 fn = gen_sibcall_internal;
7067 else
7068 fn = gen_call_internal;
7069
7070 pattern = fn (addr, args_size);
7071 }
7072 else if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 2)
7073 {
7074 /* Handle return values created by mips_return_fpr_pair. */
7075 rtx (*fn) (rtx, rtx, rtx, rtx);
7076 rtx reg1, reg2;
7077
7078 if (type == MIPS_CALL_SIBCALL)
7079 fn = gen_sibcall_value_multiple_internal;
7080 else
7081 fn = gen_call_value_multiple_internal;
7082
7083 reg1 = XEXP (XVECEXP (result, 0, 0), 0);
7084 reg2 = XEXP (XVECEXP (result, 0, 1), 0);
7085 pattern = fn (reg1, addr, args_size, reg2);
7086 }
7087 else
7088 {
7089 rtx (*fn) (rtx, rtx, rtx);
7090
7091 if (type == MIPS_CALL_SIBCALL)
7092 fn = gen_sibcall_value_internal;
7093 else
7094 fn = gen_call_value_internal;
7095
7096 /* Handle return values created by mips_return_fpr_single. */
7097 if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 1)
7098 result = XEXP (XVECEXP (result, 0, 0), 0);
7099 pattern = fn (result, addr, args_size);
7100 }
7101
7102 return mips_emit_call_insn (pattern, orig_addr, addr, lazy_p);
7103 }
7104
7105 /* Split call instruction INSN into a $gp-clobbering call and
7106 (where necessary) an instruction to restore $gp from its save slot.
7107 CALL_PATTERN is the pattern of the new call. */
7108
7109 void
7110 mips_split_call (rtx insn, rtx call_pattern)
7111 {
7112 emit_call_insn (call_pattern);
7113 if (!find_reg_note (insn, REG_NORETURN, 0))
7114 mips_restore_gp_from_cprestore_slot (gen_rtx_REG (Pmode,
7115 POST_CALL_TMP_REG));
7116 }
7117
7118 /* Return true if a call to DECL may need to use JALX. */
7119
7120 static bool
7121 mips_call_may_need_jalx_p (tree decl)
7122 {
7123 /* If the current translation unit would use a different mode for DECL,
7124 assume that the call needs JALX. */
7125 if (mips_get_compress_mode (decl) != TARGET_COMPRESSION)
7126 return true;
7127
7128 /* mips_get_compress_mode is always accurate for locally-binding
7129 functions in the current translation unit. */
7130 if (!DECL_EXTERNAL (decl) && targetm.binds_local_p (decl))
7131 return false;
7132
7133 /* When -minterlink-compressed is in effect, assume that functions
7134 could use a different encoding mode unless an attribute explicitly
7135 tells us otherwise. */
7136 if (TARGET_INTERLINK_COMPRESSED)
7137 {
7138 if (!TARGET_COMPRESSION
7139 	      && mips_get_compress_off_flags (DECL_ATTRIBUTES (decl)) == 0)
7140 return true;
7141 if (TARGET_COMPRESSION
7142 && mips_get_compress_on_flags (DECL_ATTRIBUTES (decl)) == 0)
7143 return true;
7144 }
7145
7146 return false;
7147 }
7148
7149 /* Implement TARGET_FUNCTION_OK_FOR_SIBCALL. */
7150
7151 static bool
7152 mips_function_ok_for_sibcall (tree decl, tree exp ATTRIBUTE_UNUSED)
7153 {
7154 if (!TARGET_SIBCALLS)
7155 return false;
7156
7157 /* Interrupt handlers need special epilogue code and therefore can't
7158 use sibcalls. */
7159 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
7160 return false;
7161
7162 	  /* Direct jumps are only possible to functions that use the same ISA
7163 	     encoding; there is no JX counterpart of JALX.  */
7164 if (decl
7165 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode)
7166 && mips_call_may_need_jalx_p (decl))
7167 return false;
7168
7169 /* Sibling calls should not prevent lazy binding. Lazy-binding stubs
7170 require $gp to be valid on entry, so sibcalls can only use stubs
7171 if $gp is call-clobbered. */
7172 if (decl
7173 && TARGET_CALL_SAVED_GP
7174 && !TARGET_ABICALLS_PIC0
7175 && !targetm.binds_local_p (decl))
7176 return false;
7177
7178 /* Otherwise OK. */
7179 return true;
7180 }
7181 \f
7182 /* Implement MOVE_BY_PIECES_P. */
7183
7184 bool
7185 mips_move_by_pieces_p (unsigned HOST_WIDE_INT size, unsigned int align)
7186 {
7187 if (HAVE_movmemsi)
7188 {
7189 /* movmemsi is meant to generate code that is at least as good as
7190 move_by_pieces. However, movmemsi effectively uses a by-pieces
7191 implementation both for moves smaller than a word and for
7192 word-aligned moves of no more than MIPS_MAX_MOVE_BYTES_STRAIGHT
7193 bytes. We should allow the tree-level optimisers to do such
7194 moves by pieces, as it often exposes other optimization
7195 opportunities. We might as well continue to use movmemsi at
7196 the rtl level though, as it produces better code when
7197 scheduling is disabled (such as at -O). */
7198 if (currently_expanding_to_rtl)
7199 return false;
7200 if (align < BITS_PER_WORD)
7201 return size < UNITS_PER_WORD;
7202 return size <= MIPS_MAX_MOVE_BYTES_STRAIGHT;
7203 }
7204 /* The default value. If this becomes a target hook, we should
7205 call the default definition instead. */
7206 return (move_by_pieces_ninsns (size, align, MOVE_MAX_PIECES + 1)
7207 < (unsigned int) MOVE_RATIO (optimize_insn_for_speed_p ()));
7208 }
7209
7210 /* Implement STORE_BY_PIECES_P. */
7211
7212 bool
7213 mips_store_by_pieces_p (unsigned HOST_WIDE_INT size, unsigned int align)
7214 {
7215 /* Storing by pieces involves moving constants into registers
7216 of size MIN (ALIGN, BITS_PER_WORD), then storing them.
7217 We need to decide whether it is cheaper to load the address of
7218 constant data into a register and use a block move instead. */
7219
7220 /* If the data is only byte aligned, then:
7221
7222 	     (a1) A block move of less than 4 bytes would involve 3 LBs and
7223 3 SBs. We might as well use 3 single-instruction LIs and 3 SBs
7224 instead.
7225
7226 (a2) A block move of 4 bytes from aligned source data can use an
7227 LW/SWL/SWR sequence. This is often better than the 4 LIs and
7228 4 SBs that we would generate when storing by pieces. */
7229 if (align <= BITS_PER_UNIT)
7230 return size < 4;
7231
7232 /* If the data is 2-byte aligned, then:
7233
7234 (b1) A block move of less than 4 bytes would use a combination of LBs,
7235 LHs, SBs and SHs. We get better code by using single-instruction
7236 LIs, SBs and SHs instead.
7237
7238 (b2) A block move of 4 bytes from aligned source data would again use
7239 an LW/SWL/SWR sequence. In most cases, loading the address of
7240 the source data would require at least one extra instruction.
7241 It is often more efficient to use 2 single-instruction LIs and
7242 2 SHs instead.
7243
7244 (b3) A block move of up to 3 additional bytes would be like (b1).
7245
7246 (b4) A block move of 8 bytes from aligned source data can use two
7247 LW/SWL/SWR sequences or a single LD/SDL/SDR sequence. Both
7248 sequences are better than the 4 LIs and 4 SHs that we'd generate
7249 when storing by pieces.
7250
7251 The reasoning for higher alignments is similar:
7252
7253 (c1) A block move of less than 4 bytes would be the same as (b1).
7254
7255 (c2) A block move of 4 bytes would use an LW/SW sequence. Again,
7256 loading the address of the source data would typically require
7257 at least one extra instruction. It is generally better to use
7258 LUI/ORI/SW instead.
7259
7260 (c3) A block move of up to 3 additional bytes would be like (b1).
7261
7262 (c4) A block move of 8 bytes can use two LW/SW sequences or a single
7263 LD/SD sequence, and in these cases we've traditionally preferred
7264 the memory copy over the more bulky constant moves. */
7265 return size < 8;
7266 }
7267
7268 /* Emit straight-line code to move LENGTH bytes from SRC to DEST.
7269 Assume that the areas do not overlap. */
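/* Worked example (editor's note, not from the original sources): a
   word-aligned 11-byte copy on a 32-bit target loads two 4-byte chunks
   into temporary registers, stores them, and leaves the remaining
   3 bytes to the move_by_pieces call at the end of the function.  */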
7270
7271 static void
7272 mips_block_move_straight (rtx dest, rtx src, HOST_WIDE_INT length)
7273 {
7274 HOST_WIDE_INT offset, delta;
7275 unsigned HOST_WIDE_INT bits;
7276 int i;
7277 enum machine_mode mode;
7278 rtx *regs;
7279
7280 /* Work out how many bits to move at a time. If both operands have
7281 half-word alignment, it is usually better to move in half words.
7282 For instance, lh/lh/sh/sh is usually better than lwl/lwr/swl/swr
7283 and lw/lw/sw/sw is usually better than ldl/ldr/sdl/sdr.
7284 Otherwise move word-sized chunks. */
7285 if (MEM_ALIGN (src) == BITS_PER_WORD / 2
7286 && MEM_ALIGN (dest) == BITS_PER_WORD / 2)
7287 bits = BITS_PER_WORD / 2;
7288 else
7289 bits = BITS_PER_WORD;
7290
7291 mode = mode_for_size (bits, MODE_INT, 0);
7292 delta = bits / BITS_PER_UNIT;
7293
7294 /* Allocate a buffer for the temporary registers. */
7295 regs = XALLOCAVEC (rtx, length / delta);
7296
7297 /* Load as many BITS-sized chunks as possible. Use a normal load if
7298 the source has enough alignment, otherwise use left/right pairs. */
7299 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
7300 {
7301 regs[i] = gen_reg_rtx (mode);
7302 if (MEM_ALIGN (src) >= bits)
7303 mips_emit_move (regs[i], adjust_address (src, mode, offset));
7304 else
7305 {
7306 rtx part = adjust_address (src, BLKmode, offset);
7307 set_mem_size (part, delta);
7308 if (!mips_expand_ext_as_unaligned_load (regs[i], part, bits, 0, 0))
7309 gcc_unreachable ();
7310 }
7311 }
7312
7313 /* Copy the chunks to the destination. */
7314 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
7315 if (MEM_ALIGN (dest) >= bits)
7316 mips_emit_move (adjust_address (dest, mode, offset), regs[i]);
7317 else
7318 {
7319 rtx part = adjust_address (dest, BLKmode, offset);
7320 set_mem_size (part, delta);
7321 if (!mips_expand_ins_as_unaligned_store (part, regs[i], bits, 0))
7322 gcc_unreachable ();
7323 }
7324
7325 /* Mop up any left-over bytes. */
7326 if (offset < length)
7327 {
7328 src = adjust_address (src, BLKmode, offset);
7329 dest = adjust_address (dest, BLKmode, offset);
7330 move_by_pieces (dest, src, length - offset,
7331 MIN (MEM_ALIGN (src), MEM_ALIGN (dest)), 0);
7332 }
7333 }
7334
7335 /* Helper function for doing a loop-based block operation on memory
7336 reference MEM. Each iteration of the loop will operate on LENGTH
7337 bytes of MEM.
7338
7339 Create a new base register for use within the loop and point it to
7340 the start of MEM. Create a new memory reference that uses this
7341 register. Store them in *LOOP_REG and *LOOP_MEM respectively. */
7342
7343 static void
7344 mips_adjust_block_mem (rtx mem, HOST_WIDE_INT length,
7345 rtx *loop_reg, rtx *loop_mem)
7346 {
7347 *loop_reg = copy_addr_to_reg (XEXP (mem, 0));
7348
7349 /* Although the new mem does not refer to a known location,
7350 it does keep up to LENGTH bytes of alignment. */
7351 *loop_mem = change_address (mem, BLKmode, *loop_reg);
7352 set_mem_align (*loop_mem, MIN (MEM_ALIGN (mem), length * BITS_PER_UNIT));
7353 }
7354
7355 /* Move LENGTH bytes from SRC to DEST using a loop that moves BYTES_PER_ITER
7356 bytes at a time. LENGTH must be at least BYTES_PER_ITER. Assume that
7357 the memory regions do not overlap. */
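/* Worked example (editor's note, not from the original sources): for
   LENGTH == 100 and BYTES_PER_ITER == 16, LEFTOVER is 100 % 16 == 4,
   so the loop below copies the first 96 bytes in six 16-byte
   iterations and mips_block_move_straight then mops up the final
   4 bytes.  */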
7358
7359 static void
7360 mips_block_move_loop (rtx dest, rtx src, HOST_WIDE_INT length,
7361 HOST_WIDE_INT bytes_per_iter)
7362 {
7363 rtx_code_label *label;
7364 rtx src_reg, dest_reg, final_src, test;
7365 HOST_WIDE_INT leftover;
7366
7367 leftover = length % bytes_per_iter;
7368 length -= leftover;
7369
7370 /* Create registers and memory references for use within the loop. */
7371 mips_adjust_block_mem (src, bytes_per_iter, &src_reg, &src);
7372 mips_adjust_block_mem (dest, bytes_per_iter, &dest_reg, &dest);
7373
7374 /* Calculate the value that SRC_REG should have after the last iteration
7375 of the loop. */
7376 final_src = expand_simple_binop (Pmode, PLUS, src_reg, GEN_INT (length),
7377 0, 0, OPTAB_WIDEN);
7378
7379 /* Emit the start of the loop. */
7380 label = gen_label_rtx ();
7381 emit_label (label);
7382
7383 /* Emit the loop body. */
7384 mips_block_move_straight (dest, src, bytes_per_iter);
7385
7386 /* Move on to the next block. */
7387 mips_emit_move (src_reg, plus_constant (Pmode, src_reg, bytes_per_iter));
7388 mips_emit_move (dest_reg, plus_constant (Pmode, dest_reg, bytes_per_iter));
7389
7390 /* Emit the loop condition. */
7391 test = gen_rtx_NE (VOIDmode, src_reg, final_src);
7392 if (Pmode == DImode)
7393 emit_jump_insn (gen_cbranchdi4 (test, src_reg, final_src, label));
7394 else
7395 emit_jump_insn (gen_cbranchsi4 (test, src_reg, final_src, label));
7396
7397 /* Mop up any left-over bytes. */
7398 if (leftover)
7399 mips_block_move_straight (dest, src, leftover);
7400 }
7401
7402 /* Expand a movmemsi instruction, which copies LENGTH bytes from
7403 memory reference SRC to memory reference DEST. */
7404
7405 bool
7406 mips_expand_block_move (rtx dest, rtx src, rtx length)
7407 {
7408 if (CONST_INT_P (length))
7409 {
7410 if (INTVAL (length) <= MIPS_MAX_MOVE_BYTES_STRAIGHT)
7411 {
7412 mips_block_move_straight (dest, src, INTVAL (length));
7413 return true;
7414 }
7415 else if (optimize)
7416 {
7417 mips_block_move_loop (dest, src, INTVAL (length),
7418 MIPS_MAX_MOVE_BYTES_PER_LOOP_ITER);
7419 return true;
7420 }
7421 }
7422 return false;
7423 }
7424 \f
7425 /* Expand a loop of synci insns for the address range [BEGIN, END). */
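/* Editor's sketch (hedged, not from the original sources): with the
   SYNCI step loaded into INC by RDHWR, the sequence emitted below is
   roughly:

	beq	begin,end,1f		# nothing to do for an empty range
	rdhwr	inc,$1			# load the cache line size
	beq	inc,$0,1f		# a step of 0 means SYNCI is a no-op
	neg	mask,inc
	and	begin,begin,mask	# align BEGIN down to a line boundary
	subu	length,end,begin
   0:	synci	0(begin)
	subu	length,length,inc
	addu	begin,begin,inc
	bgtz	length,0b		# loop while LENGTH > 0
   1:  */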
7426
7427 void
7428 mips_expand_synci_loop (rtx begin, rtx end)
7429 {
7430 rtx inc, cmp_result, mask, length;
7431 rtx_code_label *label, *end_label;
7432
7433 /* Create end_label. */
7434 end_label = gen_label_rtx ();
7435
7436 /* Check if begin equals end. */
7437 cmp_result = gen_rtx_EQ (VOIDmode, begin, end);
7438 emit_jump_insn (gen_condjump (cmp_result, end_label));
7439
7440 /* Load INC with the cache line size (rdhwr INC,$1). */
7441 inc = gen_reg_rtx (Pmode);
7442 emit_insn (PMODE_INSN (gen_rdhwr_synci_step, (inc)));
7443
7444 /* Check if inc is 0. */
7445 cmp_result = gen_rtx_EQ (VOIDmode, inc, const0_rtx);
7446 emit_jump_insn (gen_condjump (cmp_result, end_label));
7447
7448 /* Calculate mask. */
7449 mask = mips_force_unary (Pmode, NEG, inc);
7450
7451 /* Mask out begin by mask. */
7452 begin = mips_force_binary (Pmode, AND, begin, mask);
7453
7454 /* Calculate length. */
7455 length = mips_force_binary (Pmode, MINUS, end, begin);
7456
7457 /* Loop back to here. */
7458 label = gen_label_rtx ();
7459 emit_label (label);
7460
7461 emit_insn (gen_synci (begin));
7462
7463 /* Update length. */
7464 mips_emit_binary (MINUS, length, length, inc);
7465
7466 /* Update begin. */
7467 mips_emit_binary (PLUS, begin, begin, inc);
7468
7469 /* Check if length is greater than 0. */
7470 cmp_result = gen_rtx_GT (VOIDmode, length, const0_rtx);
7471 emit_jump_insn (gen_condjump (cmp_result, label));
7472
7473 emit_label (end_label);
7474 }
7475 \f
7476 /* Expand a QI or HI mode atomic memory operation.
7477
7478 GENERATOR contains a pointer to the gen_* function that generates
7479 the SI mode underlying atomic operation using masks that we
7480 calculate.
7481
7482 RESULT is the return register for the operation. Its value is NULL
7483 if unused.
7484
7485 MEM is the location of the atomic access.
7486
7487 OLDVAL is the first operand for the operation.
7488
7489 NEWVAL is the optional second operand for the operation. Its value
7490 is NULL if unused. */
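/* Worked example (editor's note, not from the original sources): for a
   little-endian HImode access at an address A with (A & 3) == 2, the
   code below accesses the containing word at (A & -4), computes
   SHIFT == 16 (the byte offset times eight), MASK == 0xffff0000 and
   INVERTED_MASK == 0x0000ffff, and shifts OLDVAL and NEWVAL left by 16
   so that they line up with the halfword inside the SImode value.  */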
7491
7492 void
7493 mips_expand_atomic_qihi (union mips_gen_fn_ptrs generator,
7494 rtx result, rtx mem, rtx oldval, rtx newval)
7495 {
7496 rtx orig_addr, memsi_addr, memsi, shift, shiftsi, unshifted_mask;
7497 rtx unshifted_mask_reg, mask, inverted_mask, si_op;
7498 rtx res = NULL;
7499 enum machine_mode mode;
7500
7501 mode = GET_MODE (mem);
7502
7503 /* Compute the address of the containing SImode value. */
7504 orig_addr = force_reg (Pmode, XEXP (mem, 0));
7505 memsi_addr = mips_force_binary (Pmode, AND, orig_addr,
7506 force_reg (Pmode, GEN_INT (-4)));
7507
7508 /* Create a memory reference for it. */
7509 memsi = gen_rtx_MEM (SImode, memsi_addr);
7510 set_mem_alias_set (memsi, ALIAS_SET_MEMORY_BARRIER);
7511 MEM_VOLATILE_P (memsi) = MEM_VOLATILE_P (mem);
7512
7513 /* Work out the byte offset of the QImode or HImode value,
7514 counting from the least significant byte. */
7515 shift = mips_force_binary (Pmode, AND, orig_addr, GEN_INT (3));
7516 if (TARGET_BIG_ENDIAN)
7517 mips_emit_binary (XOR, shift, shift, GEN_INT (mode == QImode ? 3 : 2));
7518
7519 /* Multiply by eight to convert the shift value from bytes to bits. */
7520 mips_emit_binary (ASHIFT, shift, shift, GEN_INT (3));
7521
7522 /* Make the final shift an SImode value, so that it can be used in
7523 SImode operations. */
7524 shiftsi = force_reg (SImode, gen_lowpart (SImode, shift));
7525
7526 /* Set MASK to an inclusive mask of the QImode or HImode value. */
7527 unshifted_mask = GEN_INT (GET_MODE_MASK (mode));
7528 unshifted_mask_reg = force_reg (SImode, unshifted_mask);
7529 mask = mips_force_binary (SImode, ASHIFT, unshifted_mask_reg, shiftsi);
7530
7531 /* Compute the equivalent exclusive mask. */
7532 inverted_mask = gen_reg_rtx (SImode);
7533 emit_insn (gen_rtx_SET (VOIDmode, inverted_mask,
7534 gen_rtx_NOT (SImode, mask)));
7535
7536 /* Shift the old value into place. */
7537 if (oldval != const0_rtx)
7538 {
7539 oldval = convert_modes (SImode, mode, oldval, true);
7540 oldval = force_reg (SImode, oldval);
7541 oldval = mips_force_binary (SImode, ASHIFT, oldval, shiftsi);
7542 }
7543
7544 /* Do the same for the new value. */
7545 if (newval && newval != const0_rtx)
7546 {
7547 newval = convert_modes (SImode, mode, newval, true);
7548 newval = force_reg (SImode, newval);
7549 newval = mips_force_binary (SImode, ASHIFT, newval, shiftsi);
7550 }
7551
7552 /* Do the SImode atomic access. */
7553 if (result)
7554 res = gen_reg_rtx (SImode);
7555 if (newval)
7556 si_op = generator.fn_6 (res, memsi, mask, inverted_mask, oldval, newval);
7557 else if (result)
7558 si_op = generator.fn_5 (res, memsi, mask, inverted_mask, oldval);
7559 else
7560 si_op = generator.fn_4 (memsi, mask, inverted_mask, oldval);
7561
7562 emit_insn (si_op);
7563
7564 if (result)
7565 {
7566 /* Shift and convert the result. */
7567 mips_emit_binary (AND, res, res, mask);
7568 mips_emit_binary (LSHIFTRT, res, res, shiftsi);
7569 mips_emit_move (result, gen_lowpart (GET_MODE (result), res));
7570 }
7571 }
7572
7573 /* Return true if it is possible to use left/right accesses for a
7574 bitfield of WIDTH bits starting BITPOS bits into BLKmode memory OP.
7575 When returning true, update *LEFT and *RIGHT as follows:
7576
7577 *LEFT is a QImode reference to the first byte if big endian or
7578 the last byte if little endian. This address can be used in the
7579 left-side instructions (LWL, SWL, LDL, SDL).
7580
7581 *RIGHT is a QImode reference to the opposite end of the field and
7582 	   can be used in the matching right-side instructions (LWR, SWR,
	   LDR, SDR).  */
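/* For illustration (editor's note, not from the original sources): on a
   big-endian target, a 32-bit field at byte offset 0 of an unaligned MEM
   yields *LEFT == byte 0 (the MSB, for LWL/SWL) and *RIGHT == byte 3
   (the LSB, for LWR/SWR); on a little-endian target the two are
   swapped.  */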
7583
7584 static bool
7585 mips_get_unaligned_mem (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos,
7586 rtx *left, rtx *right)
7587 {
7588 rtx first, last;
7589
7590 /* Check that the size is valid. */
7591 if (width != 32 && (!TARGET_64BIT || width != 64))
7592 return false;
7593
7594 /* We can only access byte-aligned values. Since we are always passed
7595 a reference to the first byte of the field, it is not necessary to
7596 do anything with BITPOS after this check. */
7597 if (bitpos % BITS_PER_UNIT != 0)
7598 return false;
7599
7600 /* Reject aligned bitfields: we want to use a normal load or store
7601 instead of a left/right pair. */
7602 if (MEM_ALIGN (op) >= width)
7603 return false;
7604
7605 /* Get references to both ends of the field. */
7606 first = adjust_address (op, QImode, 0);
7607 last = adjust_address (op, QImode, width / BITS_PER_UNIT - 1);
7608
7609 /* Allocate to LEFT and RIGHT according to endianness. LEFT should
7610 correspond to the MSB and RIGHT to the LSB. */
7611 if (TARGET_BIG_ENDIAN)
7612 *left = first, *right = last;
7613 else
7614 *left = last, *right = first;
7615
7616 return true;
7617 }
7618
7619 /* Try to use left/right loads to expand an "extv" or "extzv" pattern.
7620 DEST, SRC, WIDTH and BITPOS are the operands passed to the expander;
7621 the operation is the equivalent of:
7622
7623 (set DEST (*_extract SRC WIDTH BITPOS))
7624
7625 Return true on success. */
7626
7627 bool
7628 mips_expand_ext_as_unaligned_load (rtx dest, rtx src, HOST_WIDE_INT width,
7629 HOST_WIDE_INT bitpos, bool unsigned_p)
7630 {
7631 rtx left, right, temp;
7632 rtx dest1 = NULL_RTX;
7633
7634 	  /* If TARGET_64BIT, the destination of a 32-bit "extv" or "extzv" will
7635 	     be DImode; create a new temp and emit an extension at the end.  */
7636 if (GET_MODE (dest) == DImode
7637 && REG_P (dest)
7638 && GET_MODE_BITSIZE (SImode) == width)
7639 {
7640 dest1 = dest;
7641 dest = gen_reg_rtx (SImode);
7642 }
7643
7644 if (!mips_get_unaligned_mem (src, width, bitpos, &left, &right))
7645 return false;
7646
7647 temp = gen_reg_rtx (GET_MODE (dest));
7648 if (GET_MODE (dest) == DImode)
7649 {
7650 emit_insn (gen_mov_ldl (temp, src, left));
7651 emit_insn (gen_mov_ldr (dest, copy_rtx (src), right, temp));
7652 }
7653 else
7654 {
7655 emit_insn (gen_mov_lwl (temp, src, left));
7656 emit_insn (gen_mov_lwr (dest, copy_rtx (src), right, temp));
7657 }
7658
7659 	  /* If we were loading 32 bits and the original register was DImode,
7660 	     sign/zero extend into the original dest.  */
7661 if (dest1)
7662 {
7663 if (unsigned_p)
7664 emit_insn (gen_zero_extendsidi2 (dest1, dest));
7665 else
7666 emit_insn (gen_extendsidi2 (dest1, dest));
7667 }
7668 return true;
7669 }
7670
7671 /* Try to use left/right stores to expand an "ins" pattern. DEST, WIDTH,
7672 BITPOS and SRC are the operands passed to the expander; the operation
7673 is the equivalent of:
7674
7675 (set (zero_extract DEST WIDTH BITPOS) SRC)
7676
7677 Return true on success. */
7678
7679 bool
7680 mips_expand_ins_as_unaligned_store (rtx dest, rtx src, HOST_WIDE_INT width,
7681 HOST_WIDE_INT bitpos)
7682 {
7683 rtx left, right;
7684 enum machine_mode mode;
7685
7686 if (!mips_get_unaligned_mem (dest, width, bitpos, &left, &right))
7687 return false;
7688
7689 mode = mode_for_size (width, MODE_INT, 0);
7690 src = gen_lowpart (mode, src);
7691 if (mode == DImode)
7692 {
7693 emit_insn (gen_mov_sdl (dest, src, left));
7694 emit_insn (gen_mov_sdr (copy_rtx (dest), copy_rtx (src), right));
7695 }
7696 else
7697 {
7698 emit_insn (gen_mov_swl (dest, src, left));
7699 emit_insn (gen_mov_swr (copy_rtx (dest), copy_rtx (src), right));
7700 }
7701 return true;
7702 }
7703
7704 /* Return true if X is a MEM with the same size as MODE. */
7705
7706 bool
7707 mips_mem_fits_mode_p (enum machine_mode mode, rtx x)
7708 {
7709 return (MEM_P (x)
7710 && MEM_SIZE_KNOWN_P (x)
7711 && MEM_SIZE (x) == GET_MODE_SIZE (mode));
7712 }
7713
7714 /* Return true if (zero_extract OP WIDTH BITPOS) can be used as the
7715 source of an "ext" instruction or the destination of an "ins"
7716 instruction. OP must be a register operand and the following
7717 conditions must hold:
7718
7719 0 <= BITPOS < GET_MODE_BITSIZE (GET_MODE (op))
7720 0 < WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
7721 0 < BITPOS + WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
7722
7723 Also reject lengths equal to a word as they are better handled
7724 by the move patterns. */
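/* For example (editor's note, not from the original sources): with an
   SImode OP, (zero_extract OP 8 24) satisfies the conditions above,
   whereas a width of 32 is rejected by the IN_RANGE check below in
   favour of the ordinary move patterns.  */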
7725
7726 bool
7727 mips_use_ins_ext_p (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos)
7728 {
7729 if (!ISA_HAS_EXT_INS
7730 || !register_operand (op, VOIDmode)
7731 || GET_MODE_BITSIZE (GET_MODE (op)) > BITS_PER_WORD)
7732 return false;
7733
7734 if (!IN_RANGE (width, 1, GET_MODE_BITSIZE (GET_MODE (op)) - 1))
7735 return false;
7736
7737 if (bitpos < 0 || bitpos + width > GET_MODE_BITSIZE (GET_MODE (op)))
7738 return false;
7739
7740 return true;
7741 }
7742
7743 	/* Check if MASK and SHIFT are valid in a mask-low-and-shift-left
7744 	   operation if MAXLEN is the maximum length of consecutive bits that
7745 can make up MASK. MODE is the mode of the operation. See
7746 mask_low_and_shift_len for the actual definition. */
7747
7748 bool
7749 mask_low_and_shift_p (enum machine_mode mode, rtx mask, rtx shift, int maxlen)
7750 {
7751 return IN_RANGE (mask_low_and_shift_len (mode, mask, shift), 1, maxlen);
7752 }
7753
7754 /* Return true iff OP1 and OP2 are valid operands together for the
7755 *and<MODE>3 and *and<MODE>3_mips16 patterns. For the cases to consider,
7756 see the table in the comment before the pattern. */
7757
7758 bool
7759 and_operands_ok (enum machine_mode mode, rtx op1, rtx op2)
7760 {
7761 return (memory_operand (op1, mode)
7762 ? and_load_operand (op2, mode)
7763 : and_reg_operand (op2, mode));
7764 }
7765
7766 /* The canonical form of a mask-low-and-shift-left operation is
7767 (and (ashift X SHIFT) MASK) where MASK has the lower SHIFT number of bits
7768 cleared. Thus we need to shift MASK to the right before checking if it
7769 	   is a valid mask value.  MODE is the mode of the operation.  Return
7770 	   the length of the mask if it is valid, otherwise return -1.  */
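/* Worked example (editor's note, not from the original sources): in
   SImode with SHIFT == 3 and MASK == 0xf8, shifting the mask right
   gives 0x1f, and exact_log2 (0x1f + 1) == 5, so the length is 5.
   A mask of 0xe8 instead yields 0x1d, which is not of the form
   2^n - 1, so the function below returns -1.  */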
7771
7772 int
7773 mask_low_and_shift_len (enum machine_mode mode, rtx mask, rtx shift)
7774 {
7775 HOST_WIDE_INT shval;
7776
7777 shval = INTVAL (shift) & (GET_MODE_BITSIZE (mode) - 1);
7778 return exact_log2 ((UINTVAL (mask) >> shval) + 1);
7779 }
7780 \f
7781 /* Return true if -msplit-addresses is selected and should be honored.
7782
7783 -msplit-addresses is a half-way house between explicit relocations
7784 and the traditional assembler macros. It can split absolute 32-bit
7785 symbolic constants into a high/lo_sum pair but uses macros for other
7786 sorts of access.
7787
7788 Like explicit relocation support for REL targets, it relies
7789 on GNU extensions in the assembler and the linker.
7790
7791 Although this code should work for -O0, it has traditionally
7792 been treated as an optimization. */
7793
7794 static bool
7795 mips_split_addresses_p (void)
7796 {
7797 return (TARGET_SPLIT_ADDRESSES
7798 && optimize
7799 && !TARGET_MIPS16
7800 && !flag_pic
7801 && !ABI_HAS_64BIT_SYMBOLS);
7802 }
7803
7804 /* (Re-)Initialize mips_split_p, mips_lo_relocs and mips_hi_relocs. */
7805
7806 static void
7807 mips_init_relocs (void)
7808 {
7809 memset (mips_split_p, '\0', sizeof (mips_split_p));
7810 memset (mips_split_hi_p, '\0', sizeof (mips_split_hi_p));
7811 memset (mips_use_pcrel_pool_p, '\0', sizeof (mips_use_pcrel_pool_p));
7812 memset (mips_hi_relocs, '\0', sizeof (mips_hi_relocs));
7813 memset (mips_lo_relocs, '\0', sizeof (mips_lo_relocs));
7814
7815 if (TARGET_MIPS16_PCREL_LOADS)
7816 mips_use_pcrel_pool_p[SYMBOL_ABSOLUTE] = true;
7817 else
7818 {
7819 if (ABI_HAS_64BIT_SYMBOLS)
7820 {
7821 if (TARGET_EXPLICIT_RELOCS)
7822 {
7823 mips_split_p[SYMBOL_64_HIGH] = true;
7824 mips_hi_relocs[SYMBOL_64_HIGH] = "%highest(";
7825 mips_lo_relocs[SYMBOL_64_HIGH] = "%higher(";
7826
7827 mips_split_p[SYMBOL_64_MID] = true;
7828 mips_hi_relocs[SYMBOL_64_MID] = "%higher(";
7829 mips_lo_relocs[SYMBOL_64_MID] = "%hi(";
7830
7831 mips_split_p[SYMBOL_64_LOW] = true;
7832 mips_hi_relocs[SYMBOL_64_LOW] = "%hi(";
7833 mips_lo_relocs[SYMBOL_64_LOW] = "%lo(";
7834
7835 mips_split_p[SYMBOL_ABSOLUTE] = true;
7836 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
7837 }
7838 }
7839 else
7840 {
7841 if (TARGET_EXPLICIT_RELOCS
7842 || mips_split_addresses_p ()
7843 || TARGET_MIPS16)
7844 {
7845 mips_split_p[SYMBOL_ABSOLUTE] = true;
7846 mips_hi_relocs[SYMBOL_ABSOLUTE] = "%hi(";
7847 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
7848 }
7849 }
7850 }
7851
7852 if (TARGET_MIPS16)
7853 {
7854 /* The high part is provided by a pseudo copy of $gp. */
7855 mips_split_p[SYMBOL_GP_RELATIVE] = true;
7856 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gprel(";
7857 }
7858 else if (TARGET_EXPLICIT_RELOCS)
7859 /* Small data constants are kept whole until after reload,
7860 then lowered by mips_rewrite_small_data. */
7861 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gp_rel(";
7862
7863 if (TARGET_EXPLICIT_RELOCS)
7864 {
7865 mips_split_p[SYMBOL_GOT_PAGE_OFST] = true;
7866 if (TARGET_NEWABI)
7867 {
7868 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got_page(";
7869 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%got_ofst(";
7870 }
7871 else
7872 {
7873 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got(";
7874 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%lo(";
7875 }
7876 if (TARGET_MIPS16)
7877 /* Expose the use of $28 as soon as possible. */
7878 mips_split_hi_p[SYMBOL_GOT_PAGE_OFST] = true;
7879
7880 if (TARGET_XGOT)
7881 {
7882 /* The HIGH and LO_SUM are matched by special .md patterns. */
7883 mips_split_p[SYMBOL_GOT_DISP] = true;
7884
7885 mips_split_p[SYMBOL_GOTOFF_DISP] = true;
7886 mips_hi_relocs[SYMBOL_GOTOFF_DISP] = "%got_hi(";
7887 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_lo(";
7888
7889 mips_split_p[SYMBOL_GOTOFF_CALL] = true;
7890 mips_hi_relocs[SYMBOL_GOTOFF_CALL] = "%call_hi(";
7891 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call_lo(";
7892 }
7893 else
7894 {
7895 if (TARGET_NEWABI)
7896 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_disp(";
7897 else
7898 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got(";
7899 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call16(";
7900 if (TARGET_MIPS16)
7901 /* Expose the use of $28 as soon as possible. */
7902 mips_split_p[SYMBOL_GOT_DISP] = true;
7903 }
7904 }
7905
7906 if (TARGET_NEWABI)
7907 {
7908 mips_split_p[SYMBOL_GOTOFF_LOADGP] = true;
7909 mips_hi_relocs[SYMBOL_GOTOFF_LOADGP] = "%hi(%neg(%gp_rel(";
7910 mips_lo_relocs[SYMBOL_GOTOFF_LOADGP] = "%lo(%neg(%gp_rel(";
7911 }
7912
7913 mips_lo_relocs[SYMBOL_TLSGD] = "%tlsgd(";
7914 mips_lo_relocs[SYMBOL_TLSLDM] = "%tlsldm(";
7915
7916 if (TARGET_MIPS16_PCREL_LOADS)
7917 {
7918 mips_use_pcrel_pool_p[SYMBOL_DTPREL] = true;
7919 mips_use_pcrel_pool_p[SYMBOL_TPREL] = true;
7920 }
7921 else
7922 {
7923 mips_split_p[SYMBOL_DTPREL] = true;
7924 mips_hi_relocs[SYMBOL_DTPREL] = "%dtprel_hi(";
7925 mips_lo_relocs[SYMBOL_DTPREL] = "%dtprel_lo(";
7926
7927 mips_split_p[SYMBOL_TPREL] = true;
7928 mips_hi_relocs[SYMBOL_TPREL] = "%tprel_hi(";
7929 mips_lo_relocs[SYMBOL_TPREL] = "%tprel_lo(";
7930 }
7931
7932 mips_lo_relocs[SYMBOL_GOTTPREL] = "%gottprel(";
7933 mips_lo_relocs[SYMBOL_HALF] = "%half(";
7934 }
7935
7936 /* Print symbolic operand OP, which is part of a HIGH or LO_SUM
7937 in context CONTEXT. RELOCS is the array of relocations to use. */
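/* For example (editor's note, not from the original sources): with
   RELOCS == mips_lo_relocs and an absolute symbol foo, this prints
   "%lo(foo)"; for a composite prefix such as "%hi(%neg(%gp_rel(" the
   loop below emits one closing parenthesis for each '(' in the
   relocation string, giving "%hi(%neg(%gp_rel(foo)))".  */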
7938
7939 static void
7940 mips_print_operand_reloc (FILE *file, rtx op, enum mips_symbol_context context,
7941 const char **relocs)
7942 {
7943 enum mips_symbol_type symbol_type;
7944 const char *p;
7945
7946 symbol_type = mips_classify_symbolic_expression (op, context);
7947 gcc_assert (relocs[symbol_type]);
7948
7949 fputs (relocs[symbol_type], file);
7950 output_addr_const (file, mips_strip_unspec_address (op));
7951 for (p = relocs[symbol_type]; *p != 0; p++)
7952 if (*p == '(')
7953 fputc (')', file);
7954 }
7955
7956 /* Start a new block with the given asm switch enabled. If we need
7957 to print a directive, emit PREFIX before it and SUFFIX after it. */
7958
7959 static void
7960 mips_push_asm_switch_1 (struct mips_asm_switch *asm_switch,
7961 const char *prefix, const char *suffix)
7962 {
7963 if (asm_switch->nesting_level == 0)
7964 fprintf (asm_out_file, "%s.set\tno%s%s", prefix, asm_switch->name, suffix);
7965 asm_switch->nesting_level++;
7966 }
7967
7968 /* Likewise, but end a block. */
7969
7970 static void
7971 mips_pop_asm_switch_1 (struct mips_asm_switch *asm_switch,
7972 const char *prefix, const char *suffix)
7973 {
7974 gcc_assert (asm_switch->nesting_level);
7975 asm_switch->nesting_level--;
7976 if (asm_switch->nesting_level == 0)
7977 fprintf (asm_out_file, "%s.set\t%s%s", prefix, asm_switch->name, suffix);
7978 }
7979
7980 /* Wrappers around mips_push_asm_switch_1 and mips_pop_asm_switch_1
7981 that either print a complete line or print nothing. */
7982
7983 void
7984 mips_push_asm_switch (struct mips_asm_switch *asm_switch)
7985 {
7986 mips_push_asm_switch_1 (asm_switch, "\t", "\n");
7987 }
7988
7989 void
7990 mips_pop_asm_switch (struct mips_asm_switch *asm_switch)
7991 {
7992 mips_pop_asm_switch_1 (asm_switch, "\t", "\n");
7993 }
7994
7995 	/* Print the text for PRINT_OPERAND punctuation character CH to FILE.
7996 The punctuation characters are:
7997
7998 '(' Start a nested ".set noreorder" block.
7999 ')' End a nested ".set noreorder" block.
8000 '[' Start a nested ".set noat" block.
8001 ']' End a nested ".set noat" block.
8002 '<' Start a nested ".set nomacro" block.
8003 '>' End a nested ".set nomacro" block.
8004 '*' Behave like %(%< if generating a delayed-branch sequence.
8005 '#' Print a nop if in a ".set noreorder" block.
8006 '/' Like '#', but do nothing within a delayed-branch sequence.
8007 '?' Print "l" if mips_branch_likely is true
8008 '~' Print a nop if mips_branch_likely is true
8009 '.' Print the name of the register with a hard-wired zero (zero or $0).
8010 '@' Print the name of the assembler temporary register (at or $1).
8011 '^' Print the name of the pic call-through register (t9 or $25).
8012 '+' Print the name of the gp register (usually gp or $28).
8013 '$' Print the name of the stack pointer register (sp or $29).
8014 ':' Print "c" to use the compact version if the delay slot is a nop.
8015 '!' Print "s" to use the short version if the delay slot contains a
8016 16-bit instruction.
8017
8018 	   See also mips_init_print_operand_punct.  */
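/* Illustrative example (editor's note, not from the original sources):
   assuming no enclosing ".set noreorder" block, an output template such
   as "%(jal\t%0%)" expands to roughly

	.set	noreorder
	jal	foo
	.set	reorder

   with the '(' and ')' handled by the push/pop cases below.  */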
8019
8020 static void
8021 mips_print_operand_punctuation (FILE *file, int ch)
8022 {
8023 switch (ch)
8024 {
8025 case '(':
8026 mips_push_asm_switch_1 (&mips_noreorder, "", "\n\t");
8027 break;
8028
8029 case ')':
8030 mips_pop_asm_switch_1 (&mips_noreorder, "\n\t", "");
8031 break;
8032
8033 case '[':
8034 mips_push_asm_switch_1 (&mips_noat, "", "\n\t");
8035 break;
8036
8037 case ']':
8038 mips_pop_asm_switch_1 (&mips_noat, "\n\t", "");
8039 break;
8040
8041 case '<':
8042 mips_push_asm_switch_1 (&mips_nomacro, "", "\n\t");
8043 break;
8044
8045 case '>':
8046 mips_pop_asm_switch_1 (&mips_nomacro, "\n\t", "");
8047 break;
8048
8049 case '*':
8050 if (final_sequence != 0)
8051 {
8052 mips_print_operand_punctuation (file, '(');
8053 mips_print_operand_punctuation (file, '<');
8054 }
8055 break;
8056
8057 case '#':
8058 if (mips_noreorder.nesting_level > 0)
8059 fputs ("\n\tnop", file);
8060 break;
8061
8062 case '/':
8063 /* Print an extra newline so that the delayed insn is separated
8064 from the following ones. This looks neater and is consistent
8065 with non-nop delayed sequences. */
8066 if (mips_noreorder.nesting_level > 0 && final_sequence == 0)
8067 fputs ("\n\tnop\n", file);
8068 break;
8069
8070 case '?':
8071 if (mips_branch_likely)
8072 putc ('l', file);
8073 break;
8074
8075 case '~':
8076 if (mips_branch_likely)
8077 fputs ("\n\tnop", file);
8078 break;
8079
8080 case '.':
8081 fputs (reg_names[GP_REG_FIRST + 0], file);
8082 break;
8083
8084 case '@':
8085 fputs (reg_names[AT_REGNUM], file);
8086 break;
8087
8088 case '^':
8089 fputs (reg_names[PIC_FUNCTION_ADDR_REGNUM], file);
8090 break;
8091
8092 case '+':
8093 fputs (reg_names[PIC_OFFSET_TABLE_REGNUM], file);
8094 break;
8095
8096 case '$':
8097 fputs (reg_names[STACK_POINTER_REGNUM], file);
8098 break;
8099
8100 case ':':
8101 /* When final_sequence is 0, the delay slot will be a nop. We can
8102 use the compact version for microMIPS. */
8103 if (final_sequence == 0)
8104 putc ('c', file);
8105 break;
8106
8107 case '!':
8108 /* If the delay slot instruction is short, then use the
8109 compact version. */
8110 if (final_sequence == 0
8111 || get_attr_length (XVECEXP (final_sequence, 0, 1)) == 2)
8112 putc ('s', file);
8113 break;
8114
8115 default:
8116 gcc_unreachable ();
8117 break;
8118 }
8119 }
8120
8121 /* Initialize mips_print_operand_punct. */
8122
8123 static void
8124 mips_init_print_operand_punct (void)
8125 {
8126 const char *p;
8127
8128 for (p = "()[]<>*#/?~.@^+$:!"; *p; p++)
8129 mips_print_operand_punct[(unsigned char) *p] = true;
8130 }
8131
8132 /* PRINT_OPERAND prefix LETTER refers to the integer branch instruction
8133 associated with condition CODE. Print the condition part of the
8134 opcode to FILE. */
8135
8136 static void
8137 mips_print_int_branch_condition (FILE *file, enum rtx_code code, int letter)
8138 {
8139 switch (code)
8140 {
8141 case EQ:
8142 case NE:
8143 case GT:
8144 case GE:
8145 case LT:
8146 case LE:
8147 case GTU:
8148 case GEU:
8149 case LTU:
8150 case LEU:
8151 /* Conveniently, the MIPS names for these conditions are the same
8152 as their RTL equivalents. */
8153 fputs (GET_RTX_NAME (code), file);
8154 break;
8155
8156 default:
8157 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
8158 break;
8159 }
8160 }
8161
8162 /* Likewise floating-point branches. */
8163
8164 static void
8165 mips_print_float_branch_condition (FILE *file, enum rtx_code code, int letter)
8166 {
8167 switch (code)
8168 {
8169 case EQ:
8170 fputs ("c1f", file);
8171 break;
8172
8173 case NE:
8174 fputs ("c1t", file);
8175 break;
8176
8177 default:
8178 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
8179 break;
8180 }
8181 }
8182
8183 /* Implement TARGET_PRINT_OPERAND_PUNCT_VALID_P. */
8184
8185 static bool
8186 mips_print_operand_punct_valid_p (unsigned char code)
8187 {
8188 return mips_print_operand_punct[code];
8189 }
8190
8191 /* Implement TARGET_PRINT_OPERAND. The MIPS-specific operand codes are:
8192
8193 'X' Print CONST_INT OP in hexadecimal format.
8194 'x' Print the low 16 bits of CONST_INT OP in hexadecimal format.
8195 'd' Print CONST_INT OP in decimal.
8196 'm' Print one less than CONST_INT OP in decimal.
8197 'h' Print the high-part relocation associated with OP, after stripping
8198 any outermost HIGH.
8199 'R' Print the low-part relocation associated with OP.
8200 'C' Print the integer branch condition for comparison OP.
8201 'N' Print the inverse of the integer branch condition for comparison OP.
8202 'F' Print the FPU branch condition for comparison OP.
8203 'W' Print the inverse of the FPU branch condition for comparison OP.
8204 'T' Print 'f' for (eq:CC ...), 't' for (ne:CC ...),
8205 'z' for (eq:?I ...), 'n' for (ne:?I ...).
8206 't' Like 'T', but with the EQ/NE cases reversed
8207 'Y' Print mips_fp_conditions[INTVAL (OP)]
8208 'Z' Print OP and a comma for ISA_HAS_8CC, otherwise print nothing.
8209 'q' Print a DSP accumulator register.
8210 'D' Print the second part of a double-word register or memory operand.
8211 'L' Print the low-order register in a double-word register operand.
8212 'M' Print high-order register in a double-word register operand.
8213 'z' Print $0 if OP is zero, otherwise print OP normally.
8214 'b' Print the address of a memory operand, without offset. */
8215
8216 static void
8217 mips_print_operand (FILE *file, rtx op, int letter)
8218 {
8219 enum rtx_code code;
8220
8221 if (mips_print_operand_punct_valid_p (letter))
8222 {
8223 mips_print_operand_punctuation (file, letter);
8224 return;
8225 }
8226
8227 gcc_assert (op);
8228 code = GET_CODE (op);
8229
8230 switch (letter)
8231 {
8232 case 'X':
8233 if (CONST_INT_P (op))
8234 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op));
8235 else
8236 output_operand_lossage ("invalid use of '%%%c'", letter);
8237 break;
8238
8239 case 'x':
8240 if (CONST_INT_P (op))
8241 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op) & 0xffff);
8242 else
8243 output_operand_lossage ("invalid use of '%%%c'", letter);
8244 break;
8245
8246 case 'd':
8247 if (CONST_INT_P (op))
8248 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op));
8249 else
8250 output_operand_lossage ("invalid use of '%%%c'", letter);
8251 break;
8252
8253 case 'm':
8254 if (CONST_INT_P (op))
8255 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op) - 1);
8256 else
8257 output_operand_lossage ("invalid use of '%%%c'", letter);
8258 break;
8259
8260 case 'h':
8261 if (code == HIGH)
8262 op = XEXP (op, 0);
8263 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_hi_relocs);
8264 break;
8265
8266 case 'R':
8267 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_lo_relocs);
8268 break;
8269
8270 case 'C':
8271 mips_print_int_branch_condition (file, code, letter);
8272 break;
8273
8274 case 'N':
8275 mips_print_int_branch_condition (file, reverse_condition (code), letter);
8276 break;
8277
8278 case 'F':
8279 mips_print_float_branch_condition (file, code, letter);
8280 break;
8281
8282 case 'W':
8283 mips_print_float_branch_condition (file, reverse_condition (code),
8284 letter);
8285 break;
8286
8287 case 'T':
8288 case 't':
8289 {
8290 int truth = (code == NE) == (letter == 'T');
8291 fputc ("zfnt"[truth * 2 + ST_REG_P (REGNO (XEXP (op, 0)))], file);
8292 }
8293 break;
8294
8295 case 'Y':
8296 if (code == CONST_INT && UINTVAL (op) < ARRAY_SIZE (mips_fp_conditions))
8297 fputs (mips_fp_conditions[UINTVAL (op)], file);
8298 else
8299 output_operand_lossage ("'%%%c' is not a valid operand prefix",
8300 letter);
8301 break;
8302
8303 case 'Z':
8304 if (ISA_HAS_8CC)
8305 {
8306 mips_print_operand (file, op, 0);
8307 fputc (',', file);
8308 }
8309 break;
8310
8311 case 'q':
8312 if (code == REG && MD_REG_P (REGNO (op)))
8313 fprintf (file, "$ac0");
8314 else if (code == REG && DSP_ACC_REG_P (REGNO (op)))
8315 fprintf (file, "$ac%c", reg_names[REGNO (op)][3]);
8316 else
8317 output_operand_lossage ("invalid use of '%%%c'", letter);
8318 break;
8319
8320 default:
8321 switch (code)
8322 {
8323 case REG:
8324 {
8325 unsigned int regno = REGNO (op);
8326 if ((letter == 'M' && TARGET_LITTLE_ENDIAN)
8327 || (letter == 'L' && TARGET_BIG_ENDIAN)
8328 || letter == 'D')
8329 regno++;
8330 else if (letter && letter != 'z' && letter != 'M' && letter != 'L')
8331 output_operand_lossage ("invalid use of '%%%c'", letter);
8332 /* We need to print $0 .. $31 for COP0 registers. */
8333 if (COP0_REG_P (regno))
8334 fprintf (file, "$%s", &reg_names[regno][4]);
8335 else
8336 fprintf (file, "%s", reg_names[regno]);
8337 }
8338 break;
8339
8340 case MEM:
8341 if (letter == 'D')
8342 output_address (plus_constant (Pmode, XEXP (op, 0), 4));
8343 else if (letter == 'b')
8344 {
8345 gcc_assert (REG_P (XEXP (op, 0)));
8346 mips_print_operand (file, XEXP (op, 0), 0);
8347 }
8348 else if (letter && letter != 'z')
8349 output_operand_lossage ("invalid use of '%%%c'", letter);
8350 else
8351 output_address (XEXP (op, 0));
8352 break;
8353
8354 default:
8355 if (letter == 'z' && op == CONST0_RTX (GET_MODE (op)))
8356 fputs (reg_names[GP_REG_FIRST], file);
8357 else if (letter && letter != 'z')
8358 output_operand_lossage ("invalid use of '%%%c'", letter);
8359 else if (CONST_GP_P (op))
8360 fputs (reg_names[GLOBAL_POINTER_REGNUM], file);
8361 else
8362 output_addr_const (file, mips_strip_unspec_address (op));
8363 break;
8364 }
8365 }
8366 }
8367
8368 /* Implement TARGET_PRINT_OPERAND_ADDRESS. */
8369
8370 static void
8371 mips_print_operand_address (FILE *file, rtx x)
8372 {
8373 struct mips_address_info addr;
8374
8375 if (mips_classify_address (&addr, x, word_mode, true))
8376 switch (addr.type)
8377 {
8378 case ADDRESS_REG:
8379 mips_print_operand (file, addr.offset, 0);
8380 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
8381 return;
8382
8383 case ADDRESS_LO_SUM:
8384 mips_print_operand_reloc (file, addr.offset, SYMBOL_CONTEXT_MEM,
8385 mips_lo_relocs);
8386 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
8387 return;
8388
8389 case ADDRESS_CONST_INT:
8390 output_addr_const (file, x);
8391 fprintf (file, "(%s)", reg_names[GP_REG_FIRST]);
8392 return;
8393
8394 case ADDRESS_SYMBOLIC:
8395 output_addr_const (file, mips_strip_unspec_address (x));
8396 return;
8397 }
8398 gcc_unreachable ();
8399 }
8400 \f
8401 /* Implement TARGET_ENCODE_SECTION_INFO. */
8402
8403 static void
8404 mips_encode_section_info (tree decl, rtx rtl, int first)
8405 {
8406 default_encode_section_info (decl, rtl, first);
8407
8408 if (TREE_CODE (decl) == FUNCTION_DECL)
8409 {
8410 rtx symbol = XEXP (rtl, 0);
8411 tree type = TREE_TYPE (decl);
8412
8413 /* Encode whether the symbol is short or long. */
8414 if ((TARGET_LONG_CALLS && !mips_near_type_p (type))
8415 || mips_far_type_p (type))
8416 SYMBOL_REF_FLAGS (symbol) |= SYMBOL_FLAG_LONG_CALL;
8417 }
8418 }
8419
8420 /* Implement TARGET_SELECT_RTX_SECTION. */
8421
8422 static section *
8423 mips_select_rtx_section (enum machine_mode mode, rtx x,
8424 unsigned HOST_WIDE_INT align)
8425 {
8426 /* ??? Consider using mergeable small data sections. */
8427 if (mips_rtx_constant_in_small_data_p (mode))
8428 return get_named_section (NULL, ".sdata", 0);
8429
8430 return default_elf_select_rtx_section (mode, x, align);
8431 }
8432
8433 /* Implement TARGET_ASM_FUNCTION_RODATA_SECTION.
8434
8435 The complication here is that, with the combination TARGET_ABICALLS
8436 && !TARGET_ABSOLUTE_ABICALLS && !TARGET_GPWORD, jump tables will use
8437 absolute addresses, and should therefore not be included in the
8438 read-only part of a DSO. Handle such cases by selecting a normal
8439 data section instead of a read-only one. The logic apes that in
8440 default_function_rodata_section. */
8441
8442 static section *
8443 mips_function_rodata_section (tree decl)
8444 {
8445 if (!TARGET_ABICALLS || TARGET_ABSOLUTE_ABICALLS || TARGET_GPWORD)
8446 return default_function_rodata_section (decl);
8447
8448 if (decl && DECL_SECTION_NAME (decl))
8449 {
8450 const char *name = DECL_SECTION_NAME (decl);
8451 if (DECL_COMDAT_GROUP (decl) && strncmp (name, ".gnu.linkonce.t.", 16) == 0)
8452 {
8453 char *rname = ASTRDUP (name);
8454 rname[14] = 'd';
8455 return get_section (rname, SECTION_LINKONCE | SECTION_WRITE, decl);
8456 }
8457 else if (flag_function_sections
8458 && flag_data_sections
8459 && strncmp (name, ".text.", 6) == 0)
8460 {
8461 char *rname = ASTRDUP (name);
8462 memcpy (rname + 1, "data", 4);
8463 return get_section (rname, SECTION_WRITE, decl);
8464 }
8465 }
8466 return data_section;
8467 }
8468
8469 /* Implement TARGET_IN_SMALL_DATA_P. */
8470
8471 static bool
8472 mips_in_small_data_p (const_tree decl)
8473 {
8474 unsigned HOST_WIDE_INT size;
8475
8476 if (TREE_CODE (decl) == STRING_CST || TREE_CODE (decl) == FUNCTION_DECL)
8477 return false;
8478
8479 /* We don't yet generate small-data references for -mabicalls
8480 or VxWorks RTP code. See the related -G handling in
8481 mips_option_override. */
8482 if (TARGET_ABICALLS || TARGET_VXWORKS_RTP)
8483 return false;
8484
8485 if (TREE_CODE (decl) == VAR_DECL && DECL_SECTION_NAME (decl) != 0)
8486 {
8487 const char *name;
8488
8489 /* Reject anything that isn't in a known small-data section. */
8490 name = DECL_SECTION_NAME (decl);
8491 if (strcmp (name, ".sdata") != 0 && strcmp (name, ".sbss") != 0)
8492 return false;
8493
8494 /* If a symbol is defined externally, the assembler will use the
8495 usual -G rules when deciding how to implement macros. */
8496 if (mips_lo_relocs[SYMBOL_GP_RELATIVE] || !DECL_EXTERNAL (decl))
8497 return true;
8498 }
8499 else if (TARGET_EMBEDDED_DATA)
8500 {
8501 /* Don't put constants into the small data section: we want them
8502 to be in ROM rather than RAM. */
8503 if (TREE_CODE (decl) != VAR_DECL)
8504 return false;
8505
8506 if (TREE_READONLY (decl)
8507 && !TREE_SIDE_EFFECTS (decl)
8508 && (!DECL_INITIAL (decl) || TREE_CONSTANT (DECL_INITIAL (decl))))
8509 return false;
8510 }
8511
8512 /* Enforce -mlocal-sdata. */
8513 if (!TARGET_LOCAL_SDATA && !TREE_PUBLIC (decl))
8514 return false;
8515
8516 /* Enforce -mextern-sdata. */
8517 if (!TARGET_EXTERN_SDATA && DECL_P (decl))
8518 {
8519 if (DECL_EXTERNAL (decl))
8520 return false;
8521 if (DECL_COMMON (decl) && DECL_INITIAL (decl) == NULL)
8522 return false;
8523 }
8524
8525 /* We have traditionally not treated zero-sized objects as small data,
8526 so this is now effectively part of the ABI. */
8527 size = int_size_in_bytes (TREE_TYPE (decl));
8528 return size > 0 && size <= mips_small_data_threshold;
8529 }
8530
8531 /* Implement TARGET_USE_ANCHORS_FOR_SYMBOL_P. We don't want to use
8532 anchors for small data: the GP register acts as an anchor in that
8533 case. We also don't want to use them for PC-relative accesses,
8534 where the PC acts as an anchor. */
8535
8536 static bool
8537 mips_use_anchors_for_symbol_p (const_rtx symbol)
8538 {
8539 switch (mips_classify_symbol (symbol, SYMBOL_CONTEXT_MEM))
8540 {
8541 case SYMBOL_PC_RELATIVE:
8542 case SYMBOL_GP_RELATIVE:
8543 return false;
8544
8545 default:
8546 return default_use_anchors_for_symbol_p (symbol);
8547 }
8548 }
8549 \f
8550 /* The MIPS debug format wants all automatic variables and arguments
8551 to be in terms of the virtual frame pointer (stack pointer before
8552 any adjustment in the function), while the MIPS 3.0 linker wants
8553 the frame pointer to be the stack pointer after the initial
8554 adjustment. So, we do the adjustment here. The arg pointer (which
8555 is eliminated) points to the virtual frame pointer, while the frame
8556 pointer (which may be eliminated) points to the stack pointer after
8557 the initial adjustments. */
8558
8559 HOST_WIDE_INT
8560 mips_debugger_offset (rtx addr, HOST_WIDE_INT offset)
8561 {
8562 rtx offset2 = const0_rtx;
8563 rtx reg = eliminate_constant_term (addr, &offset2);
8564
8565 if (offset == 0)
8566 offset = INTVAL (offset2);
8567
8568 if (reg == stack_pointer_rtx
8569 || reg == frame_pointer_rtx
8570 || reg == hard_frame_pointer_rtx)
8571 {
8572 offset -= cfun->machine->frame.total_size;
8573 if (reg == hard_frame_pointer_rtx)
8574 offset += cfun->machine->frame.hard_frame_pointer_offset;
8575 }
8576
8577 return offset;
8578 }
8579 \f
8580 /* Implement ASM_OUTPUT_EXTERNAL. */
8581
8582 void
8583 mips_output_external (FILE *file, tree decl, const char *name)
8584 {
8585 default_elf_asm_output_external (file, decl, name);
8586
8587 /* We output the name if and only if TREE_SYMBOL_REFERENCED is
8588 set in order to avoid putting out names that are never really
8589 used. */
8590 if (TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
8591 {
8592 if (!TARGET_EXPLICIT_RELOCS && mips_in_small_data_p (decl))
8593 {
8594 /* When using assembler macros, emit .extern directives for
8595 all small-data externs so that the assembler knows how
8596 big they are.
8597
8598 In most cases it would be safe (though pointless) to emit
8599 .externs for other symbols too. One exception is when an
8600 object is within the -G limit but declared by the user to
8601 be in a section other than .sbss or .sdata. */
8602 fputs ("\t.extern\t", file);
8603 assemble_name (file, name);
8604 fprintf (file, ", " HOST_WIDE_INT_PRINT_DEC "\n",
8605 int_size_in_bytes (TREE_TYPE (decl)));
8606 }
8607 }
8608 }
8609
8610 /* Implement TARGET_ASM_OUTPUT_SOURCE_FILENAME. */
8611
8612 static void
8613 mips_output_filename (FILE *stream, const char *name)
8614 {
8615 /* If we are emitting DWARF-2, let dwarf2out handle the ".file"
8616 directives. */
8617 if (write_symbols == DWARF2_DEBUG)
8618 return;
8619 else if (mips_output_filename_first_time)
8620 {
8621 mips_output_filename_first_time = 0;
8622 num_source_filenames += 1;
8623 current_function_file = name;
8624 fprintf (stream, "\t.file\t%d ", num_source_filenames);
8625 output_quoted_string (stream, name);
8626 putc ('\n', stream);
8627 }
8628 /* If we are emitting stabs, let dbxout.c handle this (except for
8629 the mips_output_filename_first_time case). */
8630 else if (write_symbols == DBX_DEBUG)
8631 return;
8632 else if (name != current_function_file
8633 && strcmp (name, current_function_file) != 0)
8634 {
8635 num_source_filenames += 1;
8636 current_function_file = name;
8637 fprintf (stream, "\t.file\t%d ", num_source_filenames);
8638 output_quoted_string (stream, name);
8639 putc ('\n', stream);
8640 }
8641 }
8642
8643 /* Implement TARGET_ASM_OUTPUT_DWARF_DTPREL. */
8644
8645 static void ATTRIBUTE_UNUSED
8646 mips_output_dwarf_dtprel (FILE *file, int size, rtx x)
8647 {
8648 switch (size)
8649 {
8650 case 4:
8651 fputs ("\t.dtprelword\t", file);
8652 break;
8653
8654 case 8:
8655 fputs ("\t.dtpreldword\t", file);
8656 break;
8657
8658 default:
8659 gcc_unreachable ();
8660 }
8661 output_addr_const (file, x);
8662 fputs ("+0x8000", file);
8663 }
8664
8665 /* Implement TARGET_DWARF_REGISTER_SPAN. */
8666
8667 static rtx
8668 mips_dwarf_register_span (rtx reg)
8669 {
8670 rtx high, low;
8671 enum machine_mode mode;
8672
8673 /* By default, GCC maps increasing register numbers to increasing
8674 memory locations, but paired FPRs are always little-endian,
8675 regardless of the prevailing endianness. */
8676 mode = GET_MODE (reg);
8677 if (FP_REG_P (REGNO (reg))
8678 && TARGET_BIG_ENDIAN
8679 && MAX_FPRS_PER_FMT > 1
8680 && GET_MODE_SIZE (mode) > UNITS_PER_FPREG)
8681 {
8682 gcc_assert (GET_MODE_SIZE (mode) == UNITS_PER_HWFPVALUE);
8683 high = mips_subword (reg, true);
8684 low = mips_subword (reg, false);
8685 return gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, high, low));
8686 }
8687
8688 return NULL_RTX;
8689 }
8690
8691 /* DSP ALU can bypass data with no delays for the following pairs. */
8692 enum insn_code dspalu_bypass_table[][2] =
8693 {
8694 {CODE_FOR_mips_addsc, CODE_FOR_mips_addwc},
8695 {CODE_FOR_mips_cmpu_eq_qb, CODE_FOR_mips_pick_qb},
8696 {CODE_FOR_mips_cmpu_lt_qb, CODE_FOR_mips_pick_qb},
8697 {CODE_FOR_mips_cmpu_le_qb, CODE_FOR_mips_pick_qb},
8698 {CODE_FOR_mips_cmp_eq_ph, CODE_FOR_mips_pick_ph},
8699 {CODE_FOR_mips_cmp_lt_ph, CODE_FOR_mips_pick_ph},
8700 {CODE_FOR_mips_cmp_le_ph, CODE_FOR_mips_pick_ph},
8701 {CODE_FOR_mips_wrdsp, CODE_FOR_mips_insv}
8702 };
8703
8704 int
8705 mips_dspalu_bypass_p (rtx out_insn, rtx in_insn)
8706 {
8707 int i;
8708 int num_bypass = ARRAY_SIZE (dspalu_bypass_table);
8709 enum insn_code out_icode = (enum insn_code) INSN_CODE (out_insn);
8710 enum insn_code in_icode = (enum insn_code) INSN_CODE (in_insn);
8711
8712 for (i = 0; i < num_bypass; i++)
8713 {
8714 if (out_icode == dspalu_bypass_table[i][0]
8715 && in_icode == dspalu_bypass_table[i][1])
8716 return true;
8717 }
8718
8719 return false;
8720 }
8721 /* Implement ASM_OUTPUT_ASCII. */
8722
8723 void
8724 mips_output_ascii (FILE *stream, const char *string, size_t len)
8725 {
8726 size_t i;
8727 int cur_pos;
8728
8729 cur_pos = 17;
8730 fprintf (stream, "\t.ascii\t\"");
8731 for (i = 0; i < len; i++)
8732 {
8733 int c;
8734
8735 c = (unsigned char) string[i];
8736 if (ISPRINT (c))
8737 {
8738 if (c == '\\' || c == '\"')
8739 {
8740 putc ('\\', stream);
8741 cur_pos++;
8742 }
8743 putc (c, stream);
8744 cur_pos++;
8745 }
8746 else
8747 {
8748 fprintf (stream, "\\%03o", c);
8749 cur_pos += 4;
8750 }
8751
8752 if (cur_pos > 72 && i+1 < len)
8753 {
8754 cur_pos = 17;
8755 fprintf (stream, "\"\n\t.ascii\t\"");
8756 }
8757 }
8758 fprintf (stream, "\"\n");
8759 }
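
/* For example, given the 4-byte string "a\"b\n", the loop above would
emit (illustrative only):

	.ascii	"a\"b\012"

printable characters are copied (escaping backslashes and quotes) and
everything else becomes a three-digit octal escape. */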
8760
8761 /* Return the pseudo-op for full SYMBOL_(D)TPREL address *ADDR.
8762 Update *ADDR with the operand that should be printed. */
8763
8764 const char *
8765 mips_output_tls_reloc_directive (rtx *addr)
8766 {
8767 enum mips_symbol_type type;
8768
8769 type = mips_classify_symbolic_expression (*addr, SYMBOL_CONTEXT_LEA);
8770 *addr = mips_strip_unspec_address (*addr);
8771 switch (type)
8772 {
8773 case SYMBOL_DTPREL:
8774 return Pmode == SImode ? ".dtprelword\t%0" : ".dtpreldword\t%0";
8775
8776 case SYMBOL_TPREL:
8777 return Pmode == SImode ? ".tprelword\t%0" : ".tpreldword\t%0";
8778
8779 default:
8780 gcc_unreachable ();
8781 }
8782 }
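
/* For example, when Pmode is SImode, a SYMBOL_DTPREL reference yields
".dtprelword\t%0", which the caller prints as something like
"\t.dtprelword\tfoo". */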
8783
8784 /* Emit either a label, .comm, or .lcomm directive. When using assembler
8785 macros, mark the symbol as written so that mips_asm_output_external
8786 won't emit an .extern for it. STREAM is the output file, NAME is the
8787 name of the symbol, INIT_STRING is the string that should be written
8788 before the symbol and FINAL_STRING is the string that should be
8789 written after it. FINAL_STRING is a printf format that consumes the
8790 remaining arguments. */
8791
8792 void
8793 mips_declare_object (FILE *stream, const char *name, const char *init_string,
8794 const char *final_string, ...)
8795 {
8796 va_list ap;
8797
8798 fputs (init_string, stream);
8799 assemble_name (stream, name);
8800 va_start (ap, final_string);
8801 vfprintf (stream, final_string, ap);
8802 va_end (ap);
8803
8804 if (!TARGET_EXPLICIT_RELOCS)
8805 {
8806 tree name_tree = get_identifier (name);
8807 TREE_ASM_WRITTEN (name_tree) = 1;
8808 }
8809 }
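
/* For example, the call in mips_declare_common_object below,

	mips_declare_object (stream, name, "\n\t.comm\t",
			     "," HOST_WIDE_INT_PRINT_UNSIGNED ",%u\n",
			     size, align / BITS_PER_UNIT);

emits "\n\t.comm\tNAME,SIZE,ALIGN". */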
8810
8811 /* Declare a common object of SIZE bytes using asm directive INIT_STRING.
8812 NAME is the name of the object and ALIGN is the required alignment
8813 in bytes. TAKES_ALIGNMENT_P is true if the directive takes a third
8814 alignment argument. */
8815
8816 void
8817 mips_declare_common_object (FILE *stream, const char *name,
8818 const char *init_string,
8819 unsigned HOST_WIDE_INT size,
8820 unsigned int align, bool takes_alignment_p)
8821 {
8822 if (!takes_alignment_p)
8823 {
8824 size += (align / BITS_PER_UNIT) - 1;
8825 size -= size % (align / BITS_PER_UNIT);
8826 mips_declare_object (stream, name, init_string,
8827 "," HOST_WIDE_INT_PRINT_UNSIGNED "\n", size);
8828 }
8829 else
8830 mips_declare_object (stream, name, init_string,
8831 "," HOST_WIDE_INT_PRINT_UNSIGNED ",%u\n",
8832 size, align / BITS_PER_UNIT);
8833 }
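
/* For example, with !TAKES_ALIGNMENT_P, a 10-byte object with 8-byte
alignment is padded to 17 bytes and then rounded down to 16, so the
directive asks for 16 bytes. */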
8834
8835 /* Implement ASM_OUTPUT_ALIGNED_DECL_COMMON. This is usually the same as the
8836 elfos.h version, but we also need to handle -muninit-const-in-rodata. */
8837
8838 void
8839 mips_output_aligned_decl_common (FILE *stream, tree decl, const char *name,
8840 unsigned HOST_WIDE_INT size,
8841 unsigned int align)
8842 {
8843 /* If the target wants uninitialized const declarations in
8844 .rdata then don't put them in .comm. */
8845 if (TARGET_EMBEDDED_DATA
8846 && TARGET_UNINIT_CONST_IN_RODATA
8847 && TREE_CODE (decl) == VAR_DECL
8848 && TREE_READONLY (decl)
8849 && (DECL_INITIAL (decl) == 0 || DECL_INITIAL (decl) == error_mark_node))
8850 {
8851 if (TREE_PUBLIC (decl) && DECL_NAME (decl))
8852 targetm.asm_out.globalize_label (stream, name);
8853
8854 switch_to_section (readonly_data_section);
8855 ASM_OUTPUT_ALIGN (stream, floor_log2 (align / BITS_PER_UNIT));
8856 mips_declare_object (stream, name, "",
8857 ":\n\t.space\t" HOST_WIDE_INT_PRINT_UNSIGNED "\n",
8858 size);
8859 }
8860 else
8861 mips_declare_common_object (stream, name, "\n\t.comm\t",
8862 size, align, true);
8863 }
8864
8865 #ifdef ASM_OUTPUT_SIZE_DIRECTIVE
8866 extern int size_directive_output;
8867
8868 /* Implement ASM_DECLARE_OBJECT_NAME. This is like most of the standard ELF
8869 definitions except that it uses mips_declare_object to emit the label. */
8870
8871 void
8872 mips_declare_object_name (FILE *stream, const char *name,
8873 tree decl)
8874 {
8875 #ifdef ASM_OUTPUT_TYPE_DIRECTIVE
8876 ASM_OUTPUT_TYPE_DIRECTIVE (stream, name, "object");
8877 #endif
8878
8879 size_directive_output = 0;
8880 if (!flag_inhibit_size_directive && DECL_SIZE (decl))
8881 {
8882 HOST_WIDE_INT size;
8883
8884 size_directive_output = 1;
8885 size = int_size_in_bytes (TREE_TYPE (decl));
8886 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
8887 }
8888
8889 mips_declare_object (stream, name, "", ":\n");
8890 }
8891
8892 /* Implement ASM_FINISH_DECLARE_OBJECT. This is generic ELF stuff. */
8893
8894 void
8895 mips_finish_declare_object (FILE *stream, tree decl, int top_level, int at_end)
8896 {
8897 const char *name;
8898
8899 name = XSTR (XEXP (DECL_RTL (decl), 0), 0);
8900 if (!flag_inhibit_size_directive
8901 && DECL_SIZE (decl) != 0
8902 && !at_end
8903 && top_level
8904 && DECL_INITIAL (decl) == error_mark_node
8905 && !size_directive_output)
8906 {
8907 HOST_WIDE_INT size;
8908
8909 size_directive_output = 1;
8910 size = int_size_in_bytes (TREE_TYPE (decl));
8911 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
8912 }
8913 }
8914 #endif
8915 \f
8916 /* Return the FOO in the name of the ".mdebug.FOO" section associated
8917 with the current ABI. */
8918
8919 static const char *
8920 mips_mdebug_abi_name (void)
8921 {
8922 switch (mips_abi)
8923 {
8924 case ABI_32:
8925 return "abi32";
8926 case ABI_O64:
8927 return "abiO64";
8928 case ABI_N32:
8929 return "abiN32";
8930 case ABI_64:
8931 return "abi64";
8932 case ABI_EABI:
8933 return TARGET_64BIT ? "eabi64" : "eabi32";
8934 default:
8935 gcc_unreachable ();
8936 }
8937 }
8938
8939 /* Implement TARGET_ASM_FILE_START. */
8940
8941 static void
8942 mips_file_start (void)
8943 {
8944 default_file_start ();
8945
8946 /* Generate a special section to describe the ABI switches used to
8947 produce the resultant binary. */
8948
8949 /* Record the ABI itself. Modern versions of binutils encode
8950 this information in the ELF header flags, but GDB needs the
8951 information in order to correctly debug binaries produced by
8952 older binutils. See the function mips_gdbarch_init in
8953 gdb/mips-tdep.c. */
8954 fprintf (asm_out_file, "\t.section .mdebug.%s\n\t.previous\n",
8955 mips_mdebug_abi_name ());
8956
8957 /* There is no ELF header flag to distinguish long32 forms of the
8958 EABI from long64 forms. Emit a special section to help tools
8959 such as GDB. Do the same for o64, which is sometimes used with
8960 -mlong64. */
8961 if (mips_abi == ABI_EABI || mips_abi == ABI_O64)
8962 fprintf (asm_out_file, "\t.section .gcc_compiled_long%d\n"
8963 "\t.previous\n", TARGET_LONG64 ? 64 : 32);
8964
8965 /* Record the NaN encoding. */
8966 if (HAVE_AS_NAN || mips_nan != MIPS_IEEE_754_DEFAULT)
8967 fprintf (asm_out_file, "\t.nan\t%s\n",
8968 mips_nan == MIPS_IEEE_754_2008 ? "2008" : "legacy");
8969
8970 #ifdef HAVE_AS_GNU_ATTRIBUTE
8971 {
8972 int attr;
8973
8974 /* No floating-point operations, -mno-float. */
8975 if (TARGET_NO_FLOAT)
8976 attr = 0;
8977 /* Soft-float code, -msoft-float. */
8978 else if (!TARGET_HARD_FLOAT_ABI)
8979 attr = 3;
8980 /* Single-float code, -msingle-float. */
8981 else if (!TARGET_DOUBLE_FLOAT)
8982 attr = 2;
8983 /* 64-bit FP registers on a 32-bit target, -mips32r2 -mfp64. */
8984 else if (!TARGET_64BIT && TARGET_FLOAT64)
8985 attr = 4;
8986 /* Regular FP code, FP regs same size as GP regs, -mdouble-float. */
8987 else
8988 attr = 1;
8989
8990 fprintf (asm_out_file, "\t.gnu_attribute 4, %d\n", attr);
8991 }
8992 #endif
8993
8994 /* If TARGET_ABICALLS, tell GAS to generate -KPIC code. */
8995 if (TARGET_ABICALLS)
8996 {
8997 fprintf (asm_out_file, "\t.abicalls\n");
8998 if (TARGET_ABICALLS_PIC0)
8999 fprintf (asm_out_file, "\t.option\tpic0\n");
9000 }
9001
9002 if (flag_verbose_asm)
9003 fprintf (asm_out_file, "\n%s -G value = %d, Arch = %s, ISA = %d\n",
9004 ASM_COMMENT_START,
9005 mips_small_data_threshold, mips_arch_info->name, mips_isa);
9006 }
9007
9008 /* Implement TARGET_ASM_CODE_END. */
9009
9010 static void
9011 mips_code_end (void)
9012 {
9013 mips_finish_stub (&mips16_rdhwr_stub);
9014 mips_finish_stub (&mips16_get_fcsr_stub);
9015 mips_finish_stub (&mips16_set_fcsr_stub);
9016 }
9017 \f
9018 /* Make the last instruction frame-related and note that it performs
9019 the operation described by FRAME_PATTERN. */
9020
9021 static void
9022 mips_set_frame_expr (rtx frame_pattern)
9023 {
9024 rtx_insn *insn;
9025
9026 insn = get_last_insn ();
9027 RTX_FRAME_RELATED_P (insn) = 1;
9028 REG_NOTES (insn) = alloc_EXPR_LIST (REG_FRAME_RELATED_EXPR,
9029 frame_pattern,
9030 REG_NOTES (insn));
9031 }
9032
9033 /* Return a frame-related rtx that stores REG at MEM.
9034 REG must be a single register. */
9035
9036 static rtx
9037 mips_frame_set (rtx mem, rtx reg)
9038 {
9039 rtx set;
9040
9041 set = gen_rtx_SET (VOIDmode, mem, reg);
9042 RTX_FRAME_RELATED_P (set) = 1;
9043
9044 return set;
9045 }
9046
9047 /* Record that the epilogue has restored call-saved register REG. */
9048
9049 static void
9050 mips_add_cfa_restore (rtx reg)
9051 {
9052 mips_epilogue.cfa_restores = alloc_reg_note (REG_CFA_RESTORE, reg,
9053 mips_epilogue.cfa_restores);
9054 }
9055 \f
9056 /* If a MIPS16e SAVE or RESTORE instruction saves or restores register
9057 mips16e_s2_s8_regs[X], it must also save the registers in indexes
9058 X + 1 onwards. Likewise mips16e_a0_a3_regs. */
9059 static const unsigned char mips16e_s2_s8_regs[] = {
9060 30, 23, 22, 21, 20, 19, 18
9061 };
9062 static const unsigned char mips16e_a0_a3_regs[] = {
9063 4, 5, 6, 7
9064 };
9065
9066 /* A list of the registers that can be saved by the MIPS16e SAVE instruction,
9067 ordered from the uppermost in memory to the lowest in memory. */
9068 static const unsigned char mips16e_save_restore_regs[] = {
9069 31, 30, 23, 22, 21, 20, 19, 18, 17, 16, 7, 6, 5, 4
9070 };
9071
9072 /* Return the index of the lowest X in the range [0, SIZE) for which
9073 bit REGS[X] is set in MASK. Return SIZE if there is no such X. */
9074
9075 static unsigned int
9076 mips16e_find_first_register (unsigned int mask, const unsigned char *regs,
9077 unsigned int size)
9078 {
9079 unsigned int i;
9080
9081 for (i = 0; i < size; i++)
9082 if (BITSET_P (mask, regs[i]))
9083 break;
9084
9085 return i;
9086 }
9087
9088 /* *MASK_PTR is a mask of general-purpose registers and *NUM_REGS_PTR
9089 is the number of set bits. If *MASK_PTR contains REGS[X] for some X
9090 in [0, SIZE), adjust *MASK_PTR and *NUM_REGS_PTR so that the same
9091 is true for all indexes in (X, SIZE). */
9092
9093 static void
9094 mips16e_mask_registers (unsigned int *mask_ptr, const unsigned char *regs,
9095 unsigned int size, unsigned int *num_regs_ptr)
9096 {
9097 unsigned int i;
9098
9099 i = mips16e_find_first_register (*mask_ptr, regs, size);
9100 for (i++; i < size; i++)
9101 if (!BITSET_P (*mask_ptr, regs[i]))
9102 {
9103 *num_regs_ptr += 1;
9104 *mask_ptr |= 1 << regs[i];
9105 }
9106 }
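
/* For example, if *MASK_PTR initially contains only $20 and REGS is
mips16e_s2_s8_regs (30, 23, 22, 21, 20, 19, 18), the loop above also
sets the bits for $19 and $18 and adds 2 to *NUM_REGS_PTR. */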
9107
9108 /* Return a simplified form of X using the register values in REG_VALUES.
9109 REG_VALUES[R] is the last value assigned to hard register R, or null
9110 if R has not been modified.
9111
9112 This function is rather limited, but is good enough for our purposes. */
9113
9114 static rtx
9115 mips16e_collect_propagate_value (rtx x, rtx *reg_values)
9116 {
9117 x = avoid_constant_pool_reference (x);
9118
9119 if (UNARY_P (x))
9120 {
9121 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
9122 return simplify_gen_unary (GET_CODE (x), GET_MODE (x),
9123 x0, GET_MODE (XEXP (x, 0)));
9124 }
9125
9126 if (ARITHMETIC_P (x))
9127 {
9128 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
9129 rtx x1 = mips16e_collect_propagate_value (XEXP (x, 1), reg_values);
9130 return simplify_gen_binary (GET_CODE (x), GET_MODE (x), x0, x1);
9131 }
9132
9133 if (REG_P (x)
9134 && reg_values[REGNO (x)]
9135 && !rtx_unstable_p (reg_values[REGNO (x)]))
9136 return reg_values[REGNO (x)];
9137
9138 return x;
9139 }
9140
9141 /* Return true if (set DEST SRC) stores an argument register into its
9142 caller-allocated save slot, storing the number of that argument
9143 register in *REGNO_PTR if so. REG_VALUES is as for
9144 mips16e_collect_propagate_value. */
9145
9146 static bool
9147 mips16e_collect_argument_save_p (rtx dest, rtx src, rtx *reg_values,
9148 unsigned int *regno_ptr)
9149 {
9150 unsigned int argno, regno;
9151 HOST_WIDE_INT offset, required_offset;
9152 rtx addr, base;
9153
9154 /* Check that this is a word-mode store. */
9155 if (!MEM_P (dest) || !REG_P (src) || GET_MODE (dest) != word_mode)
9156 return false;
9157
9158 /* Check that the register being saved is an unmodified argument
9159 register. */
9160 regno = REGNO (src);
9161 if (!IN_RANGE (regno, GP_ARG_FIRST, GP_ARG_LAST) || reg_values[regno])
9162 return false;
9163 argno = regno - GP_ARG_FIRST;
9164
9165 /* Check whether the address is an appropriate stack-pointer or
9166 frame-pointer access. */
9167 addr = mips16e_collect_propagate_value (XEXP (dest, 0), reg_values);
9168 mips_split_plus (addr, &base, &offset);
9169 required_offset = cfun->machine->frame.total_size + argno * UNITS_PER_WORD;
9170 if (base == hard_frame_pointer_rtx)
9171 required_offset -= cfun->machine->frame.hard_frame_pointer_offset;
9172 else if (base != stack_pointer_rtx)
9173 return false;
9174 if (offset != required_offset)
9175 return false;
9176
9177 *regno_ptr = regno;
9178 return true;
9179 }
9180
9181 /* A subroutine of mips_expand_prologue, called only when generating
9182 MIPS16e SAVE instructions. Search the start of the function for any
9183 instructions that save argument registers into their caller-allocated
9184 save slots. Delete such instructions and return a value N such that
9185 saving [GP_ARG_FIRST, GP_ARG_FIRST + N) would make all the deleted
9186 instructions redundant. */
9187
9188 static unsigned int
9189 mips16e_collect_argument_saves (void)
9190 {
9191 rtx reg_values[FIRST_PSEUDO_REGISTER];
9192 rtx_insn *insn, *next;
9193 rtx set, dest, src;
9194 unsigned int nargs, regno;
9195
9196 push_topmost_sequence ();
9197 nargs = 0;
9198 memset (reg_values, 0, sizeof (reg_values));
9199 for (insn = get_insns (); insn; insn = next)
9200 {
9201 next = NEXT_INSN (insn);
9202 if (NOTE_P (insn) || DEBUG_INSN_P (insn))
9203 continue;
9204
9205 if (!INSN_P (insn))
9206 break;
9207
9208 set = PATTERN (insn);
9209 if (GET_CODE (set) != SET)
9210 break;
9211
9212 dest = SET_DEST (set);
9213 src = SET_SRC (set);
9214 if (mips16e_collect_argument_save_p (dest, src, reg_values, &regno))
9215 {
9216 if (!BITSET_P (cfun->machine->frame.mask, regno))
9217 {
9218 delete_insn (insn);
9219 nargs = MAX (nargs, (regno - GP_ARG_FIRST) + 1);
9220 }
9221 }
9222 else if (REG_P (dest) && GET_MODE (dest) == word_mode)
9223 reg_values[REGNO (dest)]
9224 = mips16e_collect_propagate_value (src, reg_values);
9225 else
9226 break;
9227 }
9228 pop_topmost_sequence ();
9229
9230 return nargs;
9231 }
9232
9233 /* Return a move between register REGNO and memory location SP + OFFSET.
9234 REG_PARM_P is true if SP + OFFSET belongs to REG_PARM_STACK_SPACE.
9235 Make the move a load if RESTORE_P, otherwise make it a store. */
9236
9237 static rtx
9238 mips16e_save_restore_reg (bool restore_p, bool reg_parm_p,
9239 HOST_WIDE_INT offset, unsigned int regno)
9240 {
9241 rtx reg, mem;
9242
9243 mem = gen_frame_mem (SImode, plus_constant (Pmode, stack_pointer_rtx,
9244 offset));
9245 reg = gen_rtx_REG (SImode, regno);
9246 if (restore_p)
9247 {
9248 mips_add_cfa_restore (reg);
9249 return gen_rtx_SET (VOIDmode, reg, mem);
9250 }
9251 if (reg_parm_p)
9252 return gen_rtx_SET (VOIDmode, mem, reg);
9253 return mips_frame_set (mem, reg);
9254 }
9255
9256 /* Return RTL for a MIPS16e SAVE or RESTORE instruction; RESTORE_P says which.
9257 The instruction must:
9258
9259 - Allocate or deallocate SIZE bytes in total; SIZE is known
9260 to be nonzero.
9261
9262 - Save or restore as many registers in *MASK_PTR as possible.
9263 The instruction saves the first registers at the top of the
9264 allocated area, with the other registers below it.
9265
9266 - Save NARGS argument registers above the allocated area.
9267
9268 (NARGS is always zero if RESTORE_P.)
9269
9270 The SAVE and RESTORE instructions cannot save and restore all general
9271 registers, so there may be some registers left over for the caller to
9272 handle. Destructively modify *MASK_PTR so that it contains the registers
9273 that still need to be saved or restored. The caller can save these
9274 registers in the memory immediately below *OFFSET_PTR, which is a
9275 byte offset from the bottom of the allocated stack area. */
9276
9277 static rtx
9278 mips16e_build_save_restore (bool restore_p, unsigned int *mask_ptr,
9279 HOST_WIDE_INT *offset_ptr, unsigned int nargs,
9280 HOST_WIDE_INT size)
9281 {
9282 rtx pattern, set;
9283 HOST_WIDE_INT offset, top_offset;
9284 unsigned int i, regno;
9285 int n;
9286
9287 gcc_assert (cfun->machine->frame.num_fp == 0);
9288
9289 /* Calculate the number of elements in the PARALLEL. We need one element
9290 for the stack adjustment, one for each argument register save, and one
9291 for each additional register move. */
9292 n = 1 + nargs;
9293 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
9294 if (BITSET_P (*mask_ptr, mips16e_save_restore_regs[i]))
9295 n++;
9296
9297 /* Create the final PARALLEL. */
9298 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (n));
9299 n = 0;
9300
9301 /* Add the stack pointer adjustment. */
9302 set = gen_rtx_SET (VOIDmode, stack_pointer_rtx,
9303 plus_constant (Pmode, stack_pointer_rtx,
9304 restore_p ? size : -size));
9305 RTX_FRAME_RELATED_P (set) = 1;
9306 XVECEXP (pattern, 0, n++) = set;
9307
9308 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
9309 top_offset = restore_p ? size : 0;
9310
9311 /* Save the arguments. */
9312 for (i = 0; i < nargs; i++)
9313 {
9314 offset = top_offset + i * UNITS_PER_WORD;
9315 set = mips16e_save_restore_reg (restore_p, true, offset,
9316 GP_ARG_FIRST + i);
9317 XVECEXP (pattern, 0, n++) = set;
9318 }
9319
9320 /* Then fill in the other register moves. */
9321 offset = top_offset;
9322 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
9323 {
9324 regno = mips16e_save_restore_regs[i];
9325 if (BITSET_P (*mask_ptr, regno))
9326 {
9327 offset -= UNITS_PER_WORD;
9328 set = mips16e_save_restore_reg (restore_p, false, offset, regno);
9329 XVECEXP (pattern, 0, n++) = set;
9330 *mask_ptr &= ~(1 << regno);
9331 }
9332 }
9333
9334 /* Tell the caller what offset it should use for the remaining registers. */
9335 *offset_ptr = size + (offset - top_offset);
9336
9337 gcc_assert (n == XVECLEN (pattern, 0));
9338
9339 return pattern;
9340 }
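
/* For a SAVE, the PARALLEL built above therefore looks something like:

	(parallel [(set $sp (plus $sp (const_int -SIZE)))
		   (set (mem (plus $sp TOP)) (reg $4))	  ;; argument saves
		   (set (mem (plus $sp OFF)) (reg $31))	  ;; other saves
		   ...])

where TOP and OFF stand for the offsets computed above; a RESTORE
adds SIZE instead and uses loads rather than stores. */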
9341
9342 /* PATTERN is a PARALLEL whose first element adds ADJUST to the stack
9343 pointer. Return true if PATTERN matches the kind of instruction
9344 generated by mips16e_build_save_restore. If INFO is nonnull,
9345 initialize it when returning true. */
9346
9347 bool
9348 mips16e_save_restore_pattern_p (rtx pattern, HOST_WIDE_INT adjust,
9349 struct mips16e_save_restore_info *info)
9350 {
9351 unsigned int i, nargs, mask, extra;
9352 HOST_WIDE_INT top_offset, save_offset, offset;
9353 rtx set, reg, mem, base;
9354 int n;
9355
9356 if (!GENERATE_MIPS16E_SAVE_RESTORE)
9357 return false;
9358
9359 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
9360 top_offset = adjust > 0 ? adjust : 0;
9361
9362 /* Interpret all other members of the PARALLEL. */
9363 save_offset = top_offset - UNITS_PER_WORD;
9364 mask = 0;
9365 nargs = 0;
9366 i = 0;
9367 for (n = 1; n < XVECLEN (pattern, 0); n++)
9368 {
9369 /* Check that we have a SET. */
9370 set = XVECEXP (pattern, 0, n);
9371 if (GET_CODE (set) != SET)
9372 return false;
9373
9374 /* Check that the SET is a load (if restoring) or a store
9375 (if saving). */
9376 mem = adjust > 0 ? SET_SRC (set) : SET_DEST (set);
9377 if (!MEM_P (mem))
9378 return false;
9379
9380 /* Check that the address is the sum of the stack pointer and a
9381 possibly-zero constant offset. */
9382 mips_split_plus (XEXP (mem, 0), &base, &offset);
9383 if (base != stack_pointer_rtx)
9384 return false;
9385
9386 /* Check that SET's other operand is a register. */
9387 reg = adjust > 0 ? SET_DEST (set) : SET_SRC (set);
9388 if (!REG_P (reg))
9389 return false;
9390
9391 /* Check for argument saves. */
9392 if (offset == top_offset + nargs * UNITS_PER_WORD
9393 && REGNO (reg) == GP_ARG_FIRST + nargs)
9394 nargs++;
9395 else if (offset == save_offset)
9396 {
9397 while (mips16e_save_restore_regs[i++] != REGNO (reg))
9398 if (i == ARRAY_SIZE (mips16e_save_restore_regs))
9399 return false;
9400
9401 mask |= 1 << REGNO (reg);
9402 save_offset -= UNITS_PER_WORD;
9403 }
9404 else
9405 return false;
9406 }
9407
9408 /* Check that the restrictions on register ranges are met. */
9409 extra = 0;
9410 mips16e_mask_registers (&mask, mips16e_s2_s8_regs,
9411 ARRAY_SIZE (mips16e_s2_s8_regs), &extra);
9412 mips16e_mask_registers (&mask, mips16e_a0_a3_regs,
9413 ARRAY_SIZE (mips16e_a0_a3_regs), &extra);
9414 if (extra != 0)
9415 return false;
9416
9417 /* Make sure that the topmost argument register is not saved twice.
9418 The checks above ensure that the same is then true for the other
9419 argument registers. */
9420 if (nargs > 0 && BITSET_P (mask, GP_ARG_FIRST + nargs - 1))
9421 return false;
9422
9423 /* Pass back information, if requested. */
9424 if (info)
9425 {
9426 info->nargs = nargs;
9427 info->mask = mask;
9428 info->size = (adjust > 0 ? adjust : -adjust);
9429 }
9430
9431 return true;
9432 }
9433
9434 /* Add a MIPS16e SAVE or RESTORE register-range argument to string S
9435 for the register range [MIN_REG, MAX_REG]. Return a pointer to
9436 the null terminator. */
9437
9438 static char *
9439 mips16e_add_register_range (char *s, unsigned int min_reg,
9440 unsigned int max_reg)
9441 {
9442 if (min_reg != max_reg)
9443 s += sprintf (s, ",%s-%s", reg_names[min_reg], reg_names[max_reg]);
9444 else
9445 s += sprintf (s, ",%s", reg_names[min_reg]);
9446 return s;
9447 }
9448
9449 /* Return the assembly instruction for a MIPS16e SAVE or RESTORE instruction.
9450 PATTERN and ADJUST are as for mips16e_save_restore_pattern_p. */
9451
9452 const char *
9453 mips16e_output_save_restore (rtx pattern, HOST_WIDE_INT adjust)
9454 {
9455 static char buffer[300];
9456
9457 struct mips16e_save_restore_info info;
9458 unsigned int i, end;
9459 char *s;
9460
9461 /* Parse the pattern. */
9462 if (!mips16e_save_restore_pattern_p (pattern, adjust, &info))
9463 gcc_unreachable ();
9464
9465 /* Add the mnemonic. */
9466 s = strcpy (buffer, adjust > 0 ? "restore\t" : "save\t");
9467 s += strlen (s);
9468
9469 /* Save the arguments. */
9470 if (info.nargs > 1)
9471 s += sprintf (s, "%s-%s,", reg_names[GP_ARG_FIRST],
9472 reg_names[GP_ARG_FIRST + info.nargs - 1]);
9473 else if (info.nargs == 1)
9474 s += sprintf (s, "%s,", reg_names[GP_ARG_FIRST]);
9475
9476 /* Emit the amount of stack space to allocate or deallocate. */
9477 s += sprintf (s, "%d", (int) info.size);
9478
9479 /* Save or restore $16. */
9480 if (BITSET_P (info.mask, 16))
9481 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 16]);
9482
9483 /* Save or restore $17. */
9484 if (BITSET_P (info.mask, 17))
9485 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 17]);
9486
9487 /* Save or restore registers in the range $s2...$s8, which
9488 mips16e_s2_s8_regs lists in decreasing order. Note that this
9489 is a software register range; the hardware registers are not
9490 numbered consecutively. */
9491 end = ARRAY_SIZE (mips16e_s2_s8_regs);
9492 i = mips16e_find_first_register (info.mask, mips16e_s2_s8_regs, end);
9493 if (i < end)
9494 s = mips16e_add_register_range (s, mips16e_s2_s8_regs[end - 1],
9495 mips16e_s2_s8_regs[i]);
9496
9497 /* Save or restore registers in the range $a0...$a3. */
9498 end = ARRAY_SIZE (mips16e_a0_a3_regs);
9499 i = mips16e_find_first_register (info.mask, mips16e_a0_a3_regs, end);
9500 if (i < end)
9501 s = mips16e_add_register_range (s, mips16e_a0_a3_regs[i],
9502 mips16e_a0_a3_regs[end - 1]);
9503
9504 /* Save or restore $31. */
9505 if (BITSET_P (info.mask, RETURN_ADDR_REGNUM))
9506 s += sprintf (s, ",%s", reg_names[RETURN_ADDR_REGNUM]);
9507
9508 return buffer;
9509 }
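
/* For example, a SAVE with two argument saves, a 32-byte adjustment and
a mask containing $16, $17 and $31 might be output as something like:

	save	$4-$5,32,$16,$17,$31

(the exact names depend on the target's REGISTER_NAMES). */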
9510 \f
9511 /* Return true if the current function returns its value in a floating-point
9512 register in MIPS16 mode. */
9513
9514 static bool
9515 mips16_cfun_returns_in_fpr_p (void)
9516 {
9517 tree return_type = DECL_RESULT (current_function_decl);
9518 return (TARGET_MIPS16
9519 && TARGET_HARD_FLOAT_ABI
9520 && !aggregate_value_p (return_type, current_function_decl)
9521 && mips_return_mode_in_fpr_p (DECL_MODE (return_type)));
9522 }
9523
9524 /* Return true if predicate PRED is true for at least one instruction.
9525 Cache the result in *CACHE, and assume that the result is true
9526 if *CACHE is already true. */
9527
9528 static bool
9529 mips_find_gp_ref (bool *cache, bool (*pred) (rtx_insn *))
9530 {
9531 rtx_insn *insn;
9532
9533 if (!*cache)
9534 {
9535 push_topmost_sequence ();
9536 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
9537 if (USEFUL_INSN_P (insn) && pred (insn))
9538 {
9539 *cache = true;
9540 break;
9541 }
9542 pop_topmost_sequence ();
9543 }
9544 return *cache;
9545 }
9546
9547 /* Return true if INSN refers to the global pointer in an "inflexible" way.
9548 See mips_cfun_has_inflexible_gp_ref_p for details. */
9549
9550 static bool
9551 mips_insn_has_inflexible_gp_ref_p (rtx_insn *insn)
9552 {
9553 /* Uses of pic_offset_table_rtx in CALL_INSN_FUNCTION_USAGE
9554 indicate that the target could be a traditional MIPS
9555 lazy-binding stub. */
9556 return find_reg_fusage (insn, USE, pic_offset_table_rtx);
9557 }
9558
9559 /* Return true if the current function refers to the global pointer
9560 in a way that forces $28 to be valid. This means that we can't
9561 change the choice of global pointer, even for NewABI code.
9562
9563 One example of this (and one which needs several checks) is that
9564 $28 must be valid when calling traditional MIPS lazy-binding stubs.
9565 (This restriction does not apply to PLTs.) */
9566
9567 static bool
9568 mips_cfun_has_inflexible_gp_ref_p (void)
9569 {
9570 /* If the function has a nonlocal goto, $28 must hold the correct
9571 global pointer for the target function. That is, the target
9572 of the goto implicitly uses $28. */
9573 if (crtl->has_nonlocal_goto)
9574 return true;
9575
9576 if (TARGET_ABICALLS_PIC2)
9577 {
9578 /* Symbolic accesses implicitly use the global pointer unless
9579 -mexplicit-relocs is in effect. JAL macros to symbolic addresses
9580 might go to traditional MIPS lazy-binding stubs. */
9581 if (!TARGET_EXPLICIT_RELOCS)
9582 return true;
9583
9584 /* FUNCTION_PROFILER includes a JAL to _mcount, which again
9585 can be lazily-bound. */
9586 if (crtl->profile)
9587 return true;
9588
9589 /* MIPS16 functions that return in FPRs need to call an
9590 external libgcc routine. This call is only made explicit
9591 during mips_expand_epilogue, and it too might be lazily bound. */
9592 if (mips16_cfun_returns_in_fpr_p ())
9593 return true;
9594 }
9595
9596 return mips_find_gp_ref (&cfun->machine->has_inflexible_gp_insn_p,
9597 mips_insn_has_inflexible_gp_ref_p);
9598 }
9599
9600 /* Return true if INSN refers to the global pointer in a "flexible" way.
9601 See mips_cfun_has_flexible_gp_ref_p for details. */
9602
9603 static bool
9604 mips_insn_has_flexible_gp_ref_p (rtx_insn *insn)
9605 {
9606 return (get_attr_got (insn) != GOT_UNSET
9607 || mips_small_data_pattern_p (PATTERN (insn))
9608 || reg_overlap_mentioned_p (pic_offset_table_rtx, PATTERN (insn)));
9609 }
9610
9611 /* Return true if the current function references the global pointer,
9612 but those references do not inherently require the global pointer
9613 to be $28. Assume !mips_cfun_has_inflexible_gp_ref_p (). */
9614
9615 static bool
9616 mips_cfun_has_flexible_gp_ref_p (void)
9617 {
9618 /* Reload can sometimes introduce constant pool references
9619 into a function that otherwise didn't need them. For example,
9620 suppose we have an instruction like:
9621
9622 (set (reg:DF R1) (float:DF (reg:SI R2)))
9623
9624 If R2 turns out to be a constant such as 1, the instruction may
9625 have a REG_EQUAL note saying that R1 == 1.0. Reload then has
9626 the option of using this constant if R2 doesn't get allocated
9627 to a register.
9628
9629 In cases like these, reload will have added the constant to the
9630 pool but no instruction will yet refer to it. */
9631 if (TARGET_ABICALLS_PIC2 && !reload_completed && crtl->uses_const_pool)
9632 return true;
9633
9634 return mips_find_gp_ref (&cfun->machine->has_flexible_gp_insn_p,
9635 mips_insn_has_flexible_gp_ref_p);
9636 }
9637
9638 /* Return the register that should be used as the global pointer
9639 within this function. Return INVALID_REGNUM if the function
9640 doesn't need a global pointer. */
9641
9642 static unsigned int
9643 mips_global_pointer (void)
9644 {
9645 unsigned int regno;
9646
9647 /* $gp is always available unless we're using a GOT. */
9648 if (!TARGET_USE_GOT)
9649 return GLOBAL_POINTER_REGNUM;
9650
9651 /* If there are inflexible references to $gp, we must use the
9652 standard register. */
9653 if (mips_cfun_has_inflexible_gp_ref_p ())
9654 return GLOBAL_POINTER_REGNUM;
9655
9656 /* If there are no current references to $gp, then the only uses
9657 we can introduce later are those involved in long branches. */
9658 if (TARGET_ABSOLUTE_JUMPS && !mips_cfun_has_flexible_gp_ref_p ())
9659 return INVALID_REGNUM;
9660
9661 /* If the global pointer is call-saved, try to use a call-clobbered
9662 alternative. */
9663 if (TARGET_CALL_SAVED_GP && crtl->is_leaf)
9664 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
9665 if (!df_regs_ever_live_p (regno)
9666 && call_really_used_regs[regno]
9667 && !fixed_regs[regno]
9668 && regno != PIC_FUNCTION_ADDR_REGNUM)
9669 return regno;
9670
9671 return GLOBAL_POINTER_REGNUM;
9672 }
9673
9674 /* Return true if the current function's prologue must load the global
9675 pointer value into pic_offset_table_rtx and store the same value in
9676 the function's cprestore slot (if any).
9677
9678 One problem we have to deal with is that, when emitting GOT-based
9679 position independent code, long-branch sequences will need to load
9680 the address of the branch target from the GOT. We don't know until
9681 the very end of compilation whether (and where) the function needs
9682 long branches, so we must ensure that _any_ branch can access the
9683 global pointer in some form. However, we do not want to pessimize
9684 the usual case in which all branches are short.
9685
9686 We handle this as follows:
9687
9688 (1) During reload, we set cfun->machine->global_pointer to
9689 INVALID_REGNUM if we _know_ that the current function
9690 doesn't need a global pointer. This is only valid if
9691 long branches don't need the GOT.
9692
9693 Otherwise, we assume that we might need a global pointer
9694 and pick an appropriate register.
9695
9696 (2) If cfun->machine->global_pointer != INVALID_REGNUM,
9697 we ensure that the global pointer is available at every
9698 block boundary bar entry and exit. We do this in one of two ways:
9699
9700 - If the function has a cprestore slot, we ensure that this
9701 slot is valid at every branch. However, as explained in
9702 point (6) below, there is no guarantee that pic_offset_table_rtx
9703 itself is valid if new uses of the global pointer are introduced
9704 after the first post-epilogue split.
9705
9706 We guarantee that the cprestore slot is valid by loading it
9707 into a fake register, CPRESTORE_SLOT_REGNUM. We then make
9708 this register live at every block boundary bar function entry
9709 and exit. It is then invalid to move the load (and thus the
9710 preceding store) across a block boundary.
9711
9712 - If the function has no cprestore slot, we guarantee that
9713 pic_offset_table_rtx itself is valid at every branch.
9714
9715 See mips_eh_uses for the handling of the register liveness.
9716
9717 (3) During prologue and epilogue generation, we emit "ghost"
9718 placeholder instructions to manipulate the global pointer.
9719
9720 (4) During prologue generation, we set cfun->machine->must_initialize_gp_p
9721 and cfun->machine->must_restore_gp_when_clobbered_p if we already know
9722 that the function needs a global pointer. (There is no need to set
9723 them earlier than this, and doing it as late as possible leads to
9724 fewer false positives.)
9725
9726 (5) If cfun->machine->must_initialize_gp_p is true during a
9727 split_insns pass, we split the ghost instructions into real
9728 instructions. These split instructions can then be optimized in
9729 the usual way. Otherwise, we keep the ghost instructions intact,
9730 and optimize for the case where they aren't needed. We still
9731 have the option of splitting them later, if we need to introduce
9732 new uses of the global pointer.
9733
9734 For example, the scheduler ignores a ghost instruction that
9735 stores $28 to the stack, but it handles the split form of
9736 the ghost instruction as an ordinary store.
9737
9738 (6) [OldABI only.] If cfun->machine->must_restore_gp_when_clobbered_p
9739 is true during the first post-epilogue split_insns pass, we split
9740 calls and restore_gp patterns into instructions that explicitly
9741 load pic_offset_table_rtx from the cprestore slot. Otherwise,
9742 we split these patterns into instructions that _don't_ load from
9743 the cprestore slot.
9744
9745 If cfun->machine->must_restore_gp_when_clobbered_p is true at the
9746 time of the split, then any instructions that exist at that time
9747 can make free use of pic_offset_table_rtx. However, if we want
9748 to introduce new uses of the global pointer after the split,
9749 we must explicitly load the value from the cprestore slot, since
9750 pic_offset_table_rtx itself might not be valid at a given point
9751 in the function.
9752
9753 The idea is that we want to be able to delete redundant
9754 loads from the cprestore slot in the usual case where no
9755 long branches are needed.
9756
9757 (7) If cfun->machine->must_initialize_gp_p is still false at the end
9758 of md_reorg, we decide whether the global pointer is needed for
9759 long branches. If so, we set cfun->machine->must_initialize_gp_p
9760 to true and split the ghost instructions into real instructions
9761 at that stage.
9762
9763 Note that the ghost instructions must have a zero length for three reasons:
9764
9765 - Giving the length of the underlying $gp sequence might cause
9766 us to use long branches in cases where they aren't really needed.
9767
9768 - They would perturb things like alignment calculations.
9769
9770 - More importantly, the hazard detection in md_reorg relies on
9771 empty instructions having a zero length.
9772
9773 If we find a long branch and split the ghost instructions at the
9774 end of md_reorg, the split could introduce more long branches.
9775 That isn't a problem though, because we still do the split before
9776 the final shorten_branches pass.
9777
9778 This is extremely ugly, but it seems like the best compromise between
9779 correctness and efficiency. */
9780
9781 bool
9782 mips_must_initialize_gp_p (void)
9783 {
9784 return cfun->machine->must_initialize_gp_p;
9785 }
9786
9787 /* Return true if REGNO is a register that is ordinarily call-clobbered
9788 but must nevertheless be preserved by an interrupt handler. */
9789
9790 static bool
9791 mips_interrupt_extra_call_saved_reg_p (unsigned int regno)
9792 {
9793 if (MD_REG_P (regno))
9794 return true;
9795
9796 if (TARGET_DSP && DSP_ACC_REG_P (regno))
9797 return true;
9798
9799 if (GP_REG_P (regno) && !cfun->machine->use_shadow_register_set_p)
9800 {
9801 /* $0 is hard-wired. */
9802 if (regno == GP_REG_FIRST)
9803 return false;
9804
9805 /* The interrupt handler can treat kernel registers as
9806 scratch registers. */
9807 if (KERNEL_REG_P (regno))
9808 return false;
9809
9810 /* The function will return the stack pointer to its original value
9811 anyway. */
9812 if (regno == STACK_POINTER_REGNUM)
9813 return false;
9814
9815 /* Otherwise, return true for registers that aren't ordinarily
9816 call-clobbered. */
9817 return call_really_used_regs[regno];
9818 }
9819
9820 return false;
9821 }
9822
9823 /* Return true if the current function should treat register REGNO
9824 as call-saved. */
9825
9826 static bool
9827 mips_cfun_call_saved_reg_p (unsigned int regno)
9828 {
9829 /* If the user makes an ordinarily-call-saved register global,
9830 that register is no longer call-saved. */
9831 if (global_regs[regno])
9832 return false;
9833
9834 /* Interrupt handlers need to save extra registers. */
9835 if (cfun->machine->interrupt_handler_p
9836 && mips_interrupt_extra_call_saved_reg_p (regno))
9837 return true;
9838
9839 /* call_insns preserve $28 unless they explicitly say otherwise,
9840 so call_really_used_regs[] treats $28 as call-saved. However,
9841 we want the ABI property rather than the default call_insn
9842 property here. */
9843 return (regno == GLOBAL_POINTER_REGNUM
9844 ? TARGET_CALL_SAVED_GP
9845 : !call_really_used_regs[regno]);
9846 }
9847
9848 /* Return true if the function body might clobber register REGNO.
9849 We know that REGNO is call-saved. */
9850
9851 static bool
9852 mips_cfun_might_clobber_call_saved_reg_p (unsigned int regno)
9853 {
9854 /* Some functions should be treated as clobbering all call-saved
9855 registers. */
9856 if (crtl->saves_all_registers)
9857 return true;
9858
9859 /* DF handles cases where a register is explicitly referenced in
9860 the rtl. Incoming values are passed in call-clobbered registers,
9861 so we can assume that any live call-saved register is set within
9862 the function. */
9863 if (df_regs_ever_live_p (regno))
9864 return true;
9865
9866 /* Check for registers that are clobbered by FUNCTION_PROFILER.
9867 These clobbers are not explicit in the rtl. */
9868 if (crtl->profile && MIPS_SAVE_REG_FOR_PROFILING_P (regno))
9869 return true;
9870
9871 /* If we're using a call-saved global pointer, the function's
9872 prologue will need to set it up. */
9873 if (cfun->machine->global_pointer == regno)
9874 return true;
9875
9876 /* The function's prologue will need to set the frame pointer if
9877 frame_pointer_needed. */
9878 if (regno == HARD_FRAME_POINTER_REGNUM && frame_pointer_needed)
9879 return true;
9880
9881 /* If a MIPS16 function returns a value in FPRs, its epilogue
9882 will need to call an external libgcc routine. This yet-to-be
9883 generated call_insn will clobber $31. */
9884 if (regno == RETURN_ADDR_REGNUM && mips16_cfun_returns_in_fpr_p ())
9885 return true;
9886
9887 /* If REGNO is ordinarily call-clobbered, we must assume that any
9888 called function could modify it. */
9889 if (cfun->machine->interrupt_handler_p
9890 && !crtl->is_leaf
9891 && mips_interrupt_extra_call_saved_reg_p (regno))
9892 return true;
9893
9894 return false;
9895 }
9896
9897 /* Return true if the current function must save register REGNO. */
9898
9899 static bool
9900 mips_save_reg_p (unsigned int regno)
9901 {
9902 if (mips_cfun_call_saved_reg_p (regno))
9903 {
9904 if (mips_cfun_might_clobber_call_saved_reg_p (regno))
9905 return true;
9906
9907 /* Save both registers in an FPR pair if either one is used. This is
9908 needed for the case when MIN_FPRS_PER_FMT == 1, which allows the odd
9909 register to be used without the even register. */
9910 if (FP_REG_P (regno)
9911 && MAX_FPRS_PER_FMT == 2
9912 && mips_cfun_might_clobber_call_saved_reg_p (regno + 1))
9913 return true;
9914 }
9915
9916 /* We need to save the incoming return address if __builtin_eh_return
9917 is being used to set a different return address. */
9918 if (regno == RETURN_ADDR_REGNUM && crtl->calls_eh_return)
9919 return true;
9920
9921 return false;
9922 }
9923
9924 /* Populate the current function's mips_frame_info structure.
9925
9926 MIPS stack frames look like:
9927
9928 +-------------------------------+
9929 | |
9930 | incoming stack arguments |
9931 | |
9932 +-------------------------------+
9933 | |
9934 | caller-allocated save area |
9935 A | for register arguments |
9936 | |
9937 +-------------------------------+ <-- incoming stack pointer
9938 | |
9939 | callee-allocated save area |
9940 B | for arguments that are |
9941 | split between registers and |
9942 | the stack |
9943 | |
9944 +-------------------------------+ <-- arg_pointer_rtx
9945 | |
9946 C | callee-allocated save area |
9947 | for register varargs |
9948 | |
9949 +-------------------------------+ <-- frame_pointer_rtx
9950 | | + cop0_sp_offset
9951 | COP0 reg save area | + UNITS_PER_WORD
9952 | |
9953 +-------------------------------+ <-- frame_pointer_rtx + acc_sp_offset
9954 | | + UNITS_PER_WORD
9955 | accumulator save area |
9956 | |
9957 +-------------------------------+ <-- stack_pointer_rtx + fp_sp_offset
9958 | | + UNITS_PER_HWFPVALUE
9959 | FPR save area |
9960 | |
9961 +-------------------------------+ <-- stack_pointer_rtx + gp_sp_offset
9962 | | + UNITS_PER_WORD
9963 | GPR save area |
9964 | |
9965 +-------------------------------+ <-- frame_pointer_rtx with
9966 | | \ -fstack-protector
9967 | local variables | | var_size
9968 | | /
9969 +-------------------------------+
9970 | | \
9971 | $gp save area | | cprestore_size
9972 | | /
9973 P +-------------------------------+ <-- hard_frame_pointer_rtx for
9974 | | \ MIPS16 code
9975 | outgoing stack arguments | |
9976 | | |
9977 +-------------------------------+ | args_size
9978 | | |
9979 | caller-allocated save area | |
9980 | for register arguments | |
9981 | | /
9982 +-------------------------------+ <-- stack_pointer_rtx
9983 frame_pointer_rtx without
9984 -fstack-protector
9985 hard_frame_pointer_rtx for
9986 non-MIPS16 code.
9987
9988 At least two of A, B and C will be empty.
9989
9990 Dynamic stack allocations such as alloca insert data at point P.
9991 They decrease stack_pointer_rtx but leave frame_pointer_rtx and
9992 hard_frame_pointer_rtx unchanged. */
9993
9994 static void
9995 mips_compute_frame_info (void)
9996 {
9997 struct mips_frame_info *frame;
9998 HOST_WIDE_INT offset, size;
9999 unsigned int regno, i;
10000
10001 /* Set this function's interrupt properties. */
10002 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
10003 {
10004 if (mips_isa_rev < 2)
10005 error ("the %<interrupt%> attribute requires a MIPS32r2 processor or greater");
10006 else if (TARGET_HARD_FLOAT)
10007 error ("the %<interrupt%> attribute requires %<-msoft-float%>");
10008 else if (TARGET_MIPS16)
10009 error ("interrupt handlers cannot be MIPS16 functions");
10010 else
10011 {
10012 cfun->machine->interrupt_handler_p = true;
10013 cfun->machine->use_shadow_register_set_p =
10014 mips_use_shadow_register_set_p (TREE_TYPE (current_function_decl));
10015 cfun->machine->keep_interrupts_masked_p =
10016 mips_keep_interrupts_masked_p (TREE_TYPE (current_function_decl));
10017 cfun->machine->use_debug_exception_return_p =
10018 mips_use_debug_exception_return_p (TREE_TYPE
10019 (current_function_decl));
10020 }
10021 }
10022
10023 frame = &cfun->machine->frame;
10024 memset (frame, 0, sizeof (*frame));
10025 size = get_frame_size ();
10026
10027 cfun->machine->global_pointer = mips_global_pointer ();
10028
10029 /* The first two blocks contain the outgoing argument area and the $gp save
10030 slot. This area isn't needed in leaf functions, but if the
10031 target-independent frame size is nonzero, we have already committed to
10032 allocating these in STARTING_FRAME_OFFSET for !FRAME_GROWS_DOWNWARD. */
10033 if ((size == 0 || FRAME_GROWS_DOWNWARD) && crtl->is_leaf)
10034 {
10035 /* The MIPS 3.0 linker does not like functions that dynamically
10036 allocate the stack and have 0 for STACK_DYNAMIC_OFFSET, since it
10037 looks like we are trying to create a second frame pointer to the
10038 function. Allocate some stack space to make it happy. */
10039 if (cfun->calls_alloca)
10040 frame->args_size = REG_PARM_STACK_SPACE (cfun->decl);
10041 else
10042 frame->args_size = 0;
10043 frame->cprestore_size = 0;
10044 }
10045 else
10046 {
10047 frame->args_size = crtl->outgoing_args_size;
10048 frame->cprestore_size = MIPS_GP_SAVE_AREA_SIZE;
10049 }
10050 offset = frame->args_size + frame->cprestore_size;
10051
10052 /* Move above the local variables. */
10053 frame->var_size = MIPS_STACK_ALIGN (size);
10054 offset += frame->var_size;
10055
10056 /* Find out which GPRs we need to save. */
10057 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
10058 if (mips_save_reg_p (regno))
10059 {
10060 frame->num_gp++;
10061 frame->mask |= 1 << (regno - GP_REG_FIRST);
10062 }
10063
10064 /* If this function calls eh_return, we must also save and restore the
10065 EH data registers. */
10066 if (crtl->calls_eh_return)
10067 for (i = 0; EH_RETURN_DATA_REGNO (i) != INVALID_REGNUM; i++)
10068 {
10069 frame->num_gp++;
10070 frame->mask |= 1 << (EH_RETURN_DATA_REGNO (i) - GP_REG_FIRST);
10071 }
10072
10073 /* The MIPS16e SAVE and RESTORE instructions have two ranges of registers:
10074 $a3-$a0 and $s2-$s8. If we save one register in the range, we must
10075 save all later registers too. */
10076 if (GENERATE_MIPS16E_SAVE_RESTORE)
10077 {
10078 mips16e_mask_registers (&frame->mask, mips16e_s2_s8_regs,
10079 ARRAY_SIZE (mips16e_s2_s8_regs), &frame->num_gp);
10080 mips16e_mask_registers (&frame->mask, mips16e_a0_a3_regs,
10081 ARRAY_SIZE (mips16e_a0_a3_regs), &frame->num_gp);
10082 }
10083
10084 /* Move above the GPR save area. */
10085 if (frame->num_gp > 0)
10086 {
10087 offset += MIPS_STACK_ALIGN (frame->num_gp * UNITS_PER_WORD);
10088 frame->gp_sp_offset = offset - UNITS_PER_WORD;
10089 }
10090
10091 /* Find out which FPRs we need to save. This loop must iterate over
10092 the same space as its companion in mips_for_each_saved_gpr_and_fpr. */
10093 if (TARGET_HARD_FLOAT)
10094 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno += MAX_FPRS_PER_FMT)
10095 if (mips_save_reg_p (regno))
10096 {
10097 frame->num_fp += MAX_FPRS_PER_FMT;
10098 frame->fmask |= ~(~0 << MAX_FPRS_PER_FMT) << (regno - FP_REG_FIRST);
10099 }
10100
10101 /* Move above the FPR save area. */
10102 if (frame->num_fp > 0)
10103 {
10104 offset += MIPS_STACK_ALIGN (frame->num_fp * UNITS_PER_FPREG);
10105 frame->fp_sp_offset = offset - UNITS_PER_HWFPVALUE;
10106 }
10107
10108 /* Add in space for the interrupt context information. */
10109 if (cfun->machine->interrupt_handler_p)
10110 {
10111 /* Check HI/LO. */
10112 if (mips_save_reg_p (LO_REGNUM) || mips_save_reg_p (HI_REGNUM))
10113 {
10114 frame->num_acc++;
10115 frame->acc_mask |= (1 << 0);
10116 }
10117
10118 /* Check accumulators 1, 2, 3. */
10119 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
10120 if (mips_save_reg_p (i) || mips_save_reg_p (i + 1))
10121 {
10122 frame->num_acc++;
10123 frame->acc_mask |= 1 << (((i - DSP_ACC_REG_FIRST) / 2) + 1);
10124 }
10125
10126 /* All interrupt context functions need space to preserve STATUS. */
10127 frame->num_cop0_regs++;
10128
10129 /* If we don't keep interrupts masked, we need to save EPC. */
10130 if (!cfun->machine->keep_interrupts_masked_p)
10131 frame->num_cop0_regs++;
10132 }
10133
10134 /* Move above the accumulator save area. */
10135 if (frame->num_acc > 0)
10136 {
10137 /* Each accumulator needs 2 words. */
10138 offset += frame->num_acc * 2 * UNITS_PER_WORD;
10139 frame->acc_sp_offset = offset - UNITS_PER_WORD;
10140 }
10141
10142 /* Move above the COP0 register save area. */
10143 if (frame->num_cop0_regs > 0)
10144 {
10145 offset += frame->num_cop0_regs * UNITS_PER_WORD;
10146 frame->cop0_sp_offset = offset - UNITS_PER_WORD;
10147 }
10148
10149 /* Move above the callee-allocated varargs save area. */
10150 offset += MIPS_STACK_ALIGN (cfun->machine->varargs_size);
10151 frame->arg_pointer_offset = offset;
10152
10153 /* Move above the callee-allocated area for pretend stack arguments. */
10154 offset += crtl->args.pretend_args_size;
10155 frame->total_size = offset;
10156
10157 /* Work out the offsets of the save areas from the top of the frame. */
10158 if (frame->gp_sp_offset > 0)
10159 frame->gp_save_offset = frame->gp_sp_offset - offset;
10160 if (frame->fp_sp_offset > 0)
10161 frame->fp_save_offset = frame->fp_sp_offset - offset;
10162 if (frame->acc_sp_offset > 0)
10163 frame->acc_save_offset = frame->acc_sp_offset - offset;
10164 if (frame->num_cop0_regs > 0)
10165 frame->cop0_save_offset = frame->cop0_sp_offset - offset;
10166
10167 /* MIPS16 code offsets the frame pointer by the size of the outgoing
10168 arguments. This tends to increase the chances of using unextended
10169 instructions for local variables and incoming arguments. */
10170 if (TARGET_MIPS16)
10171 frame->hard_frame_pointer_offset = frame->args_size;
10172 }
10173
10174 /* Return the style of GP load sequence that is being used for the
10175 current function. */
10176
10177 enum mips_loadgp_style
10178 mips_current_loadgp_style (void)
10179 {
10180 if (!TARGET_USE_GOT || cfun->machine->global_pointer == INVALID_REGNUM)
10181 return LOADGP_NONE;
10182
10183 if (TARGET_RTP_PIC)
10184 return LOADGP_RTP;
10185
10186 if (TARGET_ABSOLUTE_ABICALLS)
10187 return LOADGP_ABSOLUTE;
10188
10189 return TARGET_NEWABI ? LOADGP_NEWABI : LOADGP_OLDABI;
10190 }
10191
10192 /* Implement TARGET_FRAME_POINTER_REQUIRED. */
10193
10194 static bool
10195 mips_frame_pointer_required (void)
10196 {
10197 /* If the function contains dynamic stack allocations, we need to
10198 use the frame pointer to access the static parts of the frame. */
10199 if (cfun->calls_alloca)
10200 return true;
10201
10202 /* In MIPS16 mode, we need a frame pointer for a large frame; otherwise,
10203 reload may be unable to compute the address of a local variable,
10204 since there is no way to add a large constant to the stack pointer
10205 without using a second temporary register. */
10206 if (TARGET_MIPS16)
10207 {
10208 mips_compute_frame_info ();
10209 if (!SMALL_OPERAND (cfun->machine->frame.total_size))
10210 return true;
10211 }
10212
10213 return false;
10214 }
10215
10216 /* Make sure that we're not trying to eliminate to the wrong hard frame
10217 pointer. */
10218
10219 static bool
10220 mips_can_eliminate (const int from ATTRIBUTE_UNUSED, const int to)
10221 {
10222 return (to == HARD_FRAME_POINTER_REGNUM || to == STACK_POINTER_REGNUM);
10223 }
10224
10225 /* Implement INITIAL_ELIMINATION_OFFSET. FROM is either the frame pointer
10226 or argument pointer. TO is either the stack pointer or hard frame
10227 pointer. */
10228
10229 HOST_WIDE_INT
10230 mips_initial_elimination_offset (int from, int to)
10231 {
10232 HOST_WIDE_INT offset;
10233
10234 mips_compute_frame_info ();
10235
10236 /* Set OFFSET to the offset from the end-of-prologue stack pointer. */
10237 switch (from)
10238 {
10239 case FRAME_POINTER_REGNUM:
10240 if (FRAME_GROWS_DOWNWARD)
10241 offset = (cfun->machine->frame.args_size
10242 + cfun->machine->frame.cprestore_size
10243 + cfun->machine->frame.var_size);
10244 else
10245 offset = 0;
10246 break;
10247
10248 case ARG_POINTER_REGNUM:
10249 offset = cfun->machine->frame.arg_pointer_offset;
10250 break;
10251
10252 default:
10253 gcc_unreachable ();
10254 }
10255
10256 if (to == HARD_FRAME_POINTER_REGNUM)
10257 offset -= cfun->machine->frame.hard_frame_pointer_offset;
10258
10259 return offset;
10260 }
10261 \f
10262 /* Implement TARGET_EXTRA_LIVE_ON_ENTRY. */
10263
10264 static void
10265 mips_extra_live_on_entry (bitmap regs)
10266 {
10267 if (TARGET_USE_GOT)
10268 {
10269 /* PIC_FUNCTION_ADDR_REGNUM is live if we need it to set up
10270 the global pointer. */
10271 if (!TARGET_ABSOLUTE_ABICALLS)
10272 bitmap_set_bit (regs, PIC_FUNCTION_ADDR_REGNUM);
10273
10274 /* The prologue may set MIPS16_PIC_TEMP_REGNUM to the value of
10275 the global pointer. */
10276 if (TARGET_MIPS16)
10277 bitmap_set_bit (regs, MIPS16_PIC_TEMP_REGNUM);
10278
10279 /* See the comment above load_call<mode> for details. */
10280 bitmap_set_bit (regs, GOT_VERSION_REGNUM);
10281 }
10282 }
10283
10284 /* Implement RETURN_ADDR_RTX. We do not support moving back to a
10285 previous frame. */
10286
10287 rtx
10288 mips_return_addr (int count, rtx frame ATTRIBUTE_UNUSED)
10289 {
10290 if (count != 0)
10291 return const0_rtx;
10292
10293 return get_hard_reg_initial_val (Pmode, RETURN_ADDR_REGNUM);
10294 }
10295
10296 /* Emit code to change the current function's return address to
10297 ADDRESS. SCRATCH is available as a scratch register, if needed.
10298 ADDRESS and SCRATCH are both word-mode GPRs. */
10299
10300 void
10301 mips_set_return_address (rtx address, rtx scratch)
10302 {
10303 rtx slot_address;
10304
10305 gcc_assert (BITSET_P (cfun->machine->frame.mask, RETURN_ADDR_REGNUM));
10306 slot_address = mips_add_offset (scratch, stack_pointer_rtx,
10307 cfun->machine->frame.gp_sp_offset);
10308 mips_emit_move (gen_frame_mem (GET_MODE (address), slot_address), address);
10309 }
10310
10311 /* Return true if the current function has a cprestore slot. */
10312
10313 bool
10314 mips_cfun_has_cprestore_slot_p (void)
10315 {
10316 return (cfun->machine->global_pointer != INVALID_REGNUM
10317 && cfun->machine->frame.cprestore_size > 0);
10318 }
10319
10320 /* Fill *BASE and *OFFSET such that *BASE + *OFFSET refers to the
10321 cprestore slot. LOAD_P is true if the caller wants to load from
10322 the cprestore slot; it is false if the caller wants to store to
10323 the slot. */
10324
10325 static void
10326 mips_get_cprestore_base_and_offset (rtx *base, HOST_WIDE_INT *offset,
10327 bool load_p)
10328 {
10329 const struct mips_frame_info *frame;
10330
10331 frame = &cfun->machine->frame;
10332 /* .cprestore always uses the stack pointer instead of the frame pointer.
10333 We have a free choice for direct stores for non-MIPS16 functions,
10334 and for MIPS16 functions whose cprestore slot is in range of the
10335 stack pointer. Using the stack pointer would sometimes give more
10336 (early) scheduling freedom, but using the frame pointer would
10337 sometimes give more (late) scheduling freedom. It's hard to
10338 predict which applies to a given function, so let's keep things
10339 simple.
10340
10341 Loads must always use the frame pointer in functions that call
10342 alloca, and there's little benefit to using the stack pointer
10343 otherwise. */
10344 if (frame_pointer_needed && !(TARGET_CPRESTORE_DIRECTIVE && !load_p))
10345 {
10346 *base = hard_frame_pointer_rtx;
10347 *offset = frame->args_size - frame->hard_frame_pointer_offset;
10348 }
10349 else
10350 {
10351 *base = stack_pointer_rtx;
10352 *offset = frame->args_size;
10353 }
10354 }
10355
10356 /* Return true if X is the load or store address of the cprestore slot;
10357 LOAD_P says which. */
10358
10359 bool
10360 mips_cprestore_address_p (rtx x, bool load_p)
10361 {
10362 rtx given_base, required_base;
10363 HOST_WIDE_INT given_offset, required_offset;
10364
10365 mips_split_plus (x, &given_base, &given_offset);
10366 mips_get_cprestore_base_and_offset (&required_base, &required_offset, load_p);
10367 return given_base == required_base && given_offset == required_offset;
10368 }
10369
10370 /* Return a MEM rtx for the cprestore slot. LOAD_P is true if we are
10371 going to load from it, false if we are going to store to it.
10372 Use TEMP as a temporary register if need be. */
10373
10374 static rtx
10375 mips_cprestore_slot (rtx temp, bool load_p)
10376 {
10377 rtx base;
10378 HOST_WIDE_INT offset;
10379
10380 mips_get_cprestore_base_and_offset (&base, &offset, load_p);
10381 return gen_frame_mem (Pmode, mips_add_offset (temp, base, offset));
10382 }
10383
10384 /* Emit instructions to save global pointer value GP into cprestore
10385 slot MEM. OFFSET is the offset that MEM applies to the base register.
10386
10387 MEM may not be a legitimate address. If it isn't, TEMP is a
10388 temporary register that can be used, otherwise it is a SCRATCH. */
10389
10390 void
10391 mips_save_gp_to_cprestore_slot (rtx mem, rtx offset, rtx gp, rtx temp)
10392 {
10393 if (TARGET_CPRESTORE_DIRECTIVE)
10394 {
10395 gcc_assert (gp == pic_offset_table_rtx);
10396 emit_insn (PMODE_INSN (gen_cprestore, (mem, offset)));
10397 }
10398 else
10399 mips_emit_move (mips_cprestore_slot (temp, false), gp);
10400 }
10401
10402 /* Restore $gp from its save slot, using TEMP as a temporary base register
10403 if need be. This function is for o32 and o64 abicalls only.
10404
10405 See mips_must_initialize_gp_p for details about how we manage the
10406 global pointer. */
10407
10408 void
10409 mips_restore_gp_from_cprestore_slot (rtx temp)
10410 {
10411 gcc_assert (TARGET_ABICALLS && TARGET_OLDABI && epilogue_completed);
10412
10413 if (!cfun->machine->must_restore_gp_when_clobbered_p)
10414 {
10415 emit_note (NOTE_INSN_DELETED);
10416 return;
10417 }
10418
10419 if (TARGET_MIPS16)
10420 {
10421 mips_emit_move (temp, mips_cprestore_slot (temp, true));
10422 mips_emit_move (pic_offset_table_rtx, temp);
10423 }
10424 else
10425 mips_emit_move (pic_offset_table_rtx, mips_cprestore_slot (temp, true));
10426 if (!TARGET_EXPLICIT_RELOCS)
10427 emit_insn (gen_blockage ());
10428 }
10429 \f
10430 /* A function to save or store a register. The first argument is the
10431 register and the second is the stack slot. */
10432 typedef void (*mips_save_restore_fn) (rtx, rtx);
10433
10434 /* Use FN to save or restore register REGNO. MODE is the register's
10435 mode and OFFSET is the offset of its save slot from the current
10436 stack pointer. */
10437
10438 static void
10439 mips_save_restore_reg (enum machine_mode mode, int regno,
10440 HOST_WIDE_INT offset, mips_save_restore_fn fn)
10441 {
10442 rtx mem;
10443
10444 mem = gen_frame_mem (mode, plus_constant (Pmode, stack_pointer_rtx,
10445 offset));
10446 fn (gen_rtx_REG (mode, regno), mem);
10447 }
10448
10449 /* Call FN for each accumulator that is saved by the current function.
10450 SP_OFFSET is the offset of the current stack pointer from the start
10451 of the frame. */
10452
10453 static void
10454 mips_for_each_saved_acc (HOST_WIDE_INT sp_offset, mips_save_restore_fn fn)
10455 {
10456 HOST_WIDE_INT offset;
10457 int regno;
10458
10459 offset = cfun->machine->frame.acc_sp_offset - sp_offset;
10460 if (BITSET_P (cfun->machine->frame.acc_mask, 0))
10461 {
10462 mips_save_restore_reg (word_mode, LO_REGNUM, offset, fn);
10463 offset -= UNITS_PER_WORD;
10464 mips_save_restore_reg (word_mode, HI_REGNUM, offset, fn);
10465 offset -= UNITS_PER_WORD;
10466 }
10467
10468 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++)
10469 if (BITSET_P (cfun->machine->frame.acc_mask,
10470 ((regno - DSP_ACC_REG_FIRST) / 2) + 1))
10471 {
10472 mips_save_restore_reg (word_mode, regno, offset, fn);
10473 offset -= UNITS_PER_WORD;
10474 }
10475 }
10476
10477 /* Save register REG to MEM. Make the instruction frame-related. */
10478
10479 static void
10480 mips_save_reg (rtx reg, rtx mem)
10481 {
10482 if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64)
10483 {
10484 rtx x1, x2;
10485
10486 mips_emit_move_or_split (mem, reg, SPLIT_IF_NECESSARY);
10487
10488 x1 = mips_frame_set (mips_subword (mem, false),
10489 mips_subword (reg, false));
10490 x2 = mips_frame_set (mips_subword (mem, true),
10491 mips_subword (reg, true));
10492 mips_set_frame_expr (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, x1, x2)));
10493 }
10494 else
10495 mips_emit_save_slot_move (mem, reg, MIPS_PROLOGUE_TEMP (GET_MODE (reg)));
10496 }
10497
10498 /* Capture the register combinations that are allowed in a SWM or LWM
10499 instruction. The entries are ordered by the number of registers set
10500 in the mask. We ignore the single-register encodings because a
10501 normal SW/LW is preferred. */
10502
10503 static const unsigned int umips_swm_mask[17] = {
10504 0xc0ff0000, 0x80ff0000, 0x40ff0000, 0x807f0000,
10505 0x00ff0000, 0x803f0000, 0x007f0000, 0x801f0000,
10506 0x003f0000, 0x800f0000, 0x001f0000, 0x80070000,
10507 0x000f0000, 0x80030000, 0x00070000, 0x80010000,
10508 0x00030000
10509 };
10510
10511 static const unsigned int umips_swm_encoding[17] = {
10512 25, 24, 9, 23, 8, 22, 7, 21, 6, 20, 5, 19, 4, 18, 3, 17, 2
10513 };
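
/* Editor's note (illustrative, not part of the original source): each
   umips_swm_encoding value packs two fields that umips_build_save_restore
   below unpacks: the low nibble is the number of registers taken in
   sequence from $16-$23/$30 and bit 4 says whether $31 is included. For
   example, umips_swm_mask[0] == 0xc0ff0000 covers $16-$23 plus $30 and
   $31; the matching encoding 25 (0x19) decodes as 9 sequential registers
   plus $31, i.e. 10 save slots in total. Likewise umips_swm_mask[2] ==
   0x40ff0000 ($16-$23 plus $30, no ra) pairs with encoding 9 (0x09). */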
10514
10515 /* Try to use a microMIPS LWM or SWM instruction to save or restore
10516 as many GPRs in *MASK as possible. *OFFSET is the offset from the
10517 stack pointer of the topmost save slot.
10518
10519 Remove from *MASK all registers that were handled using LWM and SWM,
10520 update *OFFSET to the first unused save slot; return true on success. */
10521
10522 static bool
10523 umips_build_save_restore (mips_save_restore_fn fn,
10524 unsigned *mask, HOST_WIDE_INT *offset)
10525 {
10526 int nregs;
10527 unsigned int i, j;
10528 rtx pattern, set, reg, mem;
10529 HOST_WIDE_INT this_offset;
10530 rtx this_base;
10531
10532 /* Try matching $16 to $31 (s0 to ra). */
10533 for (i = 0; i < ARRAY_SIZE (umips_swm_mask); i++)
10534 if ((*mask & 0xffff0000) == umips_swm_mask[i])
10535 break;
10536
10537 if (i == ARRAY_SIZE (umips_swm_mask))
10538 return false;
10539
10540 /* Get the offset of the lowest save slot. */
10541 nregs = (umips_swm_encoding[i] & 0xf) + (umips_swm_encoding[i] >> 4);
10542 this_offset = *offset - UNITS_PER_WORD * (nregs - 1);
10543
10544 /* LWM/SWM can only support offsets from -2048 to 2047. */
10545 if (!UMIPS_12BIT_OFFSET_P (this_offset))
10546 return false;
10547
10548 /* Create the final PARALLEL. */
10549 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (nregs));
10550 this_base = stack_pointer_rtx;
10551
10552 /* For registers $16-$23 and $30. */
10553 for (j = 0; j < (umips_swm_encoding[i] & 0xf); j++)
10554 {
10555 HOST_WIDE_INT offset = this_offset + j * UNITS_PER_WORD;
10556 mem = gen_frame_mem (SImode, plus_constant (Pmode, this_base, offset));
10557 unsigned int regno = (j != 8) ? 16 + j : 30;
10558 *mask &= ~(1 << regno);
10559 reg = gen_rtx_REG (SImode, regno);
10560 if (fn == mips_save_reg)
10561 set = mips_frame_set (mem, reg);
10562 else
10563 {
10564 set = gen_rtx_SET (VOIDmode, reg, mem);
10565 mips_add_cfa_restore (reg);
10566 }
10567 XVECEXP (pattern, 0, j) = set;
10568 }
10569
10570 /* For register $31. */
10571 if (umips_swm_encoding[i] >> 4)
10572 {
10573 HOST_WIDE_INT offset = this_offset + j * UNITS_PER_WORD;
10574 *mask &= ~(1 << 31);
10575 mem = gen_frame_mem (SImode, plus_constant (Pmode, this_base, offset));
10576 reg = gen_rtx_REG (SImode, 31);
10577 if (fn == mips_save_reg)
10578 set = mips_frame_set (mem, reg);
10579 else
10580 {
10581 set = gen_rtx_SET (VOIDmode, reg, mem);
10582 mips_add_cfa_restore (reg);
10583 }
10584 XVECEXP (pattern, 0, j) = set;
10585 }
10586
10587 pattern = emit_insn (pattern);
10588 if (fn == mips_save_reg)
10589 RTX_FRAME_RELATED_P (pattern) = 1;
10590
10591 /* Update *OFFSET so that it points to the first unused save slot. */
10592 *offset -= UNITS_PER_WORD * nregs;
10593
10594 return true;
10595 }
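
/* Editor's note: a worked example of the function above (not in the
   original source), assuming a 32-bit target with UNITS_PER_WORD == 4.
   If *mask covers $16, $17 and $31, then (*mask & 0xffff0000) ==
   0x80030000 matches encoding 18 (0x12), so nregs == 2 + 1 == 3. With
   *offset == 24, this_offset becomes 24 - 4 * 2 == 16, giving save slots
   at 16 and 20 for $16 and $17 and at 24 for $31, and *offset is left
   at 24 - 12 == 12, the first unused slot. */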
10596
10597 /* Call FN for each register that is saved by the current function.
10598 SP_OFFSET is the offset of the current stack pointer from the start
10599 of the frame. */
10600
10601 static void
10602 mips_for_each_saved_gpr_and_fpr (HOST_WIDE_INT sp_offset,
10603 mips_save_restore_fn fn)
10604 {
10605 enum machine_mode fpr_mode;
10606 int regno;
10607 const struct mips_frame_info *frame = &cfun->machine->frame;
10608 HOST_WIDE_INT offset;
10609 unsigned int mask;
10610
10611 /* Save registers starting from high to low. The debuggers prefer that
10612 at least the return register be stored at func+4, and saving high to
10613 low also lets us avoid a nop in the epilogue if at least one register
10614 is reloaded in addition to the return address. */
10615 offset = frame->gp_sp_offset - sp_offset;
10616 mask = frame->mask;
10617
10618 if (TARGET_MICROMIPS)
10619 umips_build_save_restore (fn, &mask, &offset);
10620
10621 for (regno = GP_REG_LAST; regno >= GP_REG_FIRST; regno--)
10622 if (BITSET_P (mask, regno - GP_REG_FIRST))
10623 {
10624 /* Record the ra offset for use by mips_function_profiler. */
10625 if (regno == RETURN_ADDR_REGNUM)
10626 cfun->machine->frame.ra_fp_offset = offset + sp_offset;
10627 mips_save_restore_reg (word_mode, regno, offset, fn);
10628 offset -= UNITS_PER_WORD;
10629 }
10630
10631 /* This loop must iterate over the same space as its companion in
10632 mips_compute_frame_info. */
10633 offset = cfun->machine->frame.fp_sp_offset - sp_offset;
10634 fpr_mode = (TARGET_SINGLE_FLOAT ? SFmode : DFmode);
10635 for (regno = FP_REG_LAST - MAX_FPRS_PER_FMT + 1;
10636 regno >= FP_REG_FIRST;
10637 regno -= MAX_FPRS_PER_FMT)
10638 if (BITSET_P (cfun->machine->frame.fmask, regno - FP_REG_FIRST))
10639 {
10640 mips_save_restore_reg (fpr_mode, regno, offset, fn);
10641 offset -= GET_MODE_SIZE (fpr_mode);
10642 }
10643 }
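
/* Editor's note: an example of the ordering above (not in the original
   source). If frame->mask covers $16, $17 and $31 with gp_sp_offset == 28
   and sp_offset == 0 on a 32-bit target, and no microMIPS LWM/SWM was
   used, the descending regno loop stores $31 at offset 28 (recording
   ra_fp_offset == 28), $17 at 24 and $16 at 20, so the return address
   is saved first, in the highest slot. */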
10644
10645 /* Return true if a move between register REGNO and its save slot (MEM)
10646 can be done in a single move. LOAD_P is true if we are loading
10647 from the slot, false if we are storing to it. */
10648
10649 static bool
10650 mips_direct_save_slot_move_p (unsigned int regno, rtx mem, bool load_p)
10651 {
10652 /* There is a specific MIPS16 instruction for saving $31 to the stack. */
10653 if (TARGET_MIPS16 && !load_p && regno == RETURN_ADDR_REGNUM)
10654 return false;
10655
10656 return mips_secondary_reload_class (REGNO_REG_CLASS (regno),
10657 GET_MODE (mem), mem, load_p) == NO_REGS;
10658 }
10659
10660 /* Emit a move from SRC to DEST, given that one of them is a register
10661 save slot and that the other is a register. TEMP is a temporary
10662 GPR of the same mode that is available if need be. */
10663
10664 void
10665 mips_emit_save_slot_move (rtx dest, rtx src, rtx temp)
10666 {
10667 unsigned int regno;
10668 rtx mem;
10669
10670 if (REG_P (src))
10671 {
10672 regno = REGNO (src);
10673 mem = dest;
10674 }
10675 else
10676 {
10677 regno = REGNO (dest);
10678 mem = src;
10679 }
10680
10681 if (regno == cfun->machine->global_pointer && !mips_must_initialize_gp_p ())
10682 {
10683 /* We don't yet know whether we'll need this instruction or not.
10684 Postpone the decision by emitting a ghost move. This move
10685 is specifically not frame-related; only the split version is. */
10686 if (TARGET_64BIT)
10687 emit_insn (gen_move_gpdi (dest, src));
10688 else
10689 emit_insn (gen_move_gpsi (dest, src));
10690 return;
10691 }
10692
10693 if (regno == HI_REGNUM)
10694 {
10695 if (REG_P (dest))
10696 {
10697 mips_emit_move (temp, src);
10698 if (TARGET_64BIT)
10699 emit_insn (gen_mthisi_di (gen_rtx_REG (TImode, MD_REG_FIRST),
10700 temp, gen_rtx_REG (DImode, LO_REGNUM)));
10701 else
10702 emit_insn (gen_mthisi_di (gen_rtx_REG (DImode, MD_REG_FIRST),
10703 temp, gen_rtx_REG (SImode, LO_REGNUM)));
10704 }
10705 else
10706 {
10707 if (TARGET_64BIT)
10708 emit_insn (gen_mfhidi_ti (temp,
10709 gen_rtx_REG (TImode, MD_REG_FIRST)));
10710 else
10711 emit_insn (gen_mfhisi_di (temp,
10712 gen_rtx_REG (DImode, MD_REG_FIRST)));
10713 mips_emit_move (dest, temp);
10714 }
10715 }
10716 else if (mips_direct_save_slot_move_p (regno, mem, mem == src))
10717 mips_emit_move (dest, src);
10718 else
10719 {
10720 gcc_assert (!reg_overlap_mentioned_p (dest, temp));
10721 mips_emit_move (temp, src);
10722 mips_emit_move (dest, temp);
10723 }
10724 if (MEM_P (dest))
10725 mips_set_frame_expr (mips_frame_set (dest, src));
10726 }
10727 \f
10728 /* If we're generating n32 or n64 abicalls, and the current function
10729 does not use $28 as its global pointer, emit a cplocal directive.
10730 Use pic_offset_table_rtx as the argument to the directive. */
10731
10732 static void
10733 mips_output_cplocal (void)
10734 {
10735 if (!TARGET_EXPLICIT_RELOCS
10736 && mips_must_initialize_gp_p ()
10737 && cfun->machine->global_pointer != GLOBAL_POINTER_REGNUM)
10738 output_asm_insn (".cplocal %+", 0);
10739 }
10740
10741 /* Implement TARGET_OUTPUT_FUNCTION_PROLOGUE. */
10742
10743 static void
10744 mips_output_function_prologue (FILE *file, HOST_WIDE_INT size ATTRIBUTE_UNUSED)
10745 {
10746 const char *fnname;
10747
10748 /* In MIPS16 mode, we may need to generate a non-MIPS16 stub to handle
10749 floating-point arguments. */
10750 if (TARGET_MIPS16
10751 && TARGET_HARD_FLOAT_ABI
10752 && crtl->args.info.fp_code != 0)
10753 mips16_build_function_stub ();
10754
10755 /* Get the function name the same way that toplev.c does before calling
10756 assemble_start_function. This is needed so that the name used here
10757 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
10758 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
10759 mips_start_function_definition (fnname, TARGET_MIPS16);
10760
10761 /* Output MIPS-specific frame information. */
10762 if (!flag_inhibit_size_directive)
10763 {
10764 const struct mips_frame_info *frame;
10765
10766 frame = &cfun->machine->frame;
10767
10768 /* .frame FRAMEREG, FRAMESIZE, RETREG. */
10769 fprintf (file,
10770 "\t.frame\t%s," HOST_WIDE_INT_PRINT_DEC ",%s\t\t"
10771 "# vars= " HOST_WIDE_INT_PRINT_DEC
10772 ", regs= %d/%d"
10773 ", args= " HOST_WIDE_INT_PRINT_DEC
10774 ", gp= " HOST_WIDE_INT_PRINT_DEC "\n",
10775 reg_names[frame_pointer_needed
10776 ? HARD_FRAME_POINTER_REGNUM
10777 : STACK_POINTER_REGNUM],
10778 (frame_pointer_needed
10779 ? frame->total_size - frame->hard_frame_pointer_offset
10780 : frame->total_size),
10781 reg_names[RETURN_ADDR_REGNUM],
10782 frame->var_size,
10783 frame->num_gp, frame->num_fp,
10784 frame->args_size,
10785 frame->cprestore_size);
10786
10787 /* .mask MASK, OFFSET. */
10788 fprintf (file, "\t.mask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
10789 frame->mask, frame->gp_save_offset);
10790
10791 /* .fmask MASK, OFFSET. */
10792 fprintf (file, "\t.fmask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
10793 frame->fmask, frame->fp_save_offset);
10794 }
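
  /* Editor's note: as an illustration (the exact numbers depend on the
     frame), the fprintf calls above typically print something like:

	.frame	$sp,32,$31		# vars= 8, regs= 1/0, args= 16, gp= 0
	.mask	0x80000000,-4
	.fmask	0x00000000,0
  */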
10795
10796 /* Handle the initialization of $gp for SVR4 PIC, if applicable.
10797 Also emit the ".set noreorder; .set nomacro" sequence for functions
10798 that need it. */
10799 if (mips_must_initialize_gp_p ()
10800 && mips_current_loadgp_style () == LOADGP_OLDABI)
10801 {
10802 if (TARGET_MIPS16)
10803 {
10804 /* This is a fixed-form sequence. The position of the
10805 first two instructions is important because of the
10806 way _gp_disp is defined. */
10807 output_asm_insn ("li\t$2,%%hi(_gp_disp)", 0);
10808 output_asm_insn ("addiu\t$3,$pc,%%lo(_gp_disp)", 0);
10809 output_asm_insn ("sll\t$2,16", 0);
10810 output_asm_insn ("addu\t$2,$3", 0);
10811 }
10812 else
10813 {
10814 /* .cpload must be in a .set noreorder but not a
10815 .set nomacro block. */
10816 mips_push_asm_switch (&mips_noreorder);
10817 output_asm_insn (".cpload\t%^", 0);
10818 if (!cfun->machine->all_noreorder_p)
10819 mips_pop_asm_switch (&mips_noreorder);
10820 else
10821 mips_push_asm_switch (&mips_nomacro);
10822 }
10823 }
10824 else if (cfun->machine->all_noreorder_p)
10825 {
10826 mips_push_asm_switch (&mips_noreorder);
10827 mips_push_asm_switch (&mips_nomacro);
10828 }
10829
10830 /* Tell the assembler which register we're using as the global
10831 pointer. This is needed for thunks, since they can use either
10832 explicit relocs or assembler macros. */
10833 mips_output_cplocal ();
10834 }
10835
10836 /* Implement TARGET_OUTPUT_FUNCTION_EPILOGUE. */
10837
10838 static void
10839 mips_output_function_epilogue (FILE *file ATTRIBUTE_UNUSED,
10840 HOST_WIDE_INT size ATTRIBUTE_UNUSED)
10841 {
10842 const char *fnname;
10843
10844 /* Reinstate the normal $gp. */
10845 SET_REGNO (pic_offset_table_rtx, GLOBAL_POINTER_REGNUM);
10846 mips_output_cplocal ();
10847
10848 if (cfun->machine->all_noreorder_p)
10849 {
10850 mips_pop_asm_switch (&mips_nomacro);
10851 mips_pop_asm_switch (&mips_noreorder);
10852 }
10853
10854 /* Get the function name the same way that toplev.c does before calling
10855 assemble_start_function. This is needed so that the name used here
10856 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
10857 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
10858 mips_end_function_definition (fnname);
10859 }
10860 \f
10861 /* Emit an optimisation barrier for accesses to the current frame. */
10862
10863 static void
10864 mips_frame_barrier (void)
10865 {
10866 emit_clobber (gen_frame_mem (BLKmode, stack_pointer_rtx));
10867 }
10868
10869
10870 /* The __gnu_local_gp symbol. */
10871
10872 static GTY(()) rtx mips_gnu_local_gp;
10873
10874 /* If we're generating n32 or n64 abicalls, emit instructions
10875 to set up the global pointer. */
10876
10877 static void
10878 mips_emit_loadgp (void)
10879 {
10880 rtx addr, offset, incoming_address, base, index, pic_reg;
10881
10882 pic_reg = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx;
10883 switch (mips_current_loadgp_style ())
10884 {
10885 case LOADGP_ABSOLUTE:
10886 if (mips_gnu_local_gp == NULL)
10887 {
10888 mips_gnu_local_gp = gen_rtx_SYMBOL_REF (Pmode, "__gnu_local_gp");
10889 SYMBOL_REF_FLAGS (mips_gnu_local_gp) |= SYMBOL_FLAG_LOCAL;
10890 }
10891 emit_insn (PMODE_INSN (gen_loadgp_absolute,
10892 (pic_reg, mips_gnu_local_gp)));
10893 break;
10894
10895 case LOADGP_OLDABI:
10896 /* Added by mips_output_function_prologue. */
10897 break;
10898
10899 case LOADGP_NEWABI:
10900 addr = XEXP (DECL_RTL (current_function_decl), 0);
10901 offset = mips_unspec_address (addr, SYMBOL_GOTOFF_LOADGP);
10902 incoming_address = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
10903 emit_insn (PMODE_INSN (gen_loadgp_newabi,
10904 (pic_reg, offset, incoming_address)));
10905 break;
10906
10907 case LOADGP_RTP:
10908 base = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_BASE));
10909 index = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_INDEX));
10910 emit_insn (PMODE_INSN (gen_loadgp_rtp, (pic_reg, base, index)));
10911 break;
10912
10913 default:
10914 return;
10915 }
10916
10917 if (TARGET_MIPS16)
10918 emit_insn (PMODE_INSN (gen_copygp_mips16,
10919 (pic_offset_table_rtx, pic_reg)));
10920
10921 /* Emit a blockage if there are implicit uses of the GP register.
10922 This includes profiled functions, because FUNCTION_PROFILER uses
10923 a jal macro. */
10924 if (!TARGET_EXPLICIT_RELOCS || crtl->profile)
10925 emit_insn (gen_loadgp_blockage ());
10926 }
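
/* Editor's note: a sketch of the LOADGP_NEWABI case, not part of the
   original source. For an n64 abicalls function "foo" (a hypothetical
   name), the loadgp_newabi pattern conventionally expands to the
   familiar three-instruction prologue (exact relocation syntax comes
   from mips.md):

	lui	$gp,%hi(%neg(%gp_rel(foo)))
	daddu	$gp,$gp,$25
	daddiu	$gp,$gp,%lo(%neg(%gp_rel(foo)))

   where $25 is PIC_FUNCTION_ADDR_REGNUM, the register that holds the
   incoming function address. */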
10927
10928 #define PROBE_INTERVAL (1 << STACK_CHECK_PROBE_INTERVAL_EXP)
10929
10930 #if PROBE_INTERVAL > 32768
10931 #error Cannot use indexed addressing mode for stack probing
10932 #endif
10933
10934 /* Emit code to probe a range of stack addresses from FIRST to FIRST+SIZE,
10935 inclusive. These are offsets from the current stack pointer. */
10936
10937 static void
10938 mips_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size)
10939 {
10940 if (TARGET_MIPS16)
10941 sorry ("-fstack-check=specific not implemented for MIPS16");
10942
10943 /* See if we have a constant small number of probes to generate. If so,
10944 that's the easy case. */
10945 if (first + size <= 32768)
10946 {
10947 HOST_WIDE_INT i;
10948
10949 /* Probe at FIRST + N * PROBE_INTERVAL for values of N from 1 until
10950 it exceeds SIZE. If only one probe is needed, this will not
10951 generate any code. Then probe at FIRST + SIZE. */
10952 for (i = PROBE_INTERVAL; i < size; i += PROBE_INTERVAL)
10953 emit_stack_probe (plus_constant (Pmode, stack_pointer_rtx,
10954 -(first + i)));
10955
10956 emit_stack_probe (plus_constant (Pmode, stack_pointer_rtx,
10957 -(first + size)));
10958 }
10959
10960 /* Otherwise, do the same as above, but in a loop. Note that we must be
10961 extra careful with variables wrapping around because we might be at
10962 the very top (or the very bottom) of the address space and we have
10963 to be able to handle this case properly; in particular, we use an
10964 equality test for the loop condition. */
10965 else
10966 {
10967 HOST_WIDE_INT rounded_size;
10968 rtx r3 = MIPS_PROLOGUE_TEMP (Pmode);
10969 rtx r12 = MIPS_PROLOGUE_TEMP2 (Pmode);
10970
10971 /* Sanity check for the addressing mode we're going to use. */
10972 gcc_assert (first <= 32768);
10973
10974
10975 /* Step 1: round SIZE to the previous multiple of the interval. */
10976
10977 rounded_size = size & -PROBE_INTERVAL;
10978
10979
10980 /* Step 2: compute initial and final value of the loop counter. */
10981
10982 /* TEST_ADDR = SP + FIRST. */
10983 emit_insn (gen_rtx_SET (VOIDmode, r3,
10984 plus_constant (Pmode, stack_pointer_rtx,
10985 -first)));
10986
10987 /* LAST_ADDR = SP + FIRST + ROUNDED_SIZE. */
10988 if (rounded_size > 32768)
10989 {
10990 emit_move_insn (r12, GEN_INT (rounded_size));
10991 emit_insn (gen_rtx_SET (VOIDmode, r12,
10992 gen_rtx_MINUS (Pmode, r3, r12)));
10993 }
10994 else
10995 emit_insn (gen_rtx_SET (VOIDmode, r12,
10996 plus_constant (Pmode, r3, -rounded_size)));
10997
10998
10999 /* Step 3: the loop
11000
11001 while (TEST_ADDR != LAST_ADDR)
11002 {
11003 TEST_ADDR = TEST_ADDR + PROBE_INTERVAL
11004 probe at TEST_ADDR
11005 }
11006
11007 probes at FIRST + N * PROBE_INTERVAL for values of N from 1
11008 until it is equal to ROUNDED_SIZE. */
11009
11010 emit_insn (PMODE_INSN (gen_probe_stack_range, (r3, r3, r12)));
11011
11012
11013 /* Step 4: probe at FIRST + SIZE if we cannot assert at compile-time
11014 that SIZE is equal to ROUNDED_SIZE. */
11015
11016 if (size != rounded_size)
11017 emit_stack_probe (plus_constant (Pmode, r12, rounded_size - size));
11018 }
11019
11020 /* Make sure nothing is scheduled before we are done. */
11021 emit_insn (gen_blockage ());
11022 }
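
/* Editor's note: a worked example (not in the original source), assuming
   PROBE_INTERVAL is 0x1000. For first == 0x4000 and size == 0x3000 we
   take the small case (first + size <= 32768): the loop probes
   sp - 0x5000 and sp - 0x6000, and the final emit_stack_probe hits
   sp - 0x7000. For size == 0x20000 the loop case applies instead:
   rounded_size == size, so the probe_stack_range loop covers every
   interval and no tail probe is needed. */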
11023
11024 /* Probe a range of stack addresses from REG1 to REG2 inclusive. These are
11025 absolute addresses. */
11026
11027 const char *
11028 mips_output_probe_stack_range (rtx reg1, rtx reg2)
11029 {
11030 static int labelno = 0;
11031 char loop_lab[32], end_lab[32], tmp[64];
11032 rtx xops[2];
11033
11034 ASM_GENERATE_INTERNAL_LABEL (loop_lab, "LPSRL", labelno);
11035 ASM_GENERATE_INTERNAL_LABEL (end_lab, "LPSRE", labelno++);
11036
11037 ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, loop_lab);
11038
11039 /* Jump to END_LAB if TEST_ADDR == LAST_ADDR. */
11040 xops[0] = reg1;
11041 xops[1] = reg2;
11042 strcpy (tmp, "%(%<beq\t%0,%1,");
11043 output_asm_insn (strcat (tmp, &end_lab[1]), xops);
11044
11045 /* TEST_ADDR = TEST_ADDR + PROBE_INTERVAL. */
11046 xops[1] = GEN_INT (-PROBE_INTERVAL);
11047 if (TARGET_64BIT && TARGET_LONG64)
11048 output_asm_insn ("daddiu\t%0,%0,%1", xops);
11049 else
11050 output_asm_insn ("addiu\t%0,%0,%1", xops);
11051
11052 /* Probe at TEST_ADDR and branch. */
11053 fprintf (asm_out_file, "\tb\t");
11054 assemble_name_raw (asm_out_file, loop_lab);
11055 fputc ('\n', asm_out_file);
11056 if (TARGET_64BIT)
11057 output_asm_insn ("sd\t$0,0(%0)%)", xops);
11058 else
11059 output_asm_insn ("sw\t$0,0(%0)%)", xops);
11060
11061 ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, end_lab);
11062
11063 return "";
11064 }
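
/* Editor's note: a sketch of the sequence emitted above, not part of the
   original source; it assumes PROBE_INTERVAL == 0x1000, 32-bit registers
   and hypothetical temporaries $2 and $12 (label spelling is
   target-dependent):

   LPSRL0:
	beq	$2,$12,LPSRE0
	addiu	$2,$2,-4096	# fills the beq delay slot
	b	LPSRL0
	sw	$0,0($2)	# the probe; fills the b delay slot
   LPSRE0:
*/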
11065
11066 /* A for_each_rtx callback. Stop the search if *X is a kernel register. */
11067
11068 static int
11069 mips_kernel_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
11070 {
11071 return REG_P (*x) && KERNEL_REG_P (REGNO (*x));
11072 }
11073
11074 /* Expand the "prologue" pattern. */
11075
11076 void
11077 mips_expand_prologue (void)
11078 {
11079 const struct mips_frame_info *frame;
11080 HOST_WIDE_INT size;
11081 unsigned int nargs;
11082 rtx insn;
11083
11084 if (cfun->machine->global_pointer != INVALID_REGNUM)
11085 {
11086 /* Check whether an insn uses pic_offset_table_rtx, either explicitly
11087 or implicitly. If so, we can commit to using a global pointer
11088 straight away, otherwise we need to defer the decision. */
11089 if (mips_cfun_has_inflexible_gp_ref_p ()
11090 || mips_cfun_has_flexible_gp_ref_p ())
11091 {
11092 cfun->machine->must_initialize_gp_p = true;
11093 cfun->machine->must_restore_gp_when_clobbered_p = true;
11094 }
11095
11096 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
11097 }
11098
11099 frame = &cfun->machine->frame;
11100 size = frame->total_size;
11101
11102 if (flag_stack_usage_info)
11103 current_function_static_stack_size = size;
11104
11105 if (flag_stack_check == STATIC_BUILTIN_STACK_CHECK)
11106 {
11107 if (crtl->is_leaf && !cfun->calls_alloca)
11108 {
11109 if (size > PROBE_INTERVAL && size > STACK_CHECK_PROTECT)
11110 mips_emit_probe_stack_range (STACK_CHECK_PROTECT,
11111 size - STACK_CHECK_PROTECT);
11112 }
11113 else if (size > 0)
11114 mips_emit_probe_stack_range (STACK_CHECK_PROTECT, size);
11115 }
11116
11117 /* Save the registers. Allocate up to MIPS_MAX_FIRST_STACK_STEP
11118 bytes beforehand; this is enough to cover the register save area
11119 without going out of range. */
11120 if (((frame->mask | frame->fmask | frame->acc_mask) != 0)
11121 || frame->num_cop0_regs > 0)
11122 {
11123 HOST_WIDE_INT step1;
11124
11125 step1 = MIN (size, MIPS_MAX_FIRST_STACK_STEP);
11126 if (GENERATE_MIPS16E_SAVE_RESTORE)
11127 {
11128 HOST_WIDE_INT offset;
11129 unsigned int mask, regno;
11130
11131 /* Try to merge argument stores into the save instruction. */
11132 nargs = mips16e_collect_argument_saves ();
11133
11134 /* Build the save instruction. */
11135 mask = frame->mask;
11136 insn = mips16e_build_save_restore (false, &mask, &offset,
11137 nargs, step1);
11138 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11139 mips_frame_barrier ();
11140 size -= step1;
11141
11142 /* Check if we need to save other registers. */
11143 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
11144 if (BITSET_P (mask, regno - GP_REG_FIRST))
11145 {
11146 offset -= UNITS_PER_WORD;
11147 mips_save_restore_reg (word_mode, regno,
11148 offset, mips_save_reg);
11149 }
11150 }
11151 else
11152 {
11153 if (cfun->machine->interrupt_handler_p)
11154 {
11155 HOST_WIDE_INT offset;
11156 rtx mem;
11157
11158 /* If this interrupt is using a shadow register set, we need to
11159 get the stack pointer from the previous register set. */
11160 if (cfun->machine->use_shadow_register_set_p)
11161 emit_insn (gen_mips_rdpgpr (stack_pointer_rtx,
11162 stack_pointer_rtx));
11163
11164 if (!cfun->machine->keep_interrupts_masked_p)
11165 {
11166 /* Move from COP0 Cause to K0. */
11167 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K0_REG_NUM),
11168 gen_rtx_REG (SImode,
11169 COP0_CAUSE_REG_NUM)));
11170 /* Move from COP0 EPC to K1. */
11171 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
11172 gen_rtx_REG (SImode,
11173 COP0_EPC_REG_NUM)));
11174 }
11175
11176 /* Allocate the first part of the frame. */
11177 insn = gen_add3_insn (stack_pointer_rtx, stack_pointer_rtx,
11178 GEN_INT (-step1));
11179 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11180 mips_frame_barrier ();
11181 size -= step1;
11182
11183 /* Start at the uppermost location for saving. */
11184 offset = frame->cop0_sp_offset - size;
11185 if (!cfun->machine->keep_interrupts_masked_p)
11186 {
11187 /* Push EPC into its stack slot. */
11188 mem = gen_frame_mem (word_mode,
11189 plus_constant (Pmode, stack_pointer_rtx,
11190 offset));
11191 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
11192 offset -= UNITS_PER_WORD;
11193 }
11194
11195 /* Move from COP0 Status to K1. */
11196 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
11197 gen_rtx_REG (SImode,
11198 COP0_STATUS_REG_NUM)));
11199
11200 /* Right justify the RIPL in k0. */
11201 if (!cfun->machine->keep_interrupts_masked_p)
11202 emit_insn (gen_lshrsi3 (gen_rtx_REG (SImode, K0_REG_NUM),
11203 gen_rtx_REG (SImode, K0_REG_NUM),
11204 GEN_INT (CAUSE_IPL)));
11205
11206 /* Push Status into its stack slot. */
11207 mem = gen_frame_mem (word_mode,
11208 plus_constant (Pmode, stack_pointer_rtx,
11209 offset));
11210 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
11211 offset -= UNITS_PER_WORD;
11212
11213 /* Insert the RIPL into our copy of SR (k1) as the new IPL. */
11214 if (!cfun->machine->keep_interrupts_masked_p)
11215 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11216 GEN_INT (6),
11217 GEN_INT (SR_IPL),
11218 gen_rtx_REG (SImode, K0_REG_NUM)));
11219
11220 if (!cfun->machine->keep_interrupts_masked_p)
11221 /* Enable interrupts by clearing the KSU, ERL, and EXL bits.
11222 IE is already the correct value, so we don't have to do
11223 anything explicit. */
11224 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11225 GEN_INT (4),
11226 GEN_INT (SR_EXL),
11227 gen_rtx_REG (SImode, GP_REG_FIRST)));
11228 else
11229 /* Disable interrupts by clearing the KSU, ERL, EXL,
11230 and IE bits. */
11231 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11232 GEN_INT (5),
11233 GEN_INT (SR_IE),
11234 gen_rtx_REG (SImode, GP_REG_FIRST)));
11235 }
11236 else
11237 {
11238 insn = gen_add3_insn (stack_pointer_rtx,
11239 stack_pointer_rtx,
11240 GEN_INT (-step1));
11241 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11242 mips_frame_barrier ();
11243 size -= step1;
11244 }
11245 mips_for_each_saved_acc (size, mips_save_reg);
11246 mips_for_each_saved_gpr_and_fpr (size, mips_save_reg);
11247 }
11248 }
11249
11250 /* Allocate the rest of the frame. */
11251 if (size > 0)
11252 {
11253 if (SMALL_OPERAND (-size))
11254 RTX_FRAME_RELATED_P (emit_insn (gen_add3_insn (stack_pointer_rtx,
11255 stack_pointer_rtx,
11256 GEN_INT (-size)))) = 1;
11257 else
11258 {
11259 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (size));
11260 if (TARGET_MIPS16)
11261 {
11262 /* There are no instructions to add or subtract registers
11263 from the stack pointer, so use the frame pointer as a
11264 temporary. We should always be using a frame pointer
11265 in this case anyway. */
11266 gcc_assert (frame_pointer_needed);
11267 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11268 emit_insn (gen_sub3_insn (hard_frame_pointer_rtx,
11269 hard_frame_pointer_rtx,
11270 MIPS_PROLOGUE_TEMP (Pmode)));
11271 mips_emit_move (stack_pointer_rtx, hard_frame_pointer_rtx);
11272 }
11273 else
11274 emit_insn (gen_sub3_insn (stack_pointer_rtx,
11275 stack_pointer_rtx,
11276 MIPS_PROLOGUE_TEMP (Pmode)));
11277
11278 /* Describe the combined effect of the previous instructions. */
11279 mips_set_frame_expr
11280 (gen_rtx_SET (VOIDmode, stack_pointer_rtx,
11281 plus_constant (Pmode, stack_pointer_rtx, -size)));
11282 }
11283 mips_frame_barrier ();
11284 }
11285
11286 /* Set up the frame pointer, if we're using one. */
11287 if (frame_pointer_needed)
11288 {
11289 HOST_WIDE_INT offset;
11290
11291 offset = frame->hard_frame_pointer_offset;
11292 if (offset == 0)
11293 {
11294 insn = mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11295 RTX_FRAME_RELATED_P (insn) = 1;
11296 }
11297 else if (SMALL_OPERAND (offset))
11298 {
11299 insn = gen_add3_insn (hard_frame_pointer_rtx,
11300 stack_pointer_rtx, GEN_INT (offset));
11301 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11302 }
11303 else
11304 {
11305 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (offset));
11306 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11307 emit_insn (gen_add3_insn (hard_frame_pointer_rtx,
11308 hard_frame_pointer_rtx,
11309 MIPS_PROLOGUE_TEMP (Pmode)));
11310 mips_set_frame_expr
11311 (gen_rtx_SET (VOIDmode, hard_frame_pointer_rtx,
11312 plus_constant (Pmode, stack_pointer_rtx, offset)));
11313 }
11314 }
11315
11316 mips_emit_loadgp ();
11317
11318 /* Initialize the $gp save slot. */
11319 if (mips_cfun_has_cprestore_slot_p ())
11320 {
11321 rtx base, mem, gp, temp;
11322 HOST_WIDE_INT offset;
11323
11324 mips_get_cprestore_base_and_offset (&base, &offset, false);
11325 mem = gen_frame_mem (Pmode, plus_constant (Pmode, base, offset));
11326 gp = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx;
11327 temp = (SMALL_OPERAND (offset)
11328 ? gen_rtx_SCRATCH (Pmode)
11329 : MIPS_PROLOGUE_TEMP (Pmode));
11330 emit_insn (PMODE_INSN (gen_potential_cprestore,
11331 (mem, GEN_INT (offset), gp, temp)));
11332
11333 mips_get_cprestore_base_and_offset (&base, &offset, true);
11334 mem = gen_frame_mem (Pmode, plus_constant (Pmode, base, offset));
11335 emit_insn (PMODE_INSN (gen_use_cprestore, (mem)));
11336 }
11337
11338 /* We need to search back to the last use of K0 or K1. */
11339 if (cfun->machine->interrupt_handler_p)
11340 {
11341 for (insn = get_last_insn (); insn != NULL_RTX; insn = PREV_INSN (insn))
11342 if (INSN_P (insn)
11343 && for_each_rtx (&PATTERN (insn), mips_kernel_reg_p, NULL))
11344 break;
11345 /* Emit a move from K1 to COP0 Status after insn. */
11346 gcc_assert (insn != NULL_RTX);
11347 emit_insn_after (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
11348 gen_rtx_REG (SImode, K1_REG_NUM)),
11349 insn);
11350 }
11351
11352 /* If we are profiling, make sure no instructions are scheduled before
11353 the call to mcount. */
11354 if (crtl->profile)
11355 emit_insn (gen_blockage ());
11356 }
11357 \f
11358 /* Attach all pending register saves to the previous instruction.
11359 Return that instruction. */
11360
11361 static rtx_insn *
11362 mips_epilogue_emit_cfa_restores (void)
11363 {
11364 rtx_insn *insn;
11365
11366 insn = get_last_insn ();
11367 gcc_assert (insn && !REG_NOTES (insn));
11368 if (mips_epilogue.cfa_restores)
11369 {
11370 RTX_FRAME_RELATED_P (insn) = 1;
11371 REG_NOTES (insn) = mips_epilogue.cfa_restores;
11372 mips_epilogue.cfa_restores = 0;
11373 }
11374 return insn;
11375 }
11376
11377 /* Like mips_epilogue_emit_cfa_restores, but also record that the CFA is
11378 now at REG + OFFSET. */
11379
11380 static void
11381 mips_epilogue_set_cfa (rtx reg, HOST_WIDE_INT offset)
11382 {
11383 rtx_insn *insn;
11384
11385 insn = mips_epilogue_emit_cfa_restores ();
11386 if (reg != mips_epilogue.cfa_reg || offset != mips_epilogue.cfa_offset)
11387 {
11388 RTX_FRAME_RELATED_P (insn) = 1;
11389 REG_NOTES (insn) = alloc_reg_note (REG_CFA_DEF_CFA,
11390 plus_constant (Pmode, reg, offset),
11391 REG_NOTES (insn));
11392 mips_epilogue.cfa_reg = reg;
11393 mips_epilogue.cfa_offset = offset;
11394 }
11395 }
11396
11397 /* Emit instructions to restore register REG from slot MEM. Also update
11398 the cfa_restores list. */
11399
11400 static void
11401 mips_restore_reg (rtx reg, rtx mem)
11402 {
11403 /* There's no MIPS16 instruction to load $31 directly. Load into
11404 $7 instead and adjust the return insn appropriately. */
11405 if (TARGET_MIPS16 && REGNO (reg) == RETURN_ADDR_REGNUM)
11406 reg = gen_rtx_REG (GET_MODE (reg), GP_REG_FIRST + 7);
11407 else if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64)
11408 {
11409 mips_add_cfa_restore (mips_subword (reg, true));
11410 mips_add_cfa_restore (mips_subword (reg, false));
11411 }
11412 else
11413 mips_add_cfa_restore (reg);
11414
11415 mips_emit_save_slot_move (reg, mem, MIPS_EPILOGUE_TEMP (GET_MODE (reg)));
11416 if (REGNO (reg) == REGNO (mips_epilogue.cfa_reg))
11417 /* The CFA is currently defined in terms of the register whose
11418 value we have just restored. Redefine the CFA in terms of
11419 the stack pointer. */
11420 mips_epilogue_set_cfa (stack_pointer_rtx,
11421 mips_epilogue.cfa_restore_sp_offset);
11422 }
11423
11424 /* Emit code to set the stack pointer to BASE + OFFSET, given that
11425 BASE + OFFSET is NEW_FRAME_SIZE bytes below the top of the frame.
11426 BASE, if not the stack pointer, is available as a temporary. */
11427
11428 static void
11429 mips_deallocate_stack (rtx base, rtx offset, HOST_WIDE_INT new_frame_size)
11430 {
11431 if (base == stack_pointer_rtx && offset == const0_rtx)
11432 return;
11433
11434 mips_frame_barrier ();
11435 if (offset == const0_rtx)
11436 {
11437 emit_move_insn (stack_pointer_rtx, base);
11438 mips_epilogue_set_cfa (stack_pointer_rtx, new_frame_size);
11439 }
11440 else if (TARGET_MIPS16 && base != stack_pointer_rtx)
11441 {
11442 emit_insn (gen_add3_insn (base, base, offset));
11443 mips_epilogue_set_cfa (base, new_frame_size);
11444 emit_move_insn (stack_pointer_rtx, base);
11445 }
11446 else
11447 {
11448 emit_insn (gen_add3_insn (stack_pointer_rtx, base, offset));
11449 mips_epilogue_set_cfa (stack_pointer_rtx, new_frame_size);
11450 }
11451 }
11452
11453 /* Emit any instructions needed before a return. */
11454
11455 void
11456 mips_expand_before_return (void)
11457 {
11458 /* When using a call-clobbered gp, we start out with unified call
11459 insns that include instructions to restore the gp. We then split
11460 these unified calls after reload. These split calls explicitly
11461 clobber gp, so there is no need to define
11462 PIC_OFFSET_TABLE_REG_CALL_CLOBBERED.
11463
11464 For consistency, we should also insert an explicit clobber of $28
11465 before return insns, so that the post-reload optimizers know that
11466 the register is not live on exit. */
11467 if (TARGET_CALL_CLOBBERED_GP)
11468 emit_clobber (pic_offset_table_rtx);
11469 }
11470
11471 /* Expand an "epilogue" or "sibcall_epilogue" pattern; SIBCALL_P
11472 says which. */
11473
11474 void
11475 mips_expand_epilogue (bool sibcall_p)
11476 {
11477 const struct mips_frame_info *frame;
11478 HOST_WIDE_INT step1, step2;
11479 rtx base, adjust;
11480 rtx_insn *insn;
11481 bool use_jraddiusp_p = false;
11482
11483 if (!sibcall_p && mips_can_use_return_insn ())
11484 {
11485 emit_jump_insn (gen_return ());
11486 return;
11487 }
11488
11489 /* In MIPS16 mode, if the return value should go into a floating-point
11490 register, we need to call a helper routine to copy it over. */
11491 if (mips16_cfun_returns_in_fpr_p ())
11492 mips16_copy_fpr_return_value ();
11493
11494 /* Split the frame into two. STEP1 is the amount of stack we should
11495 deallocate before restoring the registers. STEP2 is the amount we
11496 should deallocate afterwards.
11497
11498 Start off by assuming that no registers need to be restored. */
11499 frame = &cfun->machine->frame;
11500 step1 = frame->total_size;
11501 step2 = 0;
11502
11503 /* Work out which register holds the frame address. */
11504 if (!frame_pointer_needed)
11505 base = stack_pointer_rtx;
11506 else
11507 {
11508 base = hard_frame_pointer_rtx;
11509 step1 -= frame->hard_frame_pointer_offset;
11510 }
11511 mips_epilogue.cfa_reg = base;
11512 mips_epilogue.cfa_offset = step1;
11513 mips_epilogue.cfa_restores = NULL_RTX;
11514
11515 /* If we need to restore registers, deallocate as much stack as
11516 possible in the second step without going out of range. */
11517 if ((frame->mask | frame->fmask | frame->acc_mask) != 0
11518 || frame->num_cop0_regs > 0)
11519 {
11520 step2 = MIN (step1, MIPS_MAX_FIRST_STACK_STEP);
11521 step1 -= step2;
11522 }
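
  /* Editor's note: a worked example, not in the original source. With
     total_size == 0x9000, no frame pointer and saved registers, step2
     becomes MIN (0x9000, MIPS_MAX_FIRST_STACK_STEP) == 0x7ff0 in normal
     mode, leaving step1 == 0x1010: the stack pointer first rises by
     0x1010, the registers are restored within the remaining 0x7ff0
     bytes, and the final deallocation removes those 0x7ff0 bytes. */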
11523
11524 /* Get an rtx for STEP1 that we can add to BASE. */
11525 adjust = GEN_INT (step1);
11526 if (!SMALL_OPERAND (step1))
11527 {
11528 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), adjust);
11529 adjust = MIPS_EPILOGUE_TEMP (Pmode);
11530 }
11531 mips_deallocate_stack (base, adjust, step2);
11532
11533 /* If we're using addressing macros, $gp is implicitly used by all
11534 SYMBOL_REFs. We must emit a blockage insn before restoring $gp
11535 from the stack. */
11536 if (TARGET_CALL_SAVED_GP && !TARGET_EXPLICIT_RELOCS)
11537 emit_insn (gen_blockage ());
11538
11539 mips_epilogue.cfa_restore_sp_offset = step2;
11540 if (GENERATE_MIPS16E_SAVE_RESTORE && frame->mask != 0)
11541 {
11542 unsigned int regno, mask;
11543 HOST_WIDE_INT offset;
11544 rtx restore;
11545
11546 /* Generate the restore instruction. */
11547 mask = frame->mask;
11548 restore = mips16e_build_save_restore (true, &mask, &offset, 0, step2);
11549
11550 /* Restore any other registers manually. */
11551 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
11552 if (BITSET_P (mask, regno - GP_REG_FIRST))
11553 {
11554 offset -= UNITS_PER_WORD;
11555 mips_save_restore_reg (word_mode, regno, offset, mips_restore_reg);
11556 }
11557
11558 /* Restore the remaining registers and deallocate the final bit
11559 of the frame. */
11560 mips_frame_barrier ();
11561 emit_insn (restore);
11562 mips_epilogue_set_cfa (stack_pointer_rtx, 0);
11563 }
11564 else
11565 {
11566 /* Restore the registers. */
11567 mips_for_each_saved_acc (frame->total_size - step2, mips_restore_reg);
11568 mips_for_each_saved_gpr_and_fpr (frame->total_size - step2,
11569 mips_restore_reg);
11570
11571 if (cfun->machine->interrupt_handler_p)
11572 {
11573 HOST_WIDE_INT offset;
11574 rtx mem;
11575
11576 offset = frame->cop0_sp_offset - (frame->total_size - step2);
11577 if (!cfun->machine->keep_interrupts_masked_p)
11578 {
11579 /* Restore the original EPC. */
11580 mem = gen_frame_mem (word_mode,
11581 plus_constant (Pmode, stack_pointer_rtx,
11582 offset));
11583 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
11584 offset -= UNITS_PER_WORD;
11585
11586 /* Move to COP0 EPC. */
11587 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_EPC_REG_NUM),
11588 gen_rtx_REG (SImode, K0_REG_NUM)));
11589 }
11590
11591 /* Restore the original Status. */
11592 mem = gen_frame_mem (word_mode,
11593 plus_constant (Pmode, stack_pointer_rtx,
11594 offset));
11595 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
11596 offset -= UNITS_PER_WORD;
11597
11598 /* If we don't use a shadow register set, we need to update SP. */
11599 if (!cfun->machine->use_shadow_register_set_p)
11600 mips_deallocate_stack (stack_pointer_rtx, GEN_INT (step2), 0);
11601 else
11602 /* The choice of position is somewhat arbitrary in this case. */
11603 mips_epilogue_emit_cfa_restores ();
11604
11605 /* Move to COP0 Status. */
11606 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
11607 gen_rtx_REG (SImode, K0_REG_NUM)));
11608 }
11609 else if (TARGET_MICROMIPS
11610 && !crtl->calls_eh_return
11611 && !sibcall_p
11612 && step2 > 0
11613 && mips_unsigned_immediate_p (step2, 5, 2))
11614 use_jraddiusp_p = true;
11615 else
11616 /* Deallocate the final bit of the frame. */
11617 mips_deallocate_stack (stack_pointer_rtx, GEN_INT (step2), 0);
11618 }
11619
11620 if (!use_jraddiusp_p)
11621 gcc_assert (!mips_epilogue.cfa_restores);
11622
11623 /* Add in the __builtin_eh_return stack adjustment. We need to
11624 use a temporary in MIPS16 code. */
11625 if (crtl->calls_eh_return)
11626 {
11627 if (TARGET_MIPS16)
11628 {
11629 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), stack_pointer_rtx);
11630 emit_insn (gen_add3_insn (MIPS_EPILOGUE_TEMP (Pmode),
11631 MIPS_EPILOGUE_TEMP (Pmode),
11632 EH_RETURN_STACKADJ_RTX));
11633 mips_emit_move (stack_pointer_rtx, MIPS_EPILOGUE_TEMP (Pmode));
11634 }
11635 else
11636 emit_insn (gen_add3_insn (stack_pointer_rtx,
11637 stack_pointer_rtx,
11638 EH_RETURN_STACKADJ_RTX));
11639 }
11640
11641 if (!sibcall_p)
11642 {
11643 mips_expand_before_return ();
11644 if (cfun->machine->interrupt_handler_p)
11645 {
11646 /* Interrupt handlers generate eret or deret. */
11647 if (cfun->machine->use_debug_exception_return_p)
11648 emit_jump_insn (gen_mips_deret ());
11649 else
11650 emit_jump_insn (gen_mips_eret ());
11651 }
11652 else
11653 {
11654 rtx pat;
11655
11656 /* When generating MIPS16 code, the normal
11657 mips_for_each_saved_gpr_and_fpr path will restore the return
11658 address into $7 rather than $31. */
11659 if (TARGET_MIPS16
11660 && !GENERATE_MIPS16E_SAVE_RESTORE
11661 && BITSET_P (frame->mask, RETURN_ADDR_REGNUM))
11662 {
11663 /* simple_returns cannot rely on values that are only available
11664 on paths through the epilogue (because return paths that do
11665 not pass through the epilogue may nevertheless reuse a
11666 simple_return that occurs at the end of the epilogue).
11667 Use a normal return here instead. */
11668 rtx reg = gen_rtx_REG (Pmode, GP_REG_FIRST + 7);
11669 pat = gen_return_internal (reg);
11670 }
11671 else if (use_jraddiusp_p)
11672 pat = gen_jraddiusp (GEN_INT (step2));
11673 else
11674 {
11675 rtx reg = gen_rtx_REG (Pmode, RETURN_ADDR_REGNUM);
11676 pat = gen_simple_return_internal (reg);
11677 }
11678 emit_jump_insn (pat);
11679 if (use_jraddiusp_p)
11680 mips_epilogue_set_cfa (stack_pointer_rtx, step2);
11681 }
11682 }
11683
11684 /* Search from the beginning to the first use of K0 or K1. */
11685 if (cfun->machine->interrupt_handler_p
11686 && !cfun->machine->keep_interrupts_masked_p)
11687 {
11688 for (insn = get_insns (); insn != NULL_RTX; insn = NEXT_INSN (insn))
11689 if (INSN_P (insn)
11690 && for_each_rtx (&PATTERN (insn), mips_kernel_reg_p, NULL))
11691 break;
11692 gcc_assert (insn != NULL_RTX);
11693 /* Insert disable interrupts before the first use of K0 or K1. */
11694 emit_insn_before (gen_mips_di (), insn);
11695 emit_insn_before (gen_mips_ehb (), insn);
11696 }
11697 }
11698 \f
11699 /* Return nonzero if this function is known to have a null epilogue.
11700 This allows the optimizer to omit jumps to jumps if no stack
11701 was created. */
11702
11703 bool
11704 mips_can_use_return_insn (void)
11705 {
11706 /* Interrupt handlers need to go through the epilogue. */
11707 if (cfun->machine->interrupt_handler_p)
11708 return false;
11709
11710 if (!reload_completed)
11711 return false;
11712
11713 if (crtl->profile)
11714 return false;
11715
11716 /* In MIPS16 mode, a function that returns a floating-point value
11717 needs to arrange to copy the return value into the floating-point
11718 registers. */
11719 if (mips16_cfun_returns_in_fpr_p ())
11720 return false;
11721
11722 return cfun->machine->frame.total_size == 0;
11723 }
11724 \f
11725 /* Return true if register REGNO can store a value of mode MODE.
11726 The result of this function is cached in mips_hard_regno_mode_ok. */
11727
11728 static bool
11729 mips_hard_regno_mode_ok_p (unsigned int regno, enum machine_mode mode)
11730 {
11731 unsigned int size;
11732 enum mode_class mclass;
11733
11734 if (mode == CCV2mode)
11735 return (ISA_HAS_8CC
11736 && ST_REG_P (regno)
11737 && (regno - ST_REG_FIRST) % 2 == 0);
11738
11739 if (mode == CCV4mode)
11740 return (ISA_HAS_8CC
11741 && ST_REG_P (regno)
11742 && (regno - ST_REG_FIRST) % 4 == 0);
11743
11744 if (mode == CCmode)
11745 return ISA_HAS_8CC ? ST_REG_P (regno) : regno == FPSW_REGNUM;
11746
11747 size = GET_MODE_SIZE (mode);
11748 mclass = GET_MODE_CLASS (mode);
11749
11750 if (GP_REG_P (regno))
11751 return ((regno - GP_REG_FIRST) & 1) == 0 || size <= UNITS_PER_WORD;
11752
11753 if (FP_REG_P (regno)
11754 && (((regno - FP_REG_FIRST) % MAX_FPRS_PER_FMT) == 0
11755 || (MIN_FPRS_PER_FMT == 1 && size <= UNITS_PER_FPREG)))
11756 {
11757 /* Allow 64-bit vector modes for Loongson-2E/2F. */
11758 if (TARGET_LOONGSON_VECTORS
11759 && (mode == V2SImode
11760 || mode == V4HImode
11761 || mode == V8QImode
11762 || mode == DImode))
11763 return true;
11764
11765 if (mclass == MODE_FLOAT
11766 || mclass == MODE_COMPLEX_FLOAT
11767 || mclass == MODE_VECTOR_FLOAT)
11768 return size <= UNITS_PER_FPVALUE;
11769
11770 /* Allow integer modes that fit into a single register. We need
11771 to put integers into FPRs when using instructions like CVT
11772 and TRUNC. There's no point allowing sizes smaller than a word,
11773 because the FPU has no appropriate load/store instructions. */
11774 if (mclass == MODE_INT)
11775 return size >= MIN_UNITS_PER_WORD && size <= UNITS_PER_FPREG;
11776 }
11777
11778 if (ACC_REG_P (regno)
11779 && (INTEGRAL_MODE_P (mode) || ALL_FIXED_POINT_MODE_P (mode)))
11780 {
11781 if (MD_REG_P (regno))
11782 {
11783 /* After a multiplication or division, clobbering HI makes
11784 the value of LO unpredictable, and vice versa. This means
11785 that, for all interesting cases, HI and LO are effectively
11786 a single register.
11787
11788 We model this by requiring that any value that uses HI
11789 also uses LO. */
11790 if (size <= UNITS_PER_WORD * 2)
11791 return regno == (size <= UNITS_PER_WORD ? LO_REGNUM : MD_REG_FIRST);
11792 }
11793 else
11794 {
11795 /* DSP accumulators do not have the same restrictions as
11796 HI and LO, so we can treat them as normal doubleword
11797 registers. */
11798 if (size <= UNITS_PER_WORD)
11799 return true;
11800
11801 if (size <= UNITS_PER_WORD * 2
11802 && ((regno - DSP_ACC_REG_FIRST) & 1) == 0)
11803 return true;
11804 }
11805 }
11806
11807 if (ALL_COP_REG_P (regno))
11808 return mclass == MODE_INT && size <= UNITS_PER_WORD;
11809
11810 if (regno == GOT_VERSION_REGNUM)
11811 return mode == SImode;
11812
11813 return false;
11814 }
11815
11816 /* Implement HARD_REGNO_NREGS. */
11817
11818 unsigned int
11819 mips_hard_regno_nregs (int regno, enum machine_mode mode)
11820 {
11821 if (ST_REG_P (regno))
11822 /* The size of FP status registers is always 4, because they only hold
11823 CCmode values, and CCmode is always considered to be 4 bytes wide. */
11824 return (GET_MODE_SIZE (mode) + 3) / 4;
11825
11826 if (FP_REG_P (regno))
11827 return (GET_MODE_SIZE (mode) + UNITS_PER_FPREG - 1) / UNITS_PER_FPREG;
11828
11829 /* All other registers are word-sized. */
11830 return (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
11831 }
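
/* Editor's note: two sample evaluations of the function above (not in
   the original source). With 32-bit FPRs (UNITS_PER_FPREG == 4), a
   DFmode value needs (8 + 4 - 1) / 4 == 2 floating-point registers; a
   CCV2mode value likewise needs (8 + 3) / 4 == 2 FP status registers,
   matching the even-register requirement in mips_hard_regno_mode_ok_p
   above. */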
11832
11833 /* Implement CLASS_MAX_NREGS, taking the maximum of the cases
11834 in mips_hard_regno_nregs. */
11835
11836 int
11837 mips_class_max_nregs (enum reg_class rclass, enum machine_mode mode)
11838 {
11839 int size;
11840 HARD_REG_SET left;
11841
11842 size = 0x8000;
11843 COPY_HARD_REG_SET (left, reg_class_contents[(int) rclass]);
11844 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) ST_REGS]))
11845 {
11846 if (HARD_REGNO_MODE_OK (ST_REG_FIRST, mode))
11847 size = MIN (size, 4);
11848 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) ST_REGS]);
11849 }
11850 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) FP_REGS]))
11851 {
11852 if (HARD_REGNO_MODE_OK (FP_REG_FIRST, mode))
11853 size = MIN (size, UNITS_PER_FPREG);
11854 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) FP_REGS]);
11855 }
11856 if (!hard_reg_set_empty_p (left))
11857 size = MIN (size, UNITS_PER_WORD);
11858 return (GET_MODE_SIZE (mode) + size - 1) / size;
11859 }
11860
11861 /* Implement CANNOT_CHANGE_MODE_CLASS. */
11862
11863 bool
11864 mips_cannot_change_mode_class (enum machine_mode from,
11865 enum machine_mode to,
11866 enum reg_class rclass)
11867 {
11868 /* Allow conversions between different Loongson integer vectors,
11869 and between those vectors and DImode. */
11870 if (GET_MODE_SIZE (from) == 8 && GET_MODE_SIZE (to) == 8
11871 && INTEGRAL_MODE_P (from) && INTEGRAL_MODE_P (to))
11872 return false;
11873
11874 /* Otherwise, there are several problems with changing the modes of
11875 values in floating-point registers:
11876
11877 - When a multi-word value is stored in paired floating-point
11878 registers, the first register always holds the low word. We
11879 therefore can't allow FPRs to change between single-word and
11880 multi-word modes on big-endian targets.
11881
11882 - GCC assumes that each word of a multiword register can be
11883 accessed individually using SUBREGs. This is not true for
11884 floating-point registers if they are bigger than a word.
11885
11886 - Loading a 32-bit value into a 64-bit floating-point register
11887 will not sign-extend the value, despite what LOAD_EXTEND_OP
11888 says. We can't allow FPRs to change from SImode to a wider
11889 mode on 64-bit targets.
11890
11891 - If the FPU has already interpreted a value in one format, we
11892 must not ask it to treat the value as having a different
11893 format.
11894
11895 We therefore disallow all mode changes involving FPRs. */
11896
11897 return reg_classes_intersect_p (FP_REGS, rclass);
11898 }
11899
11900 /* Implement target hook small_register_classes_for_mode_p. */
11901
11902 static bool
11903 mips_small_register_classes_for_mode_p (enum machine_mode mode
11904 ATTRIBUTE_UNUSED)
11905 {
11906 return TARGET_MIPS16;
11907 }
11908
11909 /* Return true if moves in mode MODE can use the FPU's mov.fmt instruction. */
11910
11911 static bool
11912 mips_mode_ok_for_mov_fmt_p (enum machine_mode mode)
11913 {
11914 switch (mode)
11915 {
11916 case SFmode:
11917 return TARGET_HARD_FLOAT;
11918
11919 case DFmode:
11920 return TARGET_HARD_FLOAT && TARGET_DOUBLE_FLOAT;
11921
11922 case V2SFmode:
11923 return TARGET_HARD_FLOAT && TARGET_PAIRED_SINGLE_FLOAT;
11924
11925 default:
11926 return false;
11927 }
11928 }
11929
11930 /* Implement MODES_TIEABLE_P. */
11931
11932 bool
11933 mips_modes_tieable_p (enum machine_mode mode1, enum machine_mode mode2)
11934 {
11935 /* FPRs allow no mode punning, so it's not worth tying modes if we'd
11936 prefer to put one of them in FPRs. */
11937 return (mode1 == mode2
11938 || (!mips_mode_ok_for_mov_fmt_p (mode1)
11939 && !mips_mode_ok_for_mov_fmt_p (mode2)));
11940 }
11941
11942 /* Implement TARGET_PREFERRED_RELOAD_CLASS. */
11943
11944 static reg_class_t
11945 mips_preferred_reload_class (rtx x, reg_class_t rclass)
11946 {
11947 if (mips_dangerous_for_la25_p (x) && reg_class_subset_p (LEA_REGS, rclass))
11948 return LEA_REGS;
11949
11950 if (reg_class_subset_p (FP_REGS, rclass)
11951 && mips_mode_ok_for_mov_fmt_p (GET_MODE (x)))
11952 return FP_REGS;
11953
11954 if (reg_class_subset_p (GR_REGS, rclass))
11955 rclass = GR_REGS;
11956
11957 if (TARGET_MIPS16 && reg_class_subset_p (M16_REGS, rclass))
11958 rclass = M16_REGS;
11959
11960 return rclass;
11961 }
11962
11963 /* RCLASS is a class involved in a REGISTER_MOVE_COST calculation.
11964 Return a "canonical" class to represent it in later calculations. */
11965
11966 static reg_class_t
11967 mips_canonicalize_move_class (reg_class_t rclass)
11968 {
11969 /* All moves involving accumulator registers have the same cost. */
11970 if (reg_class_subset_p (rclass, ACC_REGS))
11971 rclass = ACC_REGS;
11972
11973 /* Likewise promote subclasses of general registers to the most
11974 interesting containing class. */
11975 if (TARGET_MIPS16 && reg_class_subset_p (rclass, M16_REGS))
11976 rclass = M16_REGS;
11977 else if (reg_class_subset_p (rclass, GENERAL_REGS))
11978 rclass = GENERAL_REGS;
11979
11980 return rclass;
11981 }
11982
11983 /* Return the cost of moving a value from a register of class FROM to a GPR.
11984 Return 0 for classes that are unions of other classes handled by this
11985 function. */
11986
11987 static int
11988 mips_move_to_gpr_cost (reg_class_t from)
11989 {
11990 switch (from)
11991 {
11992 case M16_REGS:
11993 case GENERAL_REGS:
11994 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
11995 return 2;
11996
11997 case ACC_REGS:
11998 /* MFLO and MFHI. */
11999 return 6;
12000
12001 case FP_REGS:
12002 /* MFC1, etc. */
12003 return 4;
12004
12005 case COP0_REGS:
12006 case COP2_REGS:
12007 case COP3_REGS:
12008 /* This choice of value is historical. */
12009 return 5;
12010
12011 default:
12012 return 0;
12013 }
12014 }
12015
12016 /* Return the cost of moving a value from a GPR to a register of class TO.
12017 Return 0 for classes that are unions of other classes handled by this
12018 function. */
12019
12020 static int
12021 mips_move_from_gpr_cost (reg_class_t to)
12022 {
12023 switch (to)
12024 {
12025 case M16_REGS:
12026 case GENERAL_REGS:
12027 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
12028 return 2;
12029
12030 case ACC_REGS:
12031 /* MTLO and MTHI. */
12032 return 6;
12033
12034 case FP_REGS:
12035 /* MTC1, etc. */
12036 return 4;
12037
12038 case COP0_REGS:
12039 case COP2_REGS:
12040 case COP3_REGS:
12041 /* This choice of value is historical. */
12042 return 5;
12043
12044 default:
12045 return 0;
12046 }
12047 }
12048
12049 /* Implement TARGET_REGISTER_MOVE_COST. Return 0 for classes that are the
12050 maximum of the move costs for subclasses; regclass will work out
12051 the maximum for us. */
12052
12053 static int
12054 mips_register_move_cost (enum machine_mode mode,
12055 reg_class_t from, reg_class_t to)
12056 {
12057 reg_class_t dregs;
12058 int cost1, cost2;
12059
12060 from = mips_canonicalize_move_class (from);
12061 to = mips_canonicalize_move_class (to);
12062
12063 /* Handle moves that can be done without using general-purpose registers. */
12064 if (from == FP_REGS)
12065 {
12066 if (to == FP_REGS && mips_mode_ok_for_mov_fmt_p (mode))
12067 /* MOV.FMT. */
12068 return 4;
12069 }
12070
12071 /* Handle cases in which only one class deviates from the ideal. */
12072 dregs = TARGET_MIPS16 ? M16_REGS : GENERAL_REGS;
12073 if (from == dregs)
12074 return mips_move_from_gpr_cost (to);
12075 if (to == dregs)
12076 return mips_move_to_gpr_cost (from);
12077
12078 /* Handle cases that require a GPR temporary. */
12079 cost1 = mips_move_to_gpr_cost (from);
12080 if (cost1 != 0)
12081 {
12082 cost2 = mips_move_from_gpr_cost (to);
12083 if (cost2 != 0)
12084 return cost1 + cost2;
12085 }
12086
12087 return 0;
12088 }
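
/* Editor's note: a worked example of the calculation above, not part of
   the original source. Moving from FP_REGS to ACC_REGS matches neither
   special case, so the result is mips_move_to_gpr_cost (FP_REGS)
   + mips_move_from_gpr_cost (ACC_REGS) == 4 + 6 == 10, i.e. an MFC1
   into a GPR temporary followed by an MTLO or MTHI. */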
12089
12090 /* Implement TARGET_REGISTER_PRIORITY. */
12091
12092 static int
12093 mips_register_priority (int hard_regno)
12094 {
12095 /* Treat MIPS16 registers with higher priority than other regs. */
12096 if (TARGET_MIPS16
12097 && TEST_HARD_REG_BIT (reg_class_contents[M16_REGS], hard_regno))
12098 return 1;
12099 return 0;
12100 }
12101
12102 /* Implement TARGET_MEMORY_MOVE_COST. */
12103
12104 static int
12105 mips_memory_move_cost (enum machine_mode mode, reg_class_t rclass, bool in)
12106 {
12107 return (mips_cost->memory_latency
12108 + memory_move_secondary_cost (mode, rclass, in));
12109 }
12110
12111 /* Return the register class required for a secondary register when
12112 copying between one of the registers in RCLASS and value X, which
12113 has mode MODE. X is the source of the move if IN_P, otherwise it
12114 is the destination. Return NO_REGS if no secondary register is
12115 needed. */
12116
12117 enum reg_class
12118 mips_secondary_reload_class (enum reg_class rclass,
12119 enum machine_mode mode, rtx x, bool)
12120 {
12121 int regno;
12122
12123 /* If X is a constant that cannot be loaded into $25, it must be loaded
12124 into some other GPR. No other register class allows a direct move. */
12125 if (mips_dangerous_for_la25_p (x))
12126 return reg_class_subset_p (rclass, LEA_REGS) ? NO_REGS : LEA_REGS;
12127
12128 regno = true_regnum (x);
12129 if (TARGET_MIPS16)
12130 {
12131 /* In MIPS16 mode, every move must involve a member of M16_REGS. */
12132 if (!reg_class_subset_p (rclass, M16_REGS) && !M16_REG_P (regno))
12133 return M16_REGS;
12134
12135 return NO_REGS;
12136 }
12137
12138 /* Copying from accumulator registers to anywhere other than a general
12139 register requires a temporary general register. */
12140 if (reg_class_subset_p (rclass, ACC_REGS))
12141 return GP_REG_P (regno) ? NO_REGS : GR_REGS;
12142 if (ACC_REG_P (regno))
12143 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
12144
12145 if (reg_class_subset_p (rclass, FP_REGS))
12146 {
12147 if (MEM_P (x)
12148 && (GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8))
12149 /* In this case we can use lwc1, swc1, ldc1 or sdc1. We'll use
12150 pairs of lwc1s and swc1s if ldc1 and sdc1 are not supported. */
12151 return NO_REGS;
12152
12153 if (GP_REG_P (regno) || x == CONST0_RTX (mode))
12154 /* In this case we can use mtc1, mfc1, dmtc1 or dmfc1. */
12155 return NO_REGS;
12156
12157 if (CONSTANT_P (x) && !targetm.cannot_force_const_mem (mode, x))
12158 /* We can force the constant to memory and use lwc1
12159 and ldc1. As above, we will use pairs of lwc1s if
12160 ldc1 is not supported. */
12161 return NO_REGS;
12162
12163 if (FP_REG_P (regno) && mips_mode_ok_for_mov_fmt_p (mode))
12164 /* In this case we can use mov.fmt. */
12165 return NO_REGS;
12166
12167 /* Otherwise, we need to reload through an integer register. */
12168 return GR_REGS;
12169 }
12170 if (FP_REG_P (regno))
12171 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
12172
12173 return NO_REGS;
12174 }
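/* For example, copying $lo into an FPR matches none of the direct-move
cases above: ACC_REG_P triggers a GR_REGS temporary, so reload emits
something like
mflo $2
mtc1 $2,$f0
rather than attempting a (nonexistent) direct accumulator-to-FPR move.
Register choices here are illustrative only. */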
12175
12176 /* Implement TARGET_MODE_REP_EXTENDED. */
12177
12178 static int
12179 mips_mode_rep_extended (enum machine_mode mode, enum machine_mode mode_rep)
12180 {
12181 /* On 64-bit targets, SImode register values are sign-extended to DImode. */
12182 if (TARGET_64BIT && mode == SImode && mode_rep == DImode)
12183 return SIGN_EXTEND;
12184
12185 return UNKNOWN;
12186 }
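/* For example, a 32-bit "lw" on a 64-bit target leaves bits 32-63 equal
to bit 31, so SImode register values already satisfy the DImode
sign-extension invariant and no explicit sign-extension pair is needed
when widening. */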
12187 \f
12188 /* Implement TARGET_VALID_POINTER_MODE. */
12189
12190 static bool
12191 mips_valid_pointer_mode (enum machine_mode mode)
12192 {
12193 return mode == SImode || (TARGET_64BIT && mode == DImode);
12194 }
12195
12196 /* Implement TARGET_VECTOR_MODE_SUPPORTED_P. */
12197
12198 static bool
12199 mips_vector_mode_supported_p (enum machine_mode mode)
12200 {
12201 switch (mode)
12202 {
12203 case V2SFmode:
12204 return TARGET_PAIRED_SINGLE_FLOAT;
12205
12206 case V2HImode:
12207 case V4QImode:
12208 case V2HQmode:
12209 case V2UHQmode:
12210 case V2HAmode:
12211 case V2UHAmode:
12212 case V4QQmode:
12213 case V4UQQmode:
12214 return TARGET_DSP;
12215
12216 case V2SImode:
12217 case V4HImode:
12218 case V8QImode:
12219 return TARGET_LOONGSON_VECTORS;
12220
12221 default:
12222 return false;
12223 }
12224 }
12225
12226 /* Implement TARGET_SCALAR_MODE_SUPPORTED_P. */
12227
12228 static bool
12229 mips_scalar_mode_supported_p (enum machine_mode mode)
12230 {
12231 if (ALL_FIXED_POINT_MODE_P (mode)
12232 && GET_MODE_PRECISION (mode) <= 2 * BITS_PER_WORD)
12233 return true;
12234
12235 return default_scalar_mode_supported_p (mode);
12236 }
12237 \f
12238 /* Implement TARGET_VECTORIZE_PREFERRED_SIMD_MODE. */
12239
12240 static enum machine_mode
12241 mips_preferred_simd_mode (enum machine_mode mode ATTRIBUTE_UNUSED)
12242 {
12243 if (TARGET_PAIRED_SINGLE_FLOAT
12244 && mode == SFmode)
12245 return V2SFmode;
12246 return word_mode;
12247 }
12248
12249 /* Implement TARGET_INIT_LIBFUNCS. */
12250
12251 static void
12252 mips_init_libfuncs (void)
12253 {
12254 if (TARGET_FIX_VR4120)
12255 {
12256 /* Register the special divsi3 and modsi3 functions needed to work
12257 around VR4120 division errata. */
12258 set_optab_libfunc (sdiv_optab, SImode, "__vr4120_divsi3");
12259 set_optab_libfunc (smod_optab, SImode, "__vr4120_modsi3");
12260 }
12261
12262 if (TARGET_MIPS16 && TARGET_HARD_FLOAT_ABI)
12263 {
12264 /* Register the MIPS16 -mhard-float stubs. */
12265 set_optab_libfunc (add_optab, SFmode, "__mips16_addsf3");
12266 set_optab_libfunc (sub_optab, SFmode, "__mips16_subsf3");
12267 set_optab_libfunc (smul_optab, SFmode, "__mips16_mulsf3");
12268 set_optab_libfunc (sdiv_optab, SFmode, "__mips16_divsf3");
12269
12270 set_optab_libfunc (eq_optab, SFmode, "__mips16_eqsf2");
12271 set_optab_libfunc (ne_optab, SFmode, "__mips16_nesf2");
12272 set_optab_libfunc (gt_optab, SFmode, "__mips16_gtsf2");
12273 set_optab_libfunc (ge_optab, SFmode, "__mips16_gesf2");
12274 set_optab_libfunc (lt_optab, SFmode, "__mips16_ltsf2");
12275 set_optab_libfunc (le_optab, SFmode, "__mips16_lesf2");
12276 set_optab_libfunc (unord_optab, SFmode, "__mips16_unordsf2");
12277
12278 set_conv_libfunc (sfix_optab, SImode, SFmode, "__mips16_fix_truncsfsi");
12279 set_conv_libfunc (sfloat_optab, SFmode, SImode, "__mips16_floatsisf");
12280 set_conv_libfunc (ufloat_optab, SFmode, SImode, "__mips16_floatunsisf");
12281
12282 if (TARGET_DOUBLE_FLOAT)
12283 {
12284 set_optab_libfunc (add_optab, DFmode, "__mips16_adddf3");
12285 set_optab_libfunc (sub_optab, DFmode, "__mips16_subdf3");
12286 set_optab_libfunc (smul_optab, DFmode, "__mips16_muldf3");
12287 set_optab_libfunc (sdiv_optab, DFmode, "__mips16_divdf3");
12288
12289 set_optab_libfunc (eq_optab, DFmode, "__mips16_eqdf2");
12290 set_optab_libfunc (ne_optab, DFmode, "__mips16_nedf2");
12291 set_optab_libfunc (gt_optab, DFmode, "__mips16_gtdf2");
12292 set_optab_libfunc (ge_optab, DFmode, "__mips16_gedf2");
12293 set_optab_libfunc (lt_optab, DFmode, "__mips16_ltdf2");
12294 set_optab_libfunc (le_optab, DFmode, "__mips16_ledf2");
12295 set_optab_libfunc (unord_optab, DFmode, "__mips16_unorddf2");
12296
12297 set_conv_libfunc (sext_optab, DFmode, SFmode,
12298 "__mips16_extendsfdf2");
12299 set_conv_libfunc (trunc_optab, SFmode, DFmode,
12300 "__mips16_truncdfsf2");
12301 set_conv_libfunc (sfix_optab, SImode, DFmode,
12302 "__mips16_fix_truncdfsi");
12303 set_conv_libfunc (sfloat_optab, DFmode, SImode,
12304 "__mips16_floatsidf");
12305 set_conv_libfunc (ufloat_optab, DFmode, SImode,
12306 "__mips16_floatunsidf");
12307 }
12308 }
12309
12310 /* The MIPS16 ISA does not have an encoding for "sync", so we rely
12311 on an external non-MIPS16 routine to implement __sync_synchronize.
12312 Similarly for the rest of the ll/sc libfuncs. */
12313 if (TARGET_MIPS16)
12314 {
12315 synchronize_libfunc = init_one_libfunc ("__sync_synchronize");
12316 init_sync_libfuncs (UNITS_PER_WORD);
12317 }
12318 }
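/* With the stubs above registered, a MIPS16 hard-float function
compiles a float addition into a call such as
jal __mips16_addsf3
instead of an inline add.s, keeping the MIPS16 code itself free of FPU
instructions. This is a sketch only; the exact call sequence depends
on the ABI and PIC mode. */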
12319
12320 /* Build up a multi-insn sequence that loads label TARGET into $AT. */
12321
12322 static void
12323 mips_process_load_label (rtx target)
12324 {
12325 rtx base, gp, intop;
12326 HOST_WIDE_INT offset;
12327
12328 mips_multi_start ();
12329 switch (mips_abi)
12330 {
12331 case ABI_N32:
12332 mips_multi_add_insn ("lw\t%@,%%got_page(%0)(%+)", target, 0);
12333 mips_multi_add_insn ("addiu\t%@,%@,%%got_ofst(%0)", target, 0);
12334 break;
12335
12336 case ABI_64:
12337 mips_multi_add_insn ("ld\t%@,%%got_page(%0)(%+)", target, 0);
12338 mips_multi_add_insn ("daddiu\t%@,%@,%%got_ofst(%0)", target, 0);
12339 break;
12340
12341 default:
12342 gp = pic_offset_table_rtx;
12343 if (mips_cfun_has_cprestore_slot_p ())
12344 {
12345 gp = gen_rtx_REG (Pmode, AT_REGNUM);
12346 mips_get_cprestore_base_and_offset (&base, &offset, true);
12347 if (!SMALL_OPERAND (offset))
12348 {
12349 intop = GEN_INT (CONST_HIGH_PART (offset));
12350 mips_multi_add_insn ("lui\t%0,%1", gp, intop, 0);
12351 mips_multi_add_insn ("addu\t%0,%0,%1", gp, base, 0);
12352
12353 base = gp;
12354 offset = CONST_LOW_PART (offset);
12355 }
12356 intop = GEN_INT (offset);
12357 if (ISA_HAS_LOAD_DELAY)
12358 mips_multi_add_insn ("lw\t%0,%1(%2)%#", gp, intop, base, 0);
12359 else
12360 mips_multi_add_insn ("lw\t%0,%1(%2)", gp, intop, base, 0);
12361 }
12362 if (ISA_HAS_LOAD_DELAY)
12363 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)%#", target, gp, 0);
12364 else
12365 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)", target, gp, 0);
12366 mips_multi_add_insn ("addiu\t%@,%@,%%lo(%0)", target, 0);
12367 break;
12368 }
12369 }
12370
12371 /* Return the number of instructions needed to load a label into $AT. */
12372
12373 static unsigned int
12374 mips_load_label_num_insns (void)
12375 {
12376 if (cfun->machine->load_label_num_insns == 0)
12377 {
12378 mips_process_load_label (pc_rtx);
12379 cfun->machine->load_label_num_insns = mips_multi_num_insns;
12380 }
12381 return cfun->machine->load_label_num_insns;
12382 }
12383
12384 /* Emit an asm sequence to start a noat block and load the address
12385 of a label into $1. */
12386
12387 void
12388 mips_output_load_label (rtx target)
12389 {
12390 mips_push_asm_switch (&mips_noat);
12391 if (TARGET_EXPLICIT_RELOCS)
12392 {
12393 mips_process_load_label (target);
12394 mips_multi_write ();
12395 }
12396 else
12397 {
12398 if (Pmode == DImode)
12399 output_asm_insn ("dla\t%@,%0", &target);
12400 else
12401 output_asm_insn ("la\t%@,%0", &target);
12402 }
12403 }
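/* For o32 with explicit relocs and no cprestore slot, the sequence
built above is typically
lw $1,%got($L123)($28)
addiu $1,$1,%lo($L123)
i.e. two instructions, while n64 uses ld/daddiu with
%got_page/%got_ofst. $L123 is an illustrative label name. */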
12404
12405 /* Return the length of INSN. LENGTH is the initial length computed by
12406 attributes in the machine-description file. */
12407
12408 int
12409 mips_adjust_insn_length (rtx_insn *insn, int length)
12410 {
12411 /* mips.md uses MAX_PIC_BRANCH_LENGTH as a placeholder for the length
12412 of a PIC long-branch sequence. Substitute the correct value. */
12413 if (length == MAX_PIC_BRANCH_LENGTH
12414 && JUMP_P (insn)
12415 && INSN_CODE (insn) >= 0
12416 && get_attr_type (insn) == TYPE_BRANCH)
12417 {
12418 /* Add the branch-over instruction and its delay slot, if this
12419 is a conditional branch. */
12420 length = simplejump_p (insn) ? 0 : 8;
12421
12422 /* Add the size of a load into $AT. */
12423 length += BASE_INSN_LENGTH * mips_load_label_num_insns ();
12424
12425 /* Add the length of an indirect jump, ignoring the delay slot. */
12426 length += TARGET_COMPRESSION ? 2 : 4;
12427 }
12428
12429 /* An unconditional jump has an unfilled delay slot if it is not part
12430 of a sequence. A conditional jump normally has a delay slot, but
12431 does not on MIPS16. */
12432 if (CALL_P (insn) || (TARGET_MIPS16 ? simplejump_p (insn) : JUMP_P (insn)))
12433 length += TARGET_MIPS16 ? 2 : 4;
12434
12435 /* See how many nops might be needed to avoid hardware hazards. */
12436 if (!cfun->machine->ignore_hazard_length_p
12437 && INSN_P (insn)
12438 && INSN_CODE (insn) >= 0)
12439 switch (get_attr_hazard (insn))
12440 {
12441 case HAZARD_NONE:
12442 break;
12443
12444 case HAZARD_DELAY:
12445 length += NOP_INSN_LENGTH;
12446 break;
12447
12448 case HAZARD_HILO:
12449 length += NOP_INSN_LENGTH * 2;
12450 break;
12451 }
12452
12453 return length;
12454 }
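/* As a worked example, a conditional branch that needs the PIC
long-branch form under o32 explicit relocs comes to
8 (branch-over plus its delay slot) + 2 * 4 (GOT load of the label)
+ 4 (indirect jump) = 20 bytes, before any hazard nops, assuming the
usual 4-byte BASE_INSN_LENGTH and the two-instruction label load
described above. */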
12455
12456 /* Return the assembly code for INSN, which has the operands given by
12457 OPERANDS, and which branches to OPERANDS[0] if some condition is true.
12458 BRANCH_IF_TRUE is the asm template that should be used if OPERANDS[0]
12459 is in range of a direct branch. BRANCH_IF_FALSE is an inverted
12460 version of BRANCH_IF_TRUE. */
12461
12462 const char *
12463 mips_output_conditional_branch (rtx_insn *insn, rtx *operands,
12464 const char *branch_if_true,
12465 const char *branch_if_false)
12466 {
12467 unsigned int length;
12468 rtx taken, not_taken;
12469
12470 gcc_assert (LABEL_P (operands[0]));
12471
12472 length = get_attr_length (insn);
12473 if (length <= 8)
12474 {
12475 /* Just a simple conditional branch. */
12476 mips_branch_likely = (final_sequence && INSN_ANNULLED_BRANCH_P (insn));
12477 return branch_if_true;
12478 }
12479
12480 /* Generate a reversed branch around a direct jump. This fallback does
12481 not use branch-likely instructions. */
12482 mips_branch_likely = false;
12483 not_taken = gen_label_rtx ();
12484 taken = operands[0];
12485
12486 /* Generate the reversed branch to NOT_TAKEN. */
12487 operands[0] = not_taken;
12488 output_asm_insn (branch_if_false, operands);
12489
12490 /* If INSN has a delay slot, we must provide delay slots for both the
12491 branch to NOT_TAKEN and the conditional jump. We must also ensure
12492 that INSN's delay slot is executed in the appropriate cases. */
12493 if (final_sequence)
12494 {
12495 /* This first delay slot will always be executed, so use INSN's
12496 delay slot if it is not annulled. */
12497 if (!INSN_ANNULLED_BRANCH_P (insn))
12498 {
12499 final_scan_insn (XVECEXP (final_sequence, 0, 1),
12500 asm_out_file, optimize, 1, NULL);
12501 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
12502 }
12503 else
12504 output_asm_insn ("nop", 0);
12505 fprintf (asm_out_file, "\n");
12506 }
12507
12508 /* Output the unconditional branch to TAKEN. */
12509 if (TARGET_ABSOLUTE_JUMPS)
12510 output_asm_insn (MIPS_ABSOLUTE_JUMP ("j\t%0%/"), &taken);
12511 else
12512 {
12513 mips_output_load_label (taken);
12514 output_asm_insn ("jr\t%@%]%/", 0);
12515 }
12516
12517 /* Now deal with its delay slot; see above. */
12518 if (final_sequence)
12519 {
12520 /* This delay slot will only be executed if the branch is taken.
12521 Use INSN's delay slot if it is annulled. */
12522 if (INSN_ANNULLED_BRANCH_P (insn))
12523 {
12524 final_scan_insn (XVECEXP (final_sequence, 0, 1),
12525 asm_out_file, optimize, 1, NULL);
12526 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
12527 }
12528 else
12529 output_asm_insn ("nop", 0);
12530 fprintf (asm_out_file, "\n");
12531 }
12532
12533 /* Output NOT_TAKEN. */
12534 targetm.asm_out.internal_label (asm_out_file, "L",
12535 CODE_LABEL_NUMBER (not_taken));
12536 return "";
12537 }
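/* The out-of-range case above therefore emits a shape like
b<inverted cond> 1f
nop # or INSN's delay insn if not annulled
j <target> # or a load-label/jr pair without absolute jumps
nop # or INSN's delay insn if annulled
1:
trading one extra branch for unlimited range. The assembly is
illustrative; see the code for the exact operands. */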
12538
12539 /* Return the assembly code for INSN, which branches to OPERANDS[0]
12540 if some ordering condition is true. The condition is given by
12541 OPERANDS[1] if !INVERTED_P, otherwise it is the inverse of
12542 OPERANDS[1]. OPERANDS[2] is the comparison's first operand;
12543 its second is always zero. */
12544
12545 const char *
12546 mips_output_order_conditional_branch (rtx_insn *insn, rtx *operands, bool inverted_p)
12547 {
12548 const char *branch[2];
12549
12550 /* Make BRANCH[1] branch to OPERANDS[0] when the condition is true.
12551 Make BRANCH[0] branch on the inverse condition. */
12552 switch (GET_CODE (operands[1]))
12553 {
12554 /* These cases are equivalent to comparisons against zero. */
12555 case LEU:
12556 inverted_p = !inverted_p;
12557 /* Fall through. */
12558 case GTU:
12559 branch[!inverted_p] = MIPS_BRANCH ("bne", "%2,%.,%0");
12560 branch[inverted_p] = MIPS_BRANCH ("beq", "%2,%.,%0");
12561 break;
12562
12563 /* These cases are always true or always false. */
12564 case LTU:
12565 inverted_p = !inverted_p;
12566 /* Fall through. */
12567 case GEU:
12568 branch[!inverted_p] = MIPS_BRANCH ("beq", "%.,%.,%0");
12569 branch[inverted_p] = MIPS_BRANCH ("bne", "%.,%.,%0");
12570 break;
12571
12572 default:
12573 branch[!inverted_p] = MIPS_BRANCH ("b%C1z", "%2,%0");
12574 branch[inverted_p] = MIPS_BRANCH ("b%N1z", "%2,%0");
12575 break;
12576 }
12577 return mips_output_conditional_branch (insn, operands, branch[1], branch[0]);
12578 }
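/* For example, (gtu x 0) is simply "x != 0", so it becomes the BNE
form above, while (geu x 0) is always true and degenerates into an
unconditional "beq $0,$0" branch. */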
12579 \f
12580 /* Start a block of code that needs access to the LL, SC and SYNC
12581 instructions. */
12582
12583 static void
12584 mips_start_ll_sc_sync_block (void)
12585 {
12586 if (!ISA_HAS_LL_SC)
12587 {
12588 output_asm_insn (".set\tpush", 0);
12589 if (TARGET_64BIT)
12590 output_asm_insn (".set\tmips3", 0);
12591 else
12592 output_asm_insn (".set\tmips2", 0);
12593 }
12594 }
12595
12596 /* End a block started by mips_start_ll_sc_sync_block. */
12597
12598 static void
12599 mips_end_ll_sc_sync_block (void)
12600 {
12601 if (!ISA_HAS_LL_SC)
12602 output_asm_insn (".set\tpop", 0);
12603 }
12604
12605 /* Output and/or return the asm template for a sync instruction. */
12606
12607 const char *
12608 mips_output_sync (void)
12609 {
12610 mips_start_ll_sc_sync_block ();
12611 output_asm_insn ("sync", 0);
12612 mips_end_ll_sc_sync_block ();
12613 return "";
12614 }
12615
12616 /* Return the asm template associated with sync_insn1 value TYPE.
12617 IS_64BIT_P is true if we want a 64-bit rather than 32-bit operation. */
12618
12619 static const char *
12620 mips_sync_insn1_template (enum attr_sync_insn1 type, bool is_64bit_p)
12621 {
12622 switch (type)
12623 {
12624 case SYNC_INSN1_MOVE:
12625 return "move\t%0,%z2";
12626 case SYNC_INSN1_LI:
12627 return "li\t%0,%2";
12628 case SYNC_INSN1_ADDU:
12629 return is_64bit_p ? "daddu\t%0,%1,%z2" : "addu\t%0,%1,%z2";
12630 case SYNC_INSN1_ADDIU:
12631 return is_64bit_p ? "daddiu\t%0,%1,%2" : "addiu\t%0,%1,%2";
12632 case SYNC_INSN1_SUBU:
12633 return is_64bit_p ? "dsubu\t%0,%1,%z2" : "subu\t%0,%1,%z2";
12634 case SYNC_INSN1_AND:
12635 return "and\t%0,%1,%z2";
12636 case SYNC_INSN1_ANDI:
12637 return "andi\t%0,%1,%2";
12638 case SYNC_INSN1_OR:
12639 return "or\t%0,%1,%z2";
12640 case SYNC_INSN1_ORI:
12641 return "ori\t%0,%1,%2";
12642 case SYNC_INSN1_XOR:
12643 return "xor\t%0,%1,%z2";
12644 case SYNC_INSN1_XORI:
12645 return "xori\t%0,%1,%2";
12646 }
12647 gcc_unreachable ();
12648 }
12649
12650 /* Return the asm template associated with sync_insn2 value TYPE. */
12651
12652 static const char *
12653 mips_sync_insn2_template (enum attr_sync_insn2 type)
12654 {
12655 switch (type)
12656 {
12657 case SYNC_INSN2_NOP:
12658 gcc_unreachable ();
12659 case SYNC_INSN2_AND:
12660 return "and\t%0,%1,%z2";
12661 case SYNC_INSN2_XOR:
12662 return "xor\t%0,%1,%z2";
12663 case SYNC_INSN2_NOT:
12664 return "nor\t%0,%1,%.";
12665 }
12666 gcc_unreachable ();
12667 }
12668
12669 /* OPERANDS are the operands to a sync loop instruction and INDEX is
12670 the value of one of the sync_* attributes. Return the operand
12671 referred to by the attribute, or DEFAULT_VALUE if the insn doesn't
12672 have the associated attribute. */
12673
12674 static rtx
12675 mips_get_sync_operand (rtx *operands, int index, rtx default_value)
12676 {
12677 if (index > 0)
12678 default_value = operands[index - 1];
12679 return default_value;
12680 }
12681
12682 /* INSN is a sync loop with operands OPERANDS. Build up a multi-insn
12683 sequence for it. */
12684
12685 static void
12686 mips_process_sync_loop (rtx insn, rtx *operands)
12687 {
12688 rtx at, mem, oldval, newval, inclusive_mask, exclusive_mask;
12689 rtx required_oldval, insn1_op2, tmp1, tmp2, tmp3, cmp;
12690 unsigned int tmp3_insn;
12691 enum attr_sync_insn1 insn1;
12692 enum attr_sync_insn2 insn2;
12693 bool is_64bit_p;
12694 int memmodel_attr;
12695 enum memmodel model;
12696
12697 /* Read an operand from the sync_WHAT attribute and store it in
12698 variable WHAT. DEFAULT is the default value if no attribute
12699 is specified. */
12700 #define READ_OPERAND(WHAT, DEFAULT) \
12701 WHAT = mips_get_sync_operand (operands, (int) get_attr_sync_##WHAT (insn), \
12702 DEFAULT)
12703
12704 /* Read the memory. */
12705 READ_OPERAND (mem, 0);
12706 gcc_assert (mem);
12707 is_64bit_p = (GET_MODE_BITSIZE (GET_MODE (mem)) == 64);
12708
12709 /* Read the other attributes. */
12710 at = gen_rtx_REG (GET_MODE (mem), AT_REGNUM);
12711 READ_OPERAND (oldval, at);
12712 READ_OPERAND (cmp, 0);
12713 READ_OPERAND (newval, at);
12714 READ_OPERAND (inclusive_mask, 0);
12715 READ_OPERAND (exclusive_mask, 0);
12716 READ_OPERAND (required_oldval, 0);
12717 READ_OPERAND (insn1_op2, 0);
12718 insn1 = get_attr_sync_insn1 (insn);
12719 insn2 = get_attr_sync_insn2 (insn);
12720
12721 /* Don't bother setting a CMP result that is never used. */
12722 if (cmp && find_reg_note (insn, REG_UNUSED, cmp))
12723 cmp = 0;
12724
12725 memmodel_attr = get_attr_sync_memmodel (insn);
12726 switch (memmodel_attr)
12727 {
12728 case 10:
12729 model = MEMMODEL_ACQ_REL;
12730 break;
12731 case 11:
12732 model = MEMMODEL_ACQUIRE;
12733 break;
12734 default:
12735 model = (enum memmodel) INTVAL (operands[memmodel_attr]);
12736 }
12737
12738 mips_multi_start ();
12739
12740 /* Output the release side of the memory barrier. */
12741 if (need_atomic_barrier_p (model, true))
12742 {
12743 if (required_oldval == 0 && TARGET_OCTEON)
12744 {
12745 /* Octeon doesn't reorder reads, so a full barrier can be
12746 created by using SYNCW to order writes combined with the
12747 write from the following SC. When the SC successfully
12748 completes, we know that all preceding writes are also
12749 committed to the coherent memory system. It is possible
12750 for a single SYNCW to fail, but a pair of them will never
12751 fail, so we use two. */
12752 mips_multi_add_insn ("syncw", NULL);
12753 mips_multi_add_insn ("syncw", NULL);
12754 }
12755 else
12756 mips_multi_add_insn ("sync", NULL);
12757 }
12758
12759 /* Output the branch-back label. */
12760 mips_multi_add_label ("1:");
12761
12762 /* OLDVAL = *MEM. */
12763 mips_multi_add_insn (is_64bit_p ? "lld\t%0,%1" : "ll\t%0,%1",
12764 oldval, mem, NULL);
12765
12766 /* if ((OLDVAL & INCLUSIVE_MASK) != REQUIRED_OLDVAL) goto 2. */
12767 if (required_oldval)
12768 {
12769 if (inclusive_mask == 0)
12770 tmp1 = oldval;
12771 else
12772 {
12773 gcc_assert (oldval != at);
12774 mips_multi_add_insn ("and\t%0,%1,%2",
12775 at, oldval, inclusive_mask, NULL);
12776 tmp1 = at;
12777 }
12778 mips_multi_add_insn ("bne\t%0,%z1,2f", tmp1, required_oldval, NULL);
12779
12780 /* CMP = 0 [delay slot]. */
12781 if (cmp)
12782 mips_multi_add_insn ("li\t%0,0", cmp, NULL);
12783 }
12784
12785 /* $TMP1 = OLDVAL & EXCLUSIVE_MASK. */
12786 if (exclusive_mask == 0)
12787 tmp1 = const0_rtx;
12788 else
12789 {
12790 gcc_assert (oldval != at);
12791 mips_multi_add_insn ("and\t%0,%1,%z2",
12792 at, oldval, exclusive_mask, NULL);
12793 tmp1 = at;
12794 }
12795
12796 /* $TMP2 = INSN1 (OLDVAL, INSN1_OP2).
12797
12798 We can skip emitting the move if $TMP1 is nonzero or INSN2 is not
12799 a nop, since we'll still emit at least one instruction in that case. */
12800 if (insn1 == SYNC_INSN1_MOVE
12801 && (tmp1 != const0_rtx || insn2 != SYNC_INSN2_NOP))
12802 tmp2 = insn1_op2;
12803 else
12804 {
12805 mips_multi_add_insn (mips_sync_insn1_template (insn1, is_64bit_p),
12806 newval, oldval, insn1_op2, NULL);
12807 tmp2 = newval;
12808 }
12809
12810 /* $TMP3 = INSN2 ($TMP2, INCLUSIVE_MASK). */
12811 if (insn2 == SYNC_INSN2_NOP)
12812 tmp3 = tmp2;
12813 else
12814 {
12815 mips_multi_add_insn (mips_sync_insn2_template (insn2),
12816 newval, tmp2, inclusive_mask, NULL);
12817 tmp3 = newval;
12818 }
12819 tmp3_insn = mips_multi_last_index ();
12820
12821 /* $AT = $TMP1 | $TMP3. */
12822 if (tmp1 == const0_rtx || tmp3 == const0_rtx)
12823 {
12824 mips_multi_set_operand (tmp3_insn, 0, at);
12825 tmp3 = at;
12826 }
12827 else
12828 {
12829 gcc_assert (tmp1 != tmp3);
12830 mips_multi_add_insn ("or\t%0,%1,%2", at, tmp1, tmp3, NULL);
12831 }
12832
12833 /* if (!commit (*MEM = $AT)) goto 1.
12834
12835 This will sometimes be a delayed branch; see the write code below
12836 for details. */
12837 mips_multi_add_insn (is_64bit_p ? "scd\t%0,%1" : "sc\t%0,%1", at, mem, NULL);
12838 mips_multi_add_insn ("beq%?\t%0,%.,1b", at, NULL);
12839
12840 /* if (INSN1 != MOVE && INSN1 != LI) NEWVAL = $TMP3 [delay slot]. */
12841 if (insn1 != SYNC_INSN1_MOVE && insn1 != SYNC_INSN1_LI && tmp3 != newval)
12842 {
12843 mips_multi_copy_insn (tmp3_insn);
12844 mips_multi_set_operand (mips_multi_last_index (), 0, newval);
12845 }
12846 else if (!(required_oldval && cmp))
12847 mips_multi_add_insn ("nop", NULL);
12848
12849 /* CMP = 1 -- either standalone or in a delay slot. */
12850 if (required_oldval && cmp)
12851 mips_multi_add_insn ("li\t%0,1", cmp, NULL);
12852
12853 /* Output the acquire side of the memory barrier. */
12854 if (TARGET_SYNC_AFTER_SC && need_atomic_barrier_p (model, false))
12855 mips_multi_add_insn ("sync", NULL);
12856
12857 /* Output the exit label, if needed. */
12858 if (required_oldval)
12859 mips_multi_add_label ("2:");
12860
12861 #undef READ_OPERAND
12862 }
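/* As a concrete example, a word-sized compare-and-swap built by this
routine expands to roughly
sync # if a release barrier is needed
1: ll $1,0($a0)
bne $1,$a1,2f
li $v0,0 # CMP = 0 (delay slot)
move $1,$a2
sc $1,0($a0)
beq $1,$0,1b
li $v0,1 # CMP = 1 (delay slot)
sync # if an acquire barrier is needed
2:
Register choices are illustrative only. */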
12863
12864 /* Output and/or return the asm template for sync loop INSN, which has
12865 the operands given by OPERANDS. */
12866
12867 const char *
12868 mips_output_sync_loop (rtx insn, rtx *operands)
12869 {
12870 mips_process_sync_loop (insn, operands);
12871
12872 /* Use branch-likely instructions to work around the LL/SC R10000
12873 errata. */
12874 mips_branch_likely = TARGET_FIX_R10000;
12875
12876 mips_push_asm_switch (&mips_noreorder);
12877 mips_push_asm_switch (&mips_nomacro);
12878 mips_push_asm_switch (&mips_noat);
12879 mips_start_ll_sc_sync_block ();
12880
12881 mips_multi_write ();
12882
12883 mips_end_ll_sc_sync_block ();
12884 mips_pop_asm_switch (&mips_noat);
12885 mips_pop_asm_switch (&mips_nomacro);
12886 mips_pop_asm_switch (&mips_noreorder);
12887
12888 return "";
12889 }
12890
12891 /* Return the number of individual instructions in sync loop INSN,
12892 which has the operands given by OPERANDS. */
12893
12894 unsigned int
12895 mips_sync_loop_insns (rtx insn, rtx *operands)
12896 {
12897 mips_process_sync_loop (insn, operands);
12898 return mips_multi_num_insns;
12899 }
12900 \f
12901 /* Return the assembly code for DIV or DDIV instruction DIVISION, which has
12902 the operands given by OPERANDS. Add in a divide-by-zero check if needed.
12903
12904 When working around R4000 and R4400 errata, we need to make sure that
12905 the division is not immediately followed by a shift[1][2]. We also
12906 need to stop the division from being put into a branch delay slot[3].
12907 The easiest way to avoid both problems is to add a nop after the
12908 division. When a divide-by-zero check is needed, this nop can be
12909 used to fill the branch delay slot.
12910
12911 [1] If a double-word or a variable shift executes immediately
12912 after starting an integer division, the shift may give an
12913 incorrect result. See quotations of errata #16 and #28 from
12914 "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
12915 in mips.md for details.
12916
12917 [2] A similar bug to [1] exists for all revisions of the
12918 R4000 and the R4400 when run in an MC configuration.
12919 From "MIPS R4000MC Errata, Processor Revision 2.2 and 3.0":
12920
12921 "19. In this following sequence:
12922
12923 ddiv (or ddivu or div or divu)
12924 dsll32 (or dsrl32, dsra32)
12925
12926 if an MPT stall occurs, while the divide is slipping the cpu
12927 pipeline, then the following double shift would end up with an
12928 incorrect result.
12929
12930 Workaround: The compiler needs to avoid generating any
12931 sequence with divide followed by extended double shift."
12932
12933 This erratum is also present in "MIPS R4400MC Errata, Processor
12934 Revision 1.0" and "MIPS R4400MC Errata, Processor Revision 2.0
12935 & 3.0" as errata #10 and #4, respectively.
12936
12937 [3] From "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
12938 (also valid for MIPS R4000MC processors):
12939
12940 "52. R4000SC: This bug does not apply for the R4000PC.
12941
12942 There are two flavors of this bug:
12943
12944 1) If the instruction just after divide takes an RF exception
12945 (tlb-refill, tlb-invalid) and gets an instruction cache
12946 miss (both primary and secondary) and the line which is
12947 currently in secondary cache at this index had the first
12948 data word, where the bits 5..2 are set, then R4000 would
12949 get a wrong result for the div.
12950
12951 ##1
12952 nop
12953 div r8, r9
12954 ------------------- # end-of page. -tlb-refill
12955 nop
12956 ##2
12957 nop
12958 div r8, r9
12959 ------------------- # end-of page. -tlb-invalid
12960 nop
12961
12962 2) If the divide is in the taken branch delay slot, where the
12963 target takes RF exception and gets an I-cache miss for the
12964 exception vector or where I-cache miss occurs for the
12965 target address, under the above mentioned scenarios, the
12966 div would get wrong results.
12967
12968 ##1
12969 j r2 # to next page mapped or unmapped
12970 div r8,r9 # this bug would be there as long
12971 # as there is an ICache miss and
12972 nop # the "data pattern" is present
12973
12974 ##2
12975 beq r0, r0, NextPage # to Next page
12976 div r8,r9
12977 nop
12978
12979 This bug is present for div, divu, ddiv, and ddivu
12980 instructions.
12981
12982 Workaround: For item 1), OS could make sure that the next page
12983 after the divide instruction is also mapped. For item 2), the
12984 compiler could make sure that the divide instruction is not in
12985 the branch delay slot."
12986
12987 These processors have PRId values of 0x00004220 and 0x00004300 for
12988 the R4000 and 0x00004400, 0x00004500 and 0x00004600 for the R4400. */
12989
12990 const char *
12991 mips_output_division (const char *division, rtx *operands)
12992 {
12993 const char *s;
12994
12995 s = division;
12996 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
12997 {
12998 output_asm_insn (s, operands);
12999 s = "nop";
13000 }
13001 if (TARGET_CHECK_ZERO_DIV)
13002 {
13003 if (TARGET_MIPS16)
13004 {
13005 output_asm_insn (s, operands);
13006 s = "bnez\t%2,1f\n\tbreak\t7\n1:";
13007 }
13008 else if (GENERATE_DIVIDE_TRAPS)
13009 {
13010 /* Avoid long replay penalty on load miss by putting the trap before
13011 the divide. */
13012 if (TUNE_74K)
13013 output_asm_insn ("teq\t%2,%.,7", operands);
13014 else
13015 {
13016 output_asm_insn (s, operands);
13017 s = "teq\t%2,%.,7";
13018 }
13019 }
13020 else
13021 {
13022 output_asm_insn ("%(bne\t%2,%.,1f", operands);
13023 output_asm_insn (s, operands);
13024 s = "break\t7%)\n1:";
13025 }
13026 }
13027 return s;
13028 }
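/* For example, with divide checks enabled but no divide traps, the
final output for a division with divisor $5 is roughly
bne $5,$0,1f
div $0,$4,$5 # division in the delay slot
break 7
1:
with an extra trailing nop when the R4000/R4400 workarounds are
active; the GENERATE_DIVIDE_TRAPS form instead emits "teq $5,$0,7"
before or after the divide. Registers here are illustrative. */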
13029 \f
13030 /* Return true if destination of IN_INSN is used as add source in
13031 OUT_INSN. Both IN_INSN and OUT_INSN are of type fmadd. Example:
13032 madd.s dst, x, y, z
13033 madd.s a, dst, b, c */
13034
13035 bool
13036 mips_fmadd_bypass (rtx out_insn, rtx in_insn)
13037 {
13038 int dst_reg, src_reg;
13039
13040 gcc_assert (get_attr_type (in_insn) == TYPE_FMADD);
13041 gcc_assert (get_attr_type (out_insn) == TYPE_FMADD);
13042
13043 extract_insn (in_insn);
13044 dst_reg = REG_P (recog_data.operand[0]) ? (int) REGNO (recog_data.operand[0]) : -1;
13045 
13046 extract_insn (out_insn);
13047 src_reg = REG_P (recog_data.operand[1]) ? (int) REGNO (recog_data.operand[1]) : -1;
13048 
13049 if (dst_reg >= 0 && dst_reg == src_reg)
13050 return true;
13051
13052 return false;
13053 }
13054
13055 /* Return true if IN_INSN is a multiply-add or multiply-subtract
13056 instruction and if OUT_INSN assigns to the accumulator operand. */
13057
13058 bool
13059 mips_linked_madd_p (rtx out_insn, rtx in_insn)
13060 {
13061 enum attr_accum_in accum_in;
13062 int accum_in_opnum;
13063 rtx accum_in_op;
13064
13065 if (recog_memoized (in_insn) < 0)
13066 return false;
13067
13068 accum_in = get_attr_accum_in (in_insn);
13069 if (accum_in == ACCUM_IN_NONE)
13070 return false;
13071
13072 accum_in_opnum = accum_in - ACCUM_IN_0;
13073
13074 extract_insn (in_insn);
13075 gcc_assert (accum_in_opnum < recog_data.n_operands);
13076 accum_in_op = recog_data.operand[accum_in_opnum];
13077
13078 return reg_set_p (accum_in_op, out_insn);
13079 }
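/* For example, in
madd $4,$5
madd $6,$7
the second MADD reads the HI/LO accumulator that the first one sets,
so this function returns true and TUNE_MACC_CHAINS (below) can keep
the chain together. The operands are illustrative. */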
13080
13081 /* True if the dependency between OUT_INSN and IN_INSN is on the store
13082 data rather than the address. We need this because the cprestore
13083 pattern is type "store", but is defined using an UNSPEC_VOLATILE,
13084 which causes the default routine to abort. We just return false
13085 for that case. */
13086
13087 bool
13088 mips_store_data_bypass_p (rtx out_insn, rtx in_insn)
13089 {
13090 if (GET_CODE (PATTERN (in_insn)) == UNSPEC_VOLATILE)
13091 return false;
13092
13093 return !store_data_bypass_p (out_insn, in_insn);
13094 }
13095 \f
13096
13097 /* Variables and flags used in scheduler hooks when tuning for
13098 Loongson 2E/2F. */
13099 static struct
13100 {
13101 /* Variables to support Loongson 2E/2F round-robin [F]ALU1/2 dispatch
13102 strategy. */
13103
13104 /* If true, then the next ALU1/2 instruction will go to ALU1. */
13105 bool alu1_turn_p;
13106 
13107 /* If true, then the next FALU1/2 instruction will go to FALU1. */
13108 bool falu1_turn_p;
13109
13110 /* Codes to query if [f]alu{1,2}_core units are subscribed or not. */
13111 int alu1_core_unit_code;
13112 int alu2_core_unit_code;
13113 int falu1_core_unit_code;
13114 int falu2_core_unit_code;
13115
13116 /* True if current cycle has a multi instruction.
13117 This flag is used in mips_ls2_dfa_post_advance_cycle. */
13118 bool cycle_has_multi_p;
13119
13120 /* Instructions to subscribe ls2_[f]alu{1,2}_turn_enabled units.
13121 These are used in mips_ls2_dfa_post_advance_cycle to initialize
13122 DFA state.
13123 E.g., when alu1_turn_enabled_insn is issued, it makes the next
13124 ALU1/2 instruction go to ALU1. */
13125 rtx_insn *alu1_turn_enabled_insn;
13126 rtx_insn *alu2_turn_enabled_insn;
13127 rtx_insn *falu1_turn_enabled_insn;
13128 rtx_insn *falu2_turn_enabled_insn;
13129 } mips_ls2;
13130
13131 /* Implement TARGET_SCHED_ADJUST_COST. We assume that anti and output
13132 dependencies have no cost, except on the 20Kc where output-dependence
13133 is treated like input-dependence. */
13134
13135 static int
13136 mips_adjust_cost (rtx insn ATTRIBUTE_UNUSED, rtx link,
13137 rtx dep ATTRIBUTE_UNUSED, int cost)
13138 {
13139 if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT
13140 && TUNE_20KC)
13141 return cost;
13142 if (REG_NOTE_KIND (link) != 0)
13143 return 0;
13144 return cost;
13145 }
13146
13147 /* Return the number of instructions that can be issued per cycle. */
13148
13149 static int
13150 mips_issue_rate (void)
13151 {
13152 switch (mips_tune)
13153 {
13154 case PROCESSOR_74KC:
13155 case PROCESSOR_74KF2_1:
13156 case PROCESSOR_74KF1_1:
13157 case PROCESSOR_74KF3_2:
13158 /* The 74k is not strictly a quad-issue CPU, but can be seen as one
13159 by the scheduler. It can issue 1 ALU, 1 AGEN and 2 FPU insns,
13160 but in reality only a maximum of 3 insns can be issued as
13161 floating-point loads and stores also require a slot in the
13162 AGEN pipe. */
13163 case PROCESSOR_R10000:
13164 /* All R10K processors are quad-issue (being the first MIPS
13165 processors to support this feature). */
13166 return 4;
13167
13168 case PROCESSOR_20KC:
13169 case PROCESSOR_R4130:
13170 case PROCESSOR_R5400:
13171 case PROCESSOR_R5500:
13172 case PROCESSOR_R5900:
13173 case PROCESSOR_R7000:
13174 case PROCESSOR_R9000:
13175 case PROCESSOR_OCTEON:
13176 case PROCESSOR_OCTEON2:
13177 return 2;
13178
13179 case PROCESSOR_SB1:
13180 case PROCESSOR_SB1A:
13181 /* This is actually 4, but we get better performance if we claim 3.
13182 This is partly because of unwanted speculative code motion with the
13183 larger number, and partly because in most common cases we can't
13184 reach the theoretical max of 4. */
13185 return 3;
13186
13187 case PROCESSOR_LOONGSON_2E:
13188 case PROCESSOR_LOONGSON_2F:
13189 case PROCESSOR_LOONGSON_3A:
13190 case PROCESSOR_P5600:
13191 return 4;
13192
13193 case PROCESSOR_XLP:
13194 return (reload_completed ? 4 : 3);
13195
13196 default:
13197 return 1;
13198 }
13199 }
13200
13201 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook for Loongson2. */
13202
13203 static void
13204 mips_ls2_init_dfa_post_cycle_insn (void)
13205 {
13206 start_sequence ();
13207 emit_insn (gen_ls2_alu1_turn_enabled_insn ());
13208 mips_ls2.alu1_turn_enabled_insn = get_insns ();
13209 end_sequence ();
13210
13211 start_sequence ();
13212 emit_insn (gen_ls2_alu2_turn_enabled_insn ());
13213 mips_ls2.alu2_turn_enabled_insn = get_insns ();
13214 end_sequence ();
13215
13216 start_sequence ();
13217 emit_insn (gen_ls2_falu1_turn_enabled_insn ());
13218 mips_ls2.falu1_turn_enabled_insn = get_insns ();
13219 end_sequence ();
13220
13221 start_sequence ();
13222 emit_insn (gen_ls2_falu2_turn_enabled_insn ());
13223 mips_ls2.falu2_turn_enabled_insn = get_insns ();
13224 end_sequence ();
13225
13226 mips_ls2.alu1_core_unit_code = get_cpu_unit_code ("ls2_alu1_core");
13227 mips_ls2.alu2_core_unit_code = get_cpu_unit_code ("ls2_alu2_core");
13228 mips_ls2.falu1_core_unit_code = get_cpu_unit_code ("ls2_falu1_core");
13229 mips_ls2.falu2_core_unit_code = get_cpu_unit_code ("ls2_falu2_core");
13230 }
13231
13232 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook.
13233 Init data used in mips_dfa_post_advance_cycle. */
13234
13235 static void
13236 mips_init_dfa_post_cycle_insn (void)
13237 {
13238 if (TUNE_LOONGSON_2EF)
13239 mips_ls2_init_dfa_post_cycle_insn ();
13240 }
13241
13242 /* Initialize STATE when scheduling for Loongson 2E/2F.
13243 Support round-robin dispatch scheme by enabling only one of
13244 ALU1/ALU2 and one of FALU1/FALU2 units for ALU1/2 and FALU1/2 instructions
13245 respectively. */
13246
13247 static void
13248 mips_ls2_dfa_post_advance_cycle (state_t state)
13249 {
13250 if (cpu_unit_reservation_p (state, mips_ls2.alu1_core_unit_code))
13251 {
13252 /* Though there are no non-pipelined ALU1 insns,
13253 we can get an instruction of type 'multi' before reload. */
13254 gcc_assert (mips_ls2.cycle_has_multi_p);
13255 mips_ls2.alu1_turn_p = false;
13256 }
13257
13258 mips_ls2.cycle_has_multi_p = false;
13259
13260 if (cpu_unit_reservation_p (state, mips_ls2.alu2_core_unit_code))
13261 /* We have a non-pipelined alu instruction in the core,
13262 adjust round-robin counter. */
13263 mips_ls2.alu1_turn_p = true;
13264
13265 if (mips_ls2.alu1_turn_p)
13266 {
13267 if (state_transition (state, mips_ls2.alu1_turn_enabled_insn) >= 0)
13268 gcc_unreachable ();
13269 }
13270 else
13271 {
13272 if (state_transition (state, mips_ls2.alu2_turn_enabled_insn) >= 0)
13273 gcc_unreachable ();
13274 }
13275
13276 if (cpu_unit_reservation_p (state, mips_ls2.falu1_core_unit_code))
13277 {
13278 /* There are no non-pipelined FALU1 insns. */
13279 gcc_unreachable ();
13280 mips_ls2.falu1_turn_p = false;
13281 }
13282
13283 if (cpu_unit_reservation_p (state, mips_ls2.falu2_core_unit_code))
13284 /* We have a non-pipelined falu instruction in the core,
13285 adjust round-robin counter. */
13286 mips_ls2.falu1_turn_p = true;
13287
13288 if (mips_ls2.falu1_turn_p)
13289 {
13290 if (state_transition (state, mips_ls2.falu1_turn_enabled_insn) >= 0)
13291 gcc_unreachable ();
13292 }
13293 else
13294 {
13295 if (state_transition (state, mips_ls2.falu2_turn_enabled_insn) >= 0)
13296 gcc_unreachable ();
13297 }
13298 }
13299
13300 /* Implement TARGET_SCHED_DFA_POST_ADVANCE_CYCLE.
13301 This hook is being called at the start of each cycle. */
13302
13303 static void
13304 mips_dfa_post_advance_cycle (void)
13305 {
13306 if (TUNE_LOONGSON_2EF)
13307 mips_ls2_dfa_post_advance_cycle (curr_state);
13308 }
13309
13310 /* Implement TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD. This should
13311 be as wide as the scheduling freedom in the DFA. */
13312
13313 static int
13314 mips_multipass_dfa_lookahead (void)
13315 {
13316 /* Can schedule up to 4 of the 6 function units in any one cycle. */
13317 if (TUNE_SB1)
13318 return 4;
13319
13320 if (TUNE_LOONGSON_2EF || TUNE_LOONGSON_3A)
13321 return 4;
13322
13323 if (TUNE_OCTEON)
13324 return 2;
13325
13326 if (TUNE_P5600)
13327 return 4;
13328
13329 return 0;
13330 }
13331 \f
13332 /* Remove the instruction at index LOWER from ready queue READY and
13333 reinsert it in front of the instruction at index HIGHER. LOWER must
13334 be <= HIGHER. */
13335
13336 static void
13337 mips_promote_ready (rtx_insn **ready, int lower, int higher)
13338 {
13339 rtx_insn *new_head;
13340 int i;
13341
13342 new_head = ready[lower];
13343 for (i = lower; i < higher; i++)
13344 ready[i] = ready[i + 1];
13345 ready[i] = new_head;
13346 }
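/* E.g. with READY = {A, B, C, D} and remembering that higher indices
issue first, mips_promote_ready (ready, 1, 3) rotates B up to give
{A, C, D, B}, so B now issues before C and D. */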
13347
13348 /* If the priority of the instruction at POS2 in the ready queue READY
13349 is within LIMIT units of that of the instruction at POS1, swap the
13350 instructions if POS2 is not already less than POS1. */
13351
13352 static void
13353 mips_maybe_swap_ready (rtx_insn **ready, int pos1, int pos2, int limit)
13354 {
13355 if (pos1 < pos2
13356 && INSN_PRIORITY (ready[pos1]) + limit >= INSN_PRIORITY (ready[pos2]))
13357 {
13358 rtx_insn *temp;
13359
13360 temp = ready[pos1];
13361 ready[pos1] = ready[pos2];
13362 ready[pos2] = temp;
13363 }
13364 }
13365 \f
13366 /* Used by TUNE_MACC_CHAINS to record the last scheduled instruction
13367 that may clobber hi or lo. */
13368 static rtx mips_macc_chains_last_hilo;
13369
13370 /* A TUNE_MACC_CHAINS helper function. Record that instruction INSN has
13371 been scheduled, updating mips_macc_chains_last_hilo appropriately. */
13372
13373 static void
13374 mips_macc_chains_record (rtx insn)
13375 {
13376 if (get_attr_may_clobber_hilo (insn))
13377 mips_macc_chains_last_hilo = insn;
13378 }
13379
13380 /* A TUNE_MACC_CHAINS helper function. Search ready queue READY, which
13381 has NREADY elements, looking for a multiply-add or multiply-subtract
13382 instruction that is cumulative with mips_macc_chains_last_hilo.
13383 If there is one, promote it ahead of anything else that might
13384 clobber hi or lo. */
13385
13386 static void
13387 mips_macc_chains_reorder (rtx_insn **ready, int nready)
13388 {
13389 int i, j;
13390
13391 if (mips_macc_chains_last_hilo != 0)
13392 for (i = nready - 1; i >= 0; i--)
13393 if (mips_linked_madd_p (mips_macc_chains_last_hilo, ready[i]))
13394 {
13395 for (j = nready - 1; j > i; j--)
13396 if (recog_memoized (ready[j]) >= 0
13397 && get_attr_may_clobber_hilo (ready[j]))
13398 {
13399 mips_promote_ready (ready, i, j);
13400 break;
13401 }
13402 break;
13403 }
13404 }
13405 \f
13406 /* The last instruction to be scheduled. */
13407 static rtx vr4130_last_insn;
13408
13409 /* A note_stores callback used by vr4130_true_reg_dependence_p. DATA
13410 points to an rtx that is initially an instruction. Nullify the rtx
13411 if the instruction uses the value of register X. */
13412
13413 static void
13414 vr4130_true_reg_dependence_p_1 (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
13415 void *data)
13416 {
13417 rtx *insn_ptr;
13418
13419 insn_ptr = (rtx *) data;
13420 if (REG_P (x)
13421 && *insn_ptr != 0
13422 && reg_referenced_p (x, PATTERN (*insn_ptr)))
13423 *insn_ptr = 0;
13424 }
13425
13426 /* Return true if there is true register dependence between vr4130_last_insn
13427 and INSN. */
13428
13429 static bool
13430 vr4130_true_reg_dependence_p (rtx insn)
13431 {
13432 note_stores (PATTERN (vr4130_last_insn),
13433 vr4130_true_reg_dependence_p_1, &insn);
13434 return insn == 0;
13435 }
13436
13437 /* A TUNE_MIPS4130 helper function. Given that INSN1 is at the head of
13438 the ready queue and that INSN2 is the instruction after it, return
13439 true if it is worth promoting INSN2 ahead of INSN1. Look for cases
13440 in which INSN1 and INSN2 can probably issue in parallel, but for
13441 which (INSN2, INSN1) should be less sensitive to instruction
13442 alignment than (INSN1, INSN2). See 4130.md for more details. */
13443
13444 static bool
13445 vr4130_swap_insns_p (rtx insn1, rtx insn2)
13446 {
13447 sd_iterator_def sd_it;
13448 dep_t dep;
13449
13450 /* Check for the following case:
13451
13452 1) there is some other instruction X with an anti dependence on INSN1;
13453 2) X has a higher priority than INSN2; and
13454 3) X is an arithmetic instruction (and thus has no unit restrictions).
13455
13456 If INSN1 is the last instruction blocking X, it would be better to
13457 choose (INSN1, X) over (INSN2, INSN1). */
13458 FOR_EACH_DEP (insn1, SD_LIST_FORW, sd_it, dep)
13459 if (DEP_TYPE (dep) == REG_DEP_ANTI
13460 && INSN_PRIORITY (DEP_CON (dep)) > INSN_PRIORITY (insn2)
13461 && recog_memoized (DEP_CON (dep)) >= 0
13462 && get_attr_vr4130_class (DEP_CON (dep)) == VR4130_CLASS_ALU)
13463 return false;
13464
13465 if (vr4130_last_insn != 0
13466 && recog_memoized (insn1) >= 0
13467 && recog_memoized (insn2) >= 0)
13468 {
13469 /* See whether INSN1 and INSN2 use different execution units,
13470 or if they are both ALU-type instructions. If so, they can
13471 probably execute in parallel. */
13472 enum attr_vr4130_class class1 = get_attr_vr4130_class (insn1);
13473 enum attr_vr4130_class class2 = get_attr_vr4130_class (insn2);
13474 if (class1 != class2 || class1 == VR4130_CLASS_ALU)
13475 {
13476 /* If only one of the instructions has a dependence on
13477 vr4130_last_insn, prefer to schedule the other one first. */
13478 bool dep1_p = vr4130_true_reg_dependence_p (insn1);
13479 bool dep2_p = vr4130_true_reg_dependence_p (insn2);
13480 if (dep1_p != dep2_p)
13481 return dep1_p;
13482
13483 /* Prefer to schedule INSN2 ahead of INSN1 if vr4130_last_insn
13484 is not an ALU-type instruction and if INSN1 uses the same
13485 execution unit. (Note that if this condition holds, we already
13486 know that INSN2 uses a different execution unit.) */
13487 if (class1 != VR4130_CLASS_ALU
13488 && recog_memoized (vr4130_last_insn) >= 0
13489 && class1 == get_attr_vr4130_class (vr4130_last_insn))
13490 return true;
13491 }
13492 }
13493 return false;
13494 }
13495
13496 /* A TUNE_MIPS4130 helper function. (READY, NREADY) describes a ready
13497 queue with at least two instructions. Swap the first two if
13498 vr4130_swap_insns_p says that it could be worthwhile. */
13499
13500 static void
13501 vr4130_reorder (rtx_insn **ready, int nready)
13502 {
13503 if (vr4130_swap_insns_p (ready[nready - 1], ready[nready - 2]))
13504 mips_promote_ready (ready, nready - 2, nready - 1);
13505 }
13506 \f
13507 /* Record whether last 74k AGEN instruction was a load or store. */
13508 static enum attr_type mips_last_74k_agen_insn = TYPE_UNKNOWN;
13509
13510 /* Initialize mips_last_74k_agen_insn from INSN. A null argument
13511 resets to TYPE_UNKNOWN state. */
13512
13513 static void
13514 mips_74k_agen_init (rtx insn)
13515 {
13516 if (!insn || CALL_P (insn) || JUMP_P (insn))
13517 mips_last_74k_agen_insn = TYPE_UNKNOWN;
13518 else
13519 {
13520 enum attr_type type = get_attr_type (insn);
13521 if (type == TYPE_LOAD || type == TYPE_STORE)
13522 mips_last_74k_agen_insn = type;
13523 }
13524 }
13525
13526 /* A TUNE_74K helper function. The 74K AGEN pipeline likes multiple
13527 loads to be grouped together, and multiple stores to be grouped
13528 together. Swap things around in the ready queue to make this happen. */
13529
13530 static void
13531 mips_74k_agen_reorder (rtx_insn **ready, int nready)
13532 {
13533 int i;
13534 int store_pos, load_pos;
13535
13536 store_pos = -1;
13537 load_pos = -1;
13538
13539 for (i = nready - 1; i >= 0; i--)
13540 {
13541 rtx_insn *insn = ready[i];
13542 if (USEFUL_INSN_P (insn))
13543 switch (get_attr_type (insn))
13544 {
13545 case TYPE_STORE:
13546 if (store_pos == -1)
13547 store_pos = i;
13548 break;
13549
13550 case TYPE_LOAD:
13551 if (load_pos == -1)
13552 load_pos = i;
13553 break;
13554
13555 default:
13556 break;
13557 }
13558 }
13559
13560 if (load_pos == -1 || store_pos == -1)
13561 return;
13562
13563 switch (mips_last_74k_agen_insn)
13564 {
13565 case TYPE_UNKNOWN:
13566 /* Prefer to schedule loads since they have a higher latency. */
13567 case TYPE_LOAD:
13568 /* Swap loads to the front of the queue. */
13569 mips_maybe_swap_ready (ready, load_pos, store_pos, 4);
13570 break;
13571 case TYPE_STORE:
13572 /* Swap stores to the front of the queue. */
13573 mips_maybe_swap_ready (ready, store_pos, load_pos, 4);
13574 break;
13575 default:
13576 break;
13577 }
13578 }
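/* E.g. if the last AGEN instruction was a load and the ready queue
holds a store ahead of a load of similar priority, the code above
swaps the load to the front so that consecutive loads share the
AGEN pipe. */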
13579 \f
13580 /* Implement TARGET_SCHED_INIT. */
13581
13582 static void
13583 mips_sched_init (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13584 int max_ready ATTRIBUTE_UNUSED)
13585 {
13586 mips_macc_chains_last_hilo = 0;
13587 vr4130_last_insn = 0;
13588 mips_74k_agen_init (NULL_RTX);
13589
13590 /* When scheduling for Loongson2, branch instructions go to ALU1,
13591 therefore a basic block is most likely to start with the round-robin
13592 counter pointing to ALU2. */
13593 mips_ls2.alu1_turn_p = false;
13594 mips_ls2.falu1_turn_p = true;
13595 }
13596
13597 /* Subroutine used by TARGET_SCHED_REORDER and TARGET_SCHED_REORDER2. */
13598
13599 static void
13600 mips_sched_reorder_1 (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13601 rtx_insn **ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13602 {
13603 if (!reload_completed
13604 && TUNE_MACC_CHAINS
13605 && *nreadyp > 0)
13606 mips_macc_chains_reorder (ready, *nreadyp);
13607
13608 if (reload_completed
13609 && TUNE_MIPS4130
13610 && !TARGET_VR4130_ALIGN
13611 && *nreadyp > 1)
13612 vr4130_reorder (ready, *nreadyp);
13613
13614 if (TUNE_74K)
13615 mips_74k_agen_reorder (ready, *nreadyp);
13616 }
13617
13618 /* Implement TARGET_SCHED_REORDER. */
13619
13620 static int
13621 mips_sched_reorder (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13622 rtx_insn **ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13623 {
13624 mips_sched_reorder_1 (file, verbose, ready, nreadyp, cycle);
13625 return mips_issue_rate ();
13626 }
13627
13628 /* Implement TARGET_SCHED_REORDER2. */
13629
13630 static int
13631 mips_sched_reorder2 (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13632 rtx_insn **ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13633 {
13634 mips_sched_reorder_1 (file, verbose, ready, nreadyp, cycle);
13635 return cached_can_issue_more;
13636 }
13637
13638 /* Update round-robin counters for ALU1/2 and FALU1/2. */
13639
13640 static void
13641 mips_ls2_variable_issue (rtx insn)
13642 {
13643 if (mips_ls2.alu1_turn_p)
13644 {
13645 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu1_core_unit_code))
13646 mips_ls2.alu1_turn_p = false;
13647 }
13648 else
13649 {
13650 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu2_core_unit_code))
13651 mips_ls2.alu1_turn_p = true;
13652 }
13653
13654 if (mips_ls2.falu1_turn_p)
13655 {
13656 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu1_core_unit_code))
13657 mips_ls2.falu1_turn_p = false;
13658 }
13659 else
13660 {
13661 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu2_core_unit_code))
13662 mips_ls2.falu1_turn_p = true;
13663 }
13664
13665 if (recog_memoized (insn) >= 0)
13666 mips_ls2.cycle_has_multi_p |= (get_attr_type (insn) == TYPE_MULTI);
13667 }
13668
13669 /* Implement TARGET_SCHED_VARIABLE_ISSUE. */
13670
13671 static int
13672 mips_variable_issue (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13673 rtx insn, int more)
13674 {
13675 /* Ignore USEs and CLOBBERs; don't count them against the issue rate. */
13676 if (USEFUL_INSN_P (insn))
13677 {
13678 if (get_attr_type (insn) != TYPE_GHOST)
13679 more--;
13680 if (!reload_completed && TUNE_MACC_CHAINS)
13681 mips_macc_chains_record (insn);
13682 vr4130_last_insn = insn;
13683 if (TUNE_74K)
13684 mips_74k_agen_init (insn);
13685 else if (TUNE_LOONGSON_2EF)
13686 mips_ls2_variable_issue (insn);
13687 }
13688
13689 /* Instructions of type 'multi' should all be split before
13690 the second scheduling pass. */
13691 gcc_assert (!reload_completed
13692 || recog_memoized (insn) < 0
13693 || get_attr_type (insn) != TYPE_MULTI);
13694
13695 cached_can_issue_more = more;
13696 return more;
13697 }
13698 \f
13699 /* Given that we have an rtx of the form (prefetch ... WRITE LOCALITY),
13700 return the first operand of the associated PREF or PREFX insn. */
13701
13702 rtx
13703 mips_prefetch_cookie (rtx write, rtx locality)
13704 {
13705 /* store_streamed / load_streamed. */
13706 if (INTVAL (locality) <= 0)
13707 return GEN_INT (INTVAL (write) + 4);
13708
13709 /* store / load. */
13710 if (INTVAL (locality) <= 2)
13711 return write;
13712
13713 /* store_retained / load_retained. */
13714 return GEN_INT (INTVAL (write) + 6);
13715 }
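/* For example, __builtin_prefetch (p, 1, 0) has WRITE == 1 and
LOCALITY == 0, so the cookie is GEN_INT (1 + 4) == 5, selecting the
store_streamed hint for the PREF instruction. */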
13716 \f
13717 /* Flags that indicate when a built-in function is available.
13718
13719 BUILTIN_AVAIL_NON_MIPS16
13720 The function is available on the current target if !TARGET_MIPS16.
13721
13722 BUILTIN_AVAIL_MIPS16
13723 The function is available on the current target if TARGET_MIPS16. */
13724 #define BUILTIN_AVAIL_NON_MIPS16 1
13725 #define BUILTIN_AVAIL_MIPS16 2
13726
13727 /* Declare an availability predicate for built-in functions that
13728 require non-MIPS16 mode and also require COND to be true.
13729 NAME is the main part of the predicate's name. */
13730 #define AVAIL_NON_MIPS16(NAME, COND) \
13731 static unsigned int \
13732 mips_builtin_avail_##NAME (void) \
13733 { \
13734 return (COND) ? BUILTIN_AVAIL_NON_MIPS16 : 0; \
13735 }
13736
13737 /* Declare an availability predicate for built-in functions that
13738 support both MIPS16 and non-MIPS16 code and also require COND
13739 to be true. NAME is the main part of the predicate's name. */
13740 #define AVAIL_ALL(NAME, COND) \
13741 static unsigned int \
13742 mips_builtin_avail_##NAME (void) \
13743 { \
13744 return (COND) ? BUILTIN_AVAIL_NON_MIPS16 | BUILTIN_AVAIL_MIPS16 : 0; \
13745 }
13746
13747 /* This structure describes a single built-in function. */
13748 struct mips_builtin_description {
13749 /* The code of the main .md file instruction. See mips_builtin_type
13750 for more information. */
13751 enum insn_code icode;
13752
13753 /* The floating-point comparison code to use with ICODE, if any. */
13754 enum mips_fp_condition cond;
13755
13756 /* The name of the built-in function. */
13757 const char *name;
13758
13759 /* Specifies how the function should be expanded. */
13760 enum mips_builtin_type builtin_type;
13761
13762 /* The function's prototype. */
13763 enum mips_function_type function_type;
13764
13765 /* Whether the function is available. */
13766 unsigned int (*avail) (void);
13767 };
13768
13769 AVAIL_ALL (hard_float, TARGET_HARD_FLOAT_ABI)
13770 AVAIL_NON_MIPS16 (paired_single, TARGET_PAIRED_SINGLE_FLOAT)
13771 AVAIL_NON_MIPS16 (sb1_paired_single, TARGET_SB1 && TARGET_PAIRED_SINGLE_FLOAT)
13772 AVAIL_NON_MIPS16 (mips3d, TARGET_MIPS3D)
13773 AVAIL_NON_MIPS16 (dsp, TARGET_DSP)
13774 AVAIL_NON_MIPS16 (dspr2, TARGET_DSPR2)
13775 AVAIL_NON_MIPS16 (dsp_32, !TARGET_64BIT && TARGET_DSP)
13776 AVAIL_NON_MIPS16 (dsp_64, TARGET_64BIT && TARGET_DSP)
13777 AVAIL_NON_MIPS16 (dspr2_32, !TARGET_64BIT && TARGET_DSPR2)
13778 AVAIL_NON_MIPS16 (loongson, TARGET_LOONGSON_VECTORS)
13779 AVAIL_NON_MIPS16 (cache, TARGET_CACHE_BUILTIN)
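/* For instance, AVAIL_NON_MIPS16 (dsp, TARGET_DSP) above expands to
static unsigned int
mips_builtin_avail_dsp (void)
{
return TARGET_DSP ? BUILTIN_AVAIL_NON_MIPS16 : 0;
}
which the builtin-expansion code queries through the AVAIL field of
mips_builtin_description. */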
13780
13781 /* Construct a mips_builtin_description from the given arguments.
13782
13783 INSN is the name of the associated instruction pattern, without the
13784 leading CODE_FOR_mips_.
13785
13786 CODE is the floating-point condition code associated with the
13787 function. It can be 'f' if the field is not applicable.
13788
13789 NAME is the name of the function itself, without the leading
13790 "__builtin_mips_".
13791
13792 BUILTIN_TYPE and FUNCTION_TYPE are mips_builtin_description fields.
13793
13794 AVAIL is the name of the availability predicate, without the leading
13795 mips_builtin_avail_. */
13796 #define MIPS_BUILTIN(INSN, COND, NAME, BUILTIN_TYPE, \
13797 FUNCTION_TYPE, AVAIL) \
13798 { CODE_FOR_mips_ ## INSN, MIPS_FP_COND_ ## COND, \
13799 "__builtin_mips_" NAME, BUILTIN_TYPE, FUNCTION_TYPE, \
13800 mips_builtin_avail_ ## AVAIL }
13801
13802 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT function
13803 mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE and AVAIL
13804 are as for MIPS_BUILTIN. */
13805 #define DIRECT_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
13806 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT, FUNCTION_TYPE, AVAIL)
13807
13808 /* Define __builtin_mips_<INSN>_<COND>_{s,d} functions, both of which
13809 are subject to mips_builtin_avail_<AVAIL>. */
13810 #define CMP_SCALAR_BUILTINS(INSN, COND, AVAIL) \
13811 MIPS_BUILTIN (INSN ## _cond_s, COND, #INSN "_" #COND "_s", \
13812 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_SF_SF, AVAIL), \
13813 MIPS_BUILTIN (INSN ## _cond_d, COND, #INSN "_" #COND "_d", \
13814 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_DF_DF, AVAIL)
13815
13816 /* Define __builtin_mips_{any,all,upper,lower}_<INSN>_<COND>_ps.
13817 The lower and upper forms are subject to mips_builtin_avail_<AVAIL>
13818 while the any and all forms are subject to mips_builtin_avail_mips3d. */
13819 #define CMP_PS_BUILTINS(INSN, COND, AVAIL) \
13820 MIPS_BUILTIN (INSN ## _cond_ps, COND, "any_" #INSN "_" #COND "_ps", \
13821 MIPS_BUILTIN_CMP_ANY, MIPS_INT_FTYPE_V2SF_V2SF, \
13822 mips3d), \
13823 MIPS_BUILTIN (INSN ## _cond_ps, COND, "all_" #INSN "_" #COND "_ps", \
13824 MIPS_BUILTIN_CMP_ALL, MIPS_INT_FTYPE_V2SF_V2SF, \
13825 mips3d), \
13826 MIPS_BUILTIN (INSN ## _cond_ps, COND, "lower_" #INSN "_" #COND "_ps", \
13827 MIPS_BUILTIN_CMP_LOWER, MIPS_INT_FTYPE_V2SF_V2SF, \
13828 AVAIL), \
13829 MIPS_BUILTIN (INSN ## _cond_ps, COND, "upper_" #INSN "_" #COND "_ps", \
13830 MIPS_BUILTIN_CMP_UPPER, MIPS_INT_FTYPE_V2SF_V2SF, \
13831 AVAIL)
13832
13833 /* Define __builtin_mips_{any,all}_<INSN>_<COND>_4s. The functions
13834 are subject to mips_builtin_avail_mips3d. */
13835 #define CMP_4S_BUILTINS(INSN, COND) \
13836 MIPS_BUILTIN (INSN ## _cond_4s, COND, "any_" #INSN "_" #COND "_4s", \
13837 MIPS_BUILTIN_CMP_ANY, \
13838 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d), \
13839 MIPS_BUILTIN (INSN ## _cond_4s, COND, "all_" #INSN "_" #COND "_4s", \
13840 MIPS_BUILTIN_CMP_ALL, \
13841 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d)
13842
13843 /* Define __builtin_mips_mov{t,f}_<INSN>_<COND>_ps. The comparison
13844 instruction requires mips_builtin_avail_<AVAIL>. */
13845 #define MOVTF_BUILTINS(INSN, COND, AVAIL) \
13846 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movt_" #INSN "_" #COND "_ps", \
13847 MIPS_BUILTIN_MOVT, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
13848 AVAIL), \
13849 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movf_" #INSN "_" #COND "_ps", \
13850 MIPS_BUILTIN_MOVF, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
13851 AVAIL)
13852
13853 /* Define all the built-in functions related to C.cond.fmt condition COND. */
13854 #define CMP_BUILTINS(COND) \
13855 MOVTF_BUILTINS (c, COND, paired_single), \
13856 MOVTF_BUILTINS (cabs, COND, mips3d), \
13857 CMP_SCALAR_BUILTINS (cabs, COND, mips3d), \
13858 CMP_PS_BUILTINS (c, COND, paired_single), \
13859 CMP_PS_BUILTINS (cabs, COND, mips3d), \
13860 CMP_4S_BUILTINS (c, COND), \
13861 CMP_4S_BUILTINS (cabs, COND)
13862
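/* Editorial illustration: for COND == eq, CMP_BUILTINS therefore declares,
   among others, __builtin_mips_movt_c_eq_ps, __builtin_mips_movf_c_eq_ps,
   __builtin_mips_cabs_eq_s, __builtin_mips_cabs_eq_d,
   __builtin_mips_any_c_eq_ps, __builtin_mips_all_c_eq_ps,
   __builtin_mips_lower_c_eq_ps, __builtin_mips_upper_c_eq_ps and
   __builtin_mips_any_c_eq_4s.  */
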
13863 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT_NO_TARGET
13864 function mapped to instruction CODE_FOR_mips_<INSN>. FUNCTION_TYPE
13865 and AVAIL are as for MIPS_BUILTIN. */
13866 #define DIRECT_NO_TARGET_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
13867 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT_NO_TARGET, \
13868 FUNCTION_TYPE, AVAIL)
13869
13870 /* Define __builtin_mips_bposge<VALUE>. <VALUE> is 32 for the MIPS32 DSP
13871 branch instruction. AVAIL is as for MIPS_BUILTIN. */
13872 #define BPOSGE_BUILTIN(VALUE, AVAIL) \
13873 MIPS_BUILTIN (bposge, f, "bposge" #VALUE, \
13874 MIPS_BUILTIN_BPOSGE ## VALUE, MIPS_SI_FTYPE_VOID, AVAIL)
13875
13876 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<FN_NAME>
13877 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
13878 builtin_description field. */
13879 #define LOONGSON_BUILTIN_ALIAS(INSN, FN_NAME, FUNCTION_TYPE) \
13880 { CODE_FOR_loongson_ ## INSN, MIPS_FP_COND_f, \
13881 "__builtin_loongson_" #FN_NAME, MIPS_BUILTIN_DIRECT, \
13882 FUNCTION_TYPE, mips_builtin_avail_loongson }
13883
13884 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<INSN>
13885 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
13886 builtin_description field. */
13887 #define LOONGSON_BUILTIN(INSN, FUNCTION_TYPE) \
13888 LOONGSON_BUILTIN_ALIAS (INSN, INSN, FUNCTION_TYPE)
13889
13890 /* Like LOONGSON_BUILTIN, but add _<SUFFIX> to the end of the function name.
13891 We use functions of this form when the same insn can be usefully applied
13892 to more than one datatype. */
13893 #define LOONGSON_BUILTIN_SUFFIX(INSN, SUFFIX, FUNCTION_TYPE) \
13894 LOONGSON_BUILTIN_ALIAS (INSN, INSN ## _ ## SUFFIX, FUNCTION_TYPE)
13895
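/* Editorial illustration: LOONGSON_BUILTIN_SUFFIX (paddw, u, ...) in the
   table further below declares __builtin_loongson_paddw_u while mapping it
   to the single pattern CODE_FOR_loongson_paddw, which the aliases below
   resolve to CODE_FOR_addv2si3.  */
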
13896 #define CODE_FOR_mips_sqrt_ps CODE_FOR_sqrtv2sf2
13897 #define CODE_FOR_mips_addq_ph CODE_FOR_addv2hi3
13898 #define CODE_FOR_mips_addu_qb CODE_FOR_addv4qi3
13899 #define CODE_FOR_mips_subq_ph CODE_FOR_subv2hi3
13900 #define CODE_FOR_mips_subu_qb CODE_FOR_subv4qi3
13901 #define CODE_FOR_mips_mul_ph CODE_FOR_mulv2hi3
13902 #define CODE_FOR_mips_mult CODE_FOR_mulsidi3_32bit
13903 #define CODE_FOR_mips_multu CODE_FOR_umulsidi3_32bit
13904
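/* Editorial note: the aliases above and below let the builtin tables name
   patterns in instruction style while reusing GCC's generic expanders;
   e.g. DIRECT_BUILTIN (addq_ph, ...) resolves to CODE_FOR_addv2hi3, the
   standard V2HI addition pattern.  */
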
13905 #define CODE_FOR_loongson_packsswh CODE_FOR_vec_pack_ssat_v2si
13906 #define CODE_FOR_loongson_packsshb CODE_FOR_vec_pack_ssat_v4hi
13907 #define CODE_FOR_loongson_packushb CODE_FOR_vec_pack_usat_v4hi
13908 #define CODE_FOR_loongson_paddw CODE_FOR_addv2si3
13909 #define CODE_FOR_loongson_paddh CODE_FOR_addv4hi3
13910 #define CODE_FOR_loongson_paddb CODE_FOR_addv8qi3
13911 #define CODE_FOR_loongson_paddsh CODE_FOR_ssaddv4hi3
13912 #define CODE_FOR_loongson_paddsb CODE_FOR_ssaddv8qi3
13913 #define CODE_FOR_loongson_paddush CODE_FOR_usaddv4hi3
13914 #define CODE_FOR_loongson_paddusb CODE_FOR_usaddv8qi3
13915 #define CODE_FOR_loongson_pmaxsh CODE_FOR_smaxv4hi3
13916 #define CODE_FOR_loongson_pmaxub CODE_FOR_umaxv8qi3
13917 #define CODE_FOR_loongson_pminsh CODE_FOR_sminv4hi3
13918 #define CODE_FOR_loongson_pminub CODE_FOR_uminv8qi3
13919 #define CODE_FOR_loongson_pmulhuh CODE_FOR_umulv4hi3_highpart
13920 #define CODE_FOR_loongson_pmulhh CODE_FOR_smulv4hi3_highpart
13921 #define CODE_FOR_loongson_pmullh CODE_FOR_mulv4hi3
13922 #define CODE_FOR_loongson_psllh CODE_FOR_ashlv4hi3
13923 #define CODE_FOR_loongson_psllw CODE_FOR_ashlv2si3
13924 #define CODE_FOR_loongson_psrlh CODE_FOR_lshrv4hi3
13925 #define CODE_FOR_loongson_psrlw CODE_FOR_lshrv2si3
13926 #define CODE_FOR_loongson_psrah CODE_FOR_ashrv4hi3
13927 #define CODE_FOR_loongson_psraw CODE_FOR_ashrv2si3
13928 #define CODE_FOR_loongson_psubw CODE_FOR_subv2si3
13929 #define CODE_FOR_loongson_psubh CODE_FOR_subv4hi3
13930 #define CODE_FOR_loongson_psubb CODE_FOR_subv8qi3
13931 #define CODE_FOR_loongson_psubsh CODE_FOR_sssubv4hi3
13932 #define CODE_FOR_loongson_psubsb CODE_FOR_sssubv8qi3
13933 #define CODE_FOR_loongson_psubush CODE_FOR_ussubv4hi3
13934 #define CODE_FOR_loongson_psubusb CODE_FOR_ussubv8qi3
13935
13936 static const struct mips_builtin_description mips_builtins[] = {
13937 #define MIPS_GET_FCSR 0
13938 DIRECT_BUILTIN (get_fcsr, MIPS_USI_FTYPE_VOID, hard_float),
13939 #define MIPS_SET_FCSR 1
13940 DIRECT_NO_TARGET_BUILTIN (set_fcsr, MIPS_VOID_FTYPE_USI, hard_float),
13941
13942 DIRECT_BUILTIN (pll_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13943 DIRECT_BUILTIN (pul_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13944 DIRECT_BUILTIN (plu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13945 DIRECT_BUILTIN (puu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13946 DIRECT_BUILTIN (cvt_ps_s, MIPS_V2SF_FTYPE_SF_SF, paired_single),
13947 DIRECT_BUILTIN (cvt_s_pl, MIPS_SF_FTYPE_V2SF, paired_single),
13948 DIRECT_BUILTIN (cvt_s_pu, MIPS_SF_FTYPE_V2SF, paired_single),
13949 DIRECT_BUILTIN (abs_ps, MIPS_V2SF_FTYPE_V2SF, paired_single),
13950
13951 DIRECT_BUILTIN (alnv_ps, MIPS_V2SF_FTYPE_V2SF_V2SF_INT, paired_single),
13952 DIRECT_BUILTIN (addr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13953 DIRECT_BUILTIN (mulr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13954 DIRECT_BUILTIN (cvt_pw_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13955 DIRECT_BUILTIN (cvt_ps_pw, MIPS_V2SF_FTYPE_V2SF, mips3d),
13956
13957 DIRECT_BUILTIN (recip1_s, MIPS_SF_FTYPE_SF, mips3d),
13958 DIRECT_BUILTIN (recip1_d, MIPS_DF_FTYPE_DF, mips3d),
13959 DIRECT_BUILTIN (recip1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13960 DIRECT_BUILTIN (recip2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
13961 DIRECT_BUILTIN (recip2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
13962 DIRECT_BUILTIN (recip2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13963
13964 DIRECT_BUILTIN (rsqrt1_s, MIPS_SF_FTYPE_SF, mips3d),
13965 DIRECT_BUILTIN (rsqrt1_d, MIPS_DF_FTYPE_DF, mips3d),
13966 DIRECT_BUILTIN (rsqrt1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13967 DIRECT_BUILTIN (rsqrt2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
13968 DIRECT_BUILTIN (rsqrt2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
13969 DIRECT_BUILTIN (rsqrt2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13970
13971 MIPS_FP_CONDITIONS (CMP_BUILTINS),
13972
13973 /* Built-in functions for the SB-1 processor. */
13974 DIRECT_BUILTIN (sqrt_ps, MIPS_V2SF_FTYPE_V2SF, sb1_paired_single),
13975
13976 /* Built-in functions for the DSP ASE (32-bit and 64-bit). */
13977 DIRECT_BUILTIN (addq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13978 DIRECT_BUILTIN (addq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13979 DIRECT_BUILTIN (addq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
13980 DIRECT_BUILTIN (addu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13981 DIRECT_BUILTIN (addu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13982 DIRECT_BUILTIN (subq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13983 DIRECT_BUILTIN (subq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13984 DIRECT_BUILTIN (subq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
13985 DIRECT_BUILTIN (subu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13986 DIRECT_BUILTIN (subu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13987 DIRECT_BUILTIN (addsc, MIPS_SI_FTYPE_SI_SI, dsp),
13988 DIRECT_BUILTIN (addwc, MIPS_SI_FTYPE_SI_SI, dsp),
13989 DIRECT_BUILTIN (modsub, MIPS_SI_FTYPE_SI_SI, dsp),
13990 DIRECT_BUILTIN (raddu_w_qb, MIPS_SI_FTYPE_V4QI, dsp),
13991 DIRECT_BUILTIN (absq_s_ph, MIPS_V2HI_FTYPE_V2HI, dsp),
13992 DIRECT_BUILTIN (absq_s_w, MIPS_SI_FTYPE_SI, dsp),
13993 DIRECT_BUILTIN (precrq_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
13994 DIRECT_BUILTIN (precrq_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
13995 DIRECT_BUILTIN (precrq_rs_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
13996 DIRECT_BUILTIN (precrqu_s_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
13997 DIRECT_BUILTIN (preceq_w_phl, MIPS_SI_FTYPE_V2HI, dsp),
13998 DIRECT_BUILTIN (preceq_w_phr, MIPS_SI_FTYPE_V2HI, dsp),
13999 DIRECT_BUILTIN (precequ_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
14000 DIRECT_BUILTIN (precequ_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
14001 DIRECT_BUILTIN (precequ_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
14002 DIRECT_BUILTIN (precequ_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
14003 DIRECT_BUILTIN (preceu_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
14004 DIRECT_BUILTIN (preceu_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
14005 DIRECT_BUILTIN (preceu_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
14006 DIRECT_BUILTIN (preceu_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
14007 DIRECT_BUILTIN (shll_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
14008 DIRECT_BUILTIN (shll_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
14009 DIRECT_BUILTIN (shll_s_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
14010 DIRECT_BUILTIN (shll_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
14011 DIRECT_BUILTIN (shrl_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
14012 DIRECT_BUILTIN (shra_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
14013 DIRECT_BUILTIN (shra_r_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
14014 DIRECT_BUILTIN (shra_r_w, MIPS_SI_FTYPE_SI_SI, dsp),
14015 DIRECT_BUILTIN (muleu_s_ph_qbl, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
14016 DIRECT_BUILTIN (muleu_s_ph_qbr, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
14017 DIRECT_BUILTIN (mulq_rs_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
14018 DIRECT_BUILTIN (muleq_s_w_phl, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
14019 DIRECT_BUILTIN (muleq_s_w_phr, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
14020 DIRECT_BUILTIN (bitrev, MIPS_SI_FTYPE_SI, dsp),
14021 DIRECT_BUILTIN (insv, MIPS_SI_FTYPE_SI_SI, dsp),
14022 DIRECT_BUILTIN (repl_qb, MIPS_V4QI_FTYPE_SI, dsp),
14023 DIRECT_BUILTIN (repl_ph, MIPS_V2HI_FTYPE_SI, dsp),
14024 DIRECT_NO_TARGET_BUILTIN (cmpu_eq_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
14025 DIRECT_NO_TARGET_BUILTIN (cmpu_lt_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
14026 DIRECT_NO_TARGET_BUILTIN (cmpu_le_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
14027 DIRECT_BUILTIN (cmpgu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
14028 DIRECT_BUILTIN (cmpgu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
14029 DIRECT_BUILTIN (cmpgu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
14030 DIRECT_NO_TARGET_BUILTIN (cmp_eq_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
14031 DIRECT_NO_TARGET_BUILTIN (cmp_lt_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
14032 DIRECT_NO_TARGET_BUILTIN (cmp_le_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
14033 DIRECT_BUILTIN (pick_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
14034 DIRECT_BUILTIN (pick_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
14035 DIRECT_BUILTIN (packrl_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
14036 DIRECT_NO_TARGET_BUILTIN (wrdsp, MIPS_VOID_FTYPE_SI_SI, dsp),
14037 DIRECT_BUILTIN (rddsp, MIPS_SI_FTYPE_SI, dsp),
14038 DIRECT_BUILTIN (lbux, MIPS_SI_FTYPE_POINTER_SI, dsp),
14039 DIRECT_BUILTIN (lhx, MIPS_SI_FTYPE_POINTER_SI, dsp),
14040 DIRECT_BUILTIN (lwx, MIPS_SI_FTYPE_POINTER_SI, dsp),
14041 BPOSGE_BUILTIN (32, dsp),
14042
14043 /* The following are for the MIPS DSP ASE REV 2 (32-bit and 64-bit). */
14044 DIRECT_BUILTIN (absq_s_qb, MIPS_V4QI_FTYPE_V4QI, dspr2),
14045 DIRECT_BUILTIN (addu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14046 DIRECT_BUILTIN (addu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14047 DIRECT_BUILTIN (adduh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
14048 DIRECT_BUILTIN (adduh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
14049 DIRECT_BUILTIN (append, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
14050 DIRECT_BUILTIN (balign, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
14051 DIRECT_BUILTIN (cmpgdu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
14052 DIRECT_BUILTIN (cmpgdu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
14053 DIRECT_BUILTIN (cmpgdu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
14054 DIRECT_BUILTIN (mul_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14055 DIRECT_BUILTIN (mul_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14056 DIRECT_BUILTIN (mulq_rs_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14057 DIRECT_BUILTIN (mulq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14058 DIRECT_BUILTIN (mulq_s_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14059 DIRECT_BUILTIN (precr_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dspr2),
14060 DIRECT_BUILTIN (precr_sra_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
14061 DIRECT_BUILTIN (precr_sra_r_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
14062 DIRECT_BUILTIN (prepend, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
14063 DIRECT_BUILTIN (shra_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
14064 DIRECT_BUILTIN (shra_r_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
14065 DIRECT_BUILTIN (shrl_ph, MIPS_V2HI_FTYPE_V2HI_SI, dspr2),
14066 DIRECT_BUILTIN (subu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14067 DIRECT_BUILTIN (subu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14068 DIRECT_BUILTIN (subuh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
14069 DIRECT_BUILTIN (subuh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
14070 DIRECT_BUILTIN (addqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14071 DIRECT_BUILTIN (addqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14072 DIRECT_BUILTIN (addqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14073 DIRECT_BUILTIN (addqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14074 DIRECT_BUILTIN (subqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14075 DIRECT_BUILTIN (subqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
14076 DIRECT_BUILTIN (subqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14077 DIRECT_BUILTIN (subqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
14078
14079 /* Built-in functions for the DSP ASE (32-bit only). */
14080 DIRECT_BUILTIN (dpau_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
14081 DIRECT_BUILTIN (dpau_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
14082 DIRECT_BUILTIN (dpsu_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
14083 DIRECT_BUILTIN (dpsu_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
14084 DIRECT_BUILTIN (dpaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14085 DIRECT_BUILTIN (dpsq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14086 DIRECT_BUILTIN (mulsaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14087 DIRECT_BUILTIN (dpaq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
14088 DIRECT_BUILTIN (dpsq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
14089 DIRECT_BUILTIN (maq_s_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14090 DIRECT_BUILTIN (maq_s_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14091 DIRECT_BUILTIN (maq_sa_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14092 DIRECT_BUILTIN (maq_sa_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
14093 DIRECT_BUILTIN (extr_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
14094 DIRECT_BUILTIN (extr_r_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
14095 DIRECT_BUILTIN (extr_rs_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
14096 DIRECT_BUILTIN (extr_s_h, MIPS_SI_FTYPE_DI_SI, dsp_32),
14097 DIRECT_BUILTIN (extp, MIPS_SI_FTYPE_DI_SI, dsp_32),
14098 DIRECT_BUILTIN (extpdp, MIPS_SI_FTYPE_DI_SI, dsp_32),
14099 DIRECT_BUILTIN (shilo, MIPS_DI_FTYPE_DI_SI, dsp_32),
14100 DIRECT_BUILTIN (mthlip, MIPS_DI_FTYPE_DI_SI, dsp_32),
14101 DIRECT_BUILTIN (madd, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
14102 DIRECT_BUILTIN (maddu, MIPS_DI_FTYPE_DI_USI_USI, dsp_32),
14103 DIRECT_BUILTIN (msub, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
14104 DIRECT_BUILTIN (msubu, MIPS_DI_FTYPE_DI_USI_USI, dsp_32),
14105 DIRECT_BUILTIN (mult, MIPS_DI_FTYPE_SI_SI, dsp_32),
14106 DIRECT_BUILTIN (multu, MIPS_DI_FTYPE_USI_USI, dsp_32),
14107
14108 /* Built-in functions for the DSP ASE (64-bit only). */
14109 DIRECT_BUILTIN (ldx, MIPS_DI_FTYPE_POINTER_SI, dsp_64),
14110
14111 /* The following are for the MIPS DSP ASE REV 2 (32-bit only). */
14112 DIRECT_BUILTIN (dpa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14113 DIRECT_BUILTIN (dps_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14114 DIRECT_BUILTIN (mulsa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14115 DIRECT_BUILTIN (dpax_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14116 DIRECT_BUILTIN (dpsx_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14117 DIRECT_BUILTIN (dpaqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14118 DIRECT_BUILTIN (dpaqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14119 DIRECT_BUILTIN (dpsqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14120 DIRECT_BUILTIN (dpsqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
14121
14122 /* Built-in functions for ST Microelectronics Loongson-2E/2F cores. */
14123 LOONGSON_BUILTIN (packsswh, MIPS_V4HI_FTYPE_V2SI_V2SI),
14124 LOONGSON_BUILTIN (packsshb, MIPS_V8QI_FTYPE_V4HI_V4HI),
14125 LOONGSON_BUILTIN (packushb, MIPS_UV8QI_FTYPE_UV4HI_UV4HI),
14126 LOONGSON_BUILTIN_SUFFIX (paddw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14127 LOONGSON_BUILTIN_SUFFIX (paddh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14128 LOONGSON_BUILTIN_SUFFIX (paddb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14129 LOONGSON_BUILTIN_SUFFIX (paddw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14130 LOONGSON_BUILTIN_SUFFIX (paddh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14131 LOONGSON_BUILTIN_SUFFIX (paddb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14132 LOONGSON_BUILTIN_SUFFIX (paddd, u, MIPS_UDI_FTYPE_UDI_UDI),
14133 LOONGSON_BUILTIN_SUFFIX (paddd, s, MIPS_DI_FTYPE_DI_DI),
14134 LOONGSON_BUILTIN (paddsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14135 LOONGSON_BUILTIN (paddsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
14136 LOONGSON_BUILTIN (paddush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14137 LOONGSON_BUILTIN (paddusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14138 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_ud, MIPS_UDI_FTYPE_UDI_UDI),
14139 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_uw, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14140 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_uh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14141 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_ub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14142 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_sd, MIPS_DI_FTYPE_DI_DI),
14143 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_sw, MIPS_V2SI_FTYPE_V2SI_V2SI),
14144 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_sh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14145 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_sb, MIPS_V8QI_FTYPE_V8QI_V8QI),
14146 LOONGSON_BUILTIN (pavgh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14147 LOONGSON_BUILTIN (pavgb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14148 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14149 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14150 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14151 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14152 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14153 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14154 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14155 LOONGSON_BUILTIN_SUFFIX (pcmpgth, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14156 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14157 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14158 LOONGSON_BUILTIN_SUFFIX (pcmpgth, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14159 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14160 LOONGSON_BUILTIN_SUFFIX (pextrh, u, MIPS_UV4HI_FTYPE_UV4HI_USI),
14161 LOONGSON_BUILTIN_SUFFIX (pextrh, s, MIPS_V4HI_FTYPE_V4HI_USI),
14162 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14163 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14164 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14165 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14166 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14167 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14168 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14169 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14170 LOONGSON_BUILTIN (pmaddhw, MIPS_V2SI_FTYPE_V4HI_V4HI),
14171 LOONGSON_BUILTIN (pmaxsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14172 LOONGSON_BUILTIN (pmaxub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14173 LOONGSON_BUILTIN (pminsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14174 LOONGSON_BUILTIN (pminub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14175 LOONGSON_BUILTIN_SUFFIX (pmovmskb, u, MIPS_UV8QI_FTYPE_UV8QI),
14176 LOONGSON_BUILTIN_SUFFIX (pmovmskb, s, MIPS_V8QI_FTYPE_V8QI),
14177 LOONGSON_BUILTIN (pmulhuh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14178 LOONGSON_BUILTIN (pmulhh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14179 LOONGSON_BUILTIN (pmullh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14180 LOONGSON_BUILTIN (pmuluw, MIPS_UDI_FTYPE_UV2SI_UV2SI),
14181 LOONGSON_BUILTIN (pasubub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14182 LOONGSON_BUILTIN (biadd, MIPS_UV4HI_FTYPE_UV8QI),
14183 LOONGSON_BUILTIN (psadbh, MIPS_UV4HI_FTYPE_UV8QI_UV8QI),
14184 LOONGSON_BUILTIN_SUFFIX (pshufh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14185 LOONGSON_BUILTIN_SUFFIX (pshufh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14186 LOONGSON_BUILTIN_SUFFIX (psllh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14187 LOONGSON_BUILTIN_SUFFIX (psllh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14188 LOONGSON_BUILTIN_SUFFIX (psllw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14189 LOONGSON_BUILTIN_SUFFIX (psllw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14190 LOONGSON_BUILTIN_SUFFIX (psrah, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14191 LOONGSON_BUILTIN_SUFFIX (psrah, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14192 LOONGSON_BUILTIN_SUFFIX (psraw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14193 LOONGSON_BUILTIN_SUFFIX (psraw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14194 LOONGSON_BUILTIN_SUFFIX (psrlh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14195 LOONGSON_BUILTIN_SUFFIX (psrlh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14196 LOONGSON_BUILTIN_SUFFIX (psrlw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14197 LOONGSON_BUILTIN_SUFFIX (psrlw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14198 LOONGSON_BUILTIN_SUFFIX (psubw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14199 LOONGSON_BUILTIN_SUFFIX (psubh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14200 LOONGSON_BUILTIN_SUFFIX (psubb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14201 LOONGSON_BUILTIN_SUFFIX (psubw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14202 LOONGSON_BUILTIN_SUFFIX (psubh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14203 LOONGSON_BUILTIN_SUFFIX (psubb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14204 LOONGSON_BUILTIN_SUFFIX (psubd, u, MIPS_UDI_FTYPE_UDI_UDI),
14205 LOONGSON_BUILTIN_SUFFIX (psubd, s, MIPS_DI_FTYPE_DI_DI),
14206 LOONGSON_BUILTIN (psubsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14207 LOONGSON_BUILTIN (psubsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
14208 LOONGSON_BUILTIN (psubush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14209 LOONGSON_BUILTIN (psubusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14210 LOONGSON_BUILTIN_SUFFIX (punpckhbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14211 LOONGSON_BUILTIN_SUFFIX (punpckhhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14212 LOONGSON_BUILTIN_SUFFIX (punpckhwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14213 LOONGSON_BUILTIN_SUFFIX (punpckhbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14214 LOONGSON_BUILTIN_SUFFIX (punpckhhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14215 LOONGSON_BUILTIN_SUFFIX (punpckhwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14216 LOONGSON_BUILTIN_SUFFIX (punpcklbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14217 LOONGSON_BUILTIN_SUFFIX (punpcklhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14218 LOONGSON_BUILTIN_SUFFIX (punpcklwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14219 LOONGSON_BUILTIN_SUFFIX (punpcklbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14220 LOONGSON_BUILTIN_SUFFIX (punpcklhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14221 LOONGSON_BUILTIN_SUFFIX (punpcklwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14222
14223 /* Sundry other built-in functions. */
14224 DIRECT_NO_TARGET_BUILTIN (cache, MIPS_VOID_FTYPE_SI_CVPOINTER, cache)
14225 };
14226
14227 /* mips_builtin_decls[I] is the function declaration for mips_builtins[I],
14228 or null if the function isn't defined on this target. */
14229 static GTY(()) tree mips_builtin_decls[ARRAY_SIZE (mips_builtins)];
14230
14231 /* MODE is a vector mode whose elements have type TYPE. Return the type
14232 of the vector itself. */
14233
14234 static tree
14235 mips_builtin_vector_type (tree type, enum machine_mode mode)
14236 {
14237 static tree types[2 * (int) MAX_MACHINE_MODE];
14238 int mode_index;
14239
14240 mode_index = (int) mode;
14241
14242 if (TREE_CODE (type) == INTEGER_TYPE && TYPE_UNSIGNED (type))
14243 mode_index += MAX_MACHINE_MODE;
14244
14245 if (types[mode_index] == NULL_TREE)
14246 types[mode_index] = build_vector_type_for_mode (type, mode);
14247 return types[mode_index];
14248 }
14249
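/* Editorial illustration: signedness is folded into the cache index above,
   so mips_builtin_vector_type (intHI_type_node, V4HImode) and
   mips_builtin_vector_type (unsigned_intHI_type_node, V4HImode) occupy
   slots V4HImode and V4HImode + MAX_MACHINE_MODE respectively, yielding
   distinct signed and unsigned V4HI vector types.  */
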
14250 /* Return a type for 'const volatile void *'. */
14251
14252 static tree
14253 mips_build_cvpointer_type (void)
14254 {
14255 static tree cache;
14256
14257 if (cache == NULL_TREE)
14258 cache = build_pointer_type (build_qualified_type
14259 (void_type_node,
14260 TYPE_QUAL_CONST | TYPE_QUAL_VOLATILE));
14261 return cache;
14262 }
14263
14264 /* Source-level argument types. */
14265 #define MIPS_ATYPE_VOID void_type_node
14266 #define MIPS_ATYPE_INT integer_type_node
14267 #define MIPS_ATYPE_POINTER ptr_type_node
14268 #define MIPS_ATYPE_CVPOINTER mips_build_cvpointer_type ()
14269
14270 /* Standard mode-based argument types. */
14271 #define MIPS_ATYPE_UQI unsigned_intQI_type_node
14272 #define MIPS_ATYPE_SI intSI_type_node
14273 #define MIPS_ATYPE_USI unsigned_intSI_type_node
14274 #define MIPS_ATYPE_DI intDI_type_node
14275 #define MIPS_ATYPE_UDI unsigned_intDI_type_node
14276 #define MIPS_ATYPE_SF float_type_node
14277 #define MIPS_ATYPE_DF double_type_node
14278
14279 /* Vector argument types. */
14280 #define MIPS_ATYPE_V2SF mips_builtin_vector_type (float_type_node, V2SFmode)
14281 #define MIPS_ATYPE_V2HI mips_builtin_vector_type (intHI_type_node, V2HImode)
14282 #define MIPS_ATYPE_V2SI mips_builtin_vector_type (intSI_type_node, V2SImode)
14283 #define MIPS_ATYPE_V4QI mips_builtin_vector_type (intQI_type_node, V4QImode)
14284 #define MIPS_ATYPE_V4HI mips_builtin_vector_type (intHI_type_node, V4HImode)
14285 #define MIPS_ATYPE_V8QI mips_builtin_vector_type (intQI_type_node, V8QImode)
14286 #define MIPS_ATYPE_UV2SI \
14287 mips_builtin_vector_type (unsigned_intSI_type_node, V2SImode)
14288 #define MIPS_ATYPE_UV4HI \
14289 mips_builtin_vector_type (unsigned_intHI_type_node, V4HImode)
14290 #define MIPS_ATYPE_UV8QI \
14291 mips_builtin_vector_type (unsigned_intQI_type_node, V8QImode)
14292
14293 /* MIPS_FTYPE_ATYPESN takes N MIPS_FTYPES-like type codes and lists
14294 their associated MIPS_ATYPEs. */
14295 #define MIPS_FTYPE_ATYPES1(A, B) \
14296 MIPS_ATYPE_##A, MIPS_ATYPE_##B
14297
14298 #define MIPS_FTYPE_ATYPES2(A, B, C) \
14299 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C
14300
14301 #define MIPS_FTYPE_ATYPES3(A, B, C, D) \
14302 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D
14303
14304 #define MIPS_FTYPE_ATYPES4(A, B, C, D, E) \
14305 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D, \
14306 MIPS_ATYPE_##E
14307
14308 /* Return the function type associated with function prototype TYPE. */
14309
14310 static tree
14311 mips_build_function_type (enum mips_function_type type)
14312 {
14313 static tree types[(int) MIPS_MAX_FTYPE_MAX];
14314
14315 if (types[(int) type] == NULL_TREE)
14316 switch (type)
14317 {
14318 #define DEF_MIPS_FTYPE(NUM, ARGS) \
14319 case MIPS_FTYPE_NAME##NUM ARGS: \
14320 types[(int) type] \
14321 = build_function_type_list (MIPS_FTYPE_ATYPES##NUM ARGS, \
14322 NULL_TREE); \
14323 break;
14324 #include "config/mips/mips-ftypes.def"
14325 #undef DEF_MIPS_FTYPE
14326 default:
14327 gcc_unreachable ();
14328 }
14329
14330 return types[(int) type];
14331 }
14332
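/* Editorial illustration: a mips-ftypes.def entry such as
   DEF_MIPS_FTYPE (2, (SI, SI, SI)) generates the case

     case MIPS_FTYPE_NAME2 (SI, SI, SI):
       types[(int) type]
         = build_function_type_list (MIPS_ATYPE_SI, MIPS_ATYPE_SI,
                                     MIPS_ATYPE_SI, NULL_TREE);
       break;

   i.e. an "SI f (SI, SI)" prototype built from intSI_type_node.  */
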
14333 /* Implement TARGET_INIT_BUILTINS. */
14334
14335 static void
14336 mips_init_builtins (void)
14337 {
14338 const struct mips_builtin_description *d;
14339 unsigned int i;
14340
14341 /* Iterate through all of the entries in mips_builtins, initializing
14342 those built-in functions that are available on this target. */
14343 for (i = 0; i < ARRAY_SIZE (mips_builtins); i++)
14344 {
14345 d = &mips_builtins[i];
14346 if (d->avail ())
14347 mips_builtin_decls[i]
14348 = add_builtin_function (d->name,
14349 mips_build_function_type (d->function_type),
14350 i, BUILT_IN_MD, NULL, NULL);
14351 }
14352 }
14353
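/* Editorial usage sketch (assumes a DSP-enabled target, e.g. -mdsp):
   once registered above, the built-in functions are directly callable
   from C:

     typedef short v2hi __attribute__ ((vector_size (4)));

     v2hi add_sat (v2hi a, v2hi b)
     {
       return __builtin_mips_addq_s_ph (a, b);
     }  */
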
14354 /* Implement TARGET_BUILTIN_DECL. */
14355
14356 static tree
14357 mips_builtin_decl (unsigned int code, bool initialize_p ATTRIBUTE_UNUSED)
14358 {
14359 if (code >= ARRAY_SIZE (mips_builtins))
14360 return error_mark_node;
14361 return mips_builtin_decls[code];
14362 }
14363
14364 /* Take argument ARGNO from EXP's argument list and convert it into
14365 an expand operand. Store the operand in *OP. */
14366
14367 static void
14368 mips_prepare_builtin_arg (struct expand_operand *op, tree exp,
14369 unsigned int argno)
14370 {
14371 tree arg;
14372 rtx value;
14373
14374 arg = CALL_EXPR_ARG (exp, argno);
14375 value = expand_normal (arg);
14376 create_input_operand (op, value, TYPE_MODE (TREE_TYPE (arg)));
14377 }
14378
14379 /* Expand instruction ICODE as part of a built-in function sequence.
14380 Use the first NOPS elements of OPS as the instruction's operands.
14381 HAS_TARGET_P is true if operand 0 is a target; it is false if the
14382 instruction has no target.
14383
14384 Return the target rtx if HAS_TARGET_P, otherwise return const0_rtx. */
14385
14386 static rtx
14387 mips_expand_builtin_insn (enum insn_code icode, unsigned int nops,
14388 struct expand_operand *ops, bool has_target_p)
14389 {
14390 if (!maybe_expand_insn (icode, nops, ops))
14391 {
14392 error ("invalid argument to built-in function");
14393 return has_target_p ? gen_reg_rtx (ops[0].mode) : const0_rtx;
14394 }
14395 return has_target_p ? ops[0].value : const0_rtx;
14396 }
14397
14398 /* Expand a floating-point comparison for built-in function call EXP.
14399 The first NARGS arguments are the values to be compared. ICODE is
14400 the .md pattern that does the comparison and COND is the condition
14401 that is being tested. Return an rtx for the result. */
14402
14403 static rtx
14404 mips_expand_builtin_compare_1 (enum insn_code icode,
14405 enum mips_fp_condition cond,
14406 tree exp, int nargs)
14407 {
14408 struct expand_operand ops[MAX_RECOG_OPERANDS];
14409 rtx output;
14410 int opno, argno;
14411
14412 /* The instruction should have a target operand, an operand for each
14413 argument, and an operand for COND. */
14414 gcc_assert (nargs + 2 == insn_data[(int) icode].n_generator_args);
14415
14416 output = mips_allocate_fcc (insn_data[(int) icode].operand[0].mode);
14417 opno = 0;
14418 create_fixed_operand (&ops[opno++], output);
14419 for (argno = 0; argno < nargs; argno++)
14420 mips_prepare_builtin_arg (&ops[opno++], exp, argno);
14421 create_integer_operand (&ops[opno++], (int) cond);
14422 return mips_expand_builtin_insn (icode, opno, ops, true);
14423 }
14424
14425 /* Expand a MIPS_BUILTIN_DIRECT or MIPS_BUILTIN_DIRECT_NO_TARGET function;
14426 HAS_TARGET_P says which. EXP is the CALL_EXPR that calls the function
14427 and ICODE is the code of the associated .md pattern. TARGET, if nonnull,
14428 suggests a good place to put the result. */
14429
14430 static rtx
14431 mips_expand_builtin_direct (enum insn_code icode, rtx target, tree exp,
14432 bool has_target_p)
14433 {
14434 struct expand_operand ops[MAX_RECOG_OPERANDS];
14435 int opno, argno;
14436
14437 /* Map any target to operand 0. */
14438 opno = 0;
14439 if (has_target_p)
14440 create_output_operand (&ops[opno++], target, TYPE_MODE (TREE_TYPE (exp)));
14441
14442 /* Map the arguments to the other operands. */
14443 gcc_assert (opno + call_expr_nargs (exp)
14444 == insn_data[icode].n_generator_args);
14445 for (argno = 0; argno < call_expr_nargs (exp); argno++)
14446 mips_prepare_builtin_arg (&ops[opno++], exp, argno);
14447
14448 return mips_expand_builtin_insn (icode, opno, ops, has_target_p);
14449 }
14450
14451 /* Expand a __builtin_mips_movt_*_ps or __builtin_mips_movf_*_ps
14452 function; TYPE says which. EXP is the CALL_EXPR that calls the
14453 function, ICODE is the instruction that should be used to compare
14454 the first two arguments, and COND is the condition it should test.
14455 TARGET, if nonnull, suggests a good place to put the result. */
14456
14457 static rtx
14458 mips_expand_builtin_movtf (enum mips_builtin_type type,
14459 enum insn_code icode, enum mips_fp_condition cond,
14460 rtx target, tree exp)
14461 {
14462 struct expand_operand ops[4];
14463 rtx cmp_result;
14464
14465 cmp_result = mips_expand_builtin_compare_1 (icode, cond, exp, 2);
14466 create_output_operand (&ops[0], target, TYPE_MODE (TREE_TYPE (exp)));
14467 if (type == MIPS_BUILTIN_MOVT)
14468 {
14469 mips_prepare_builtin_arg (&ops[2], exp, 2);
14470 mips_prepare_builtin_arg (&ops[1], exp, 3);
14471 }
14472 else
14473 {
14474 mips_prepare_builtin_arg (&ops[1], exp, 2);
14475 mips_prepare_builtin_arg (&ops[2], exp, 3);
14476 }
14477 create_fixed_operand (&ops[3], cmp_result);
14478 return mips_expand_builtin_insn (CODE_FOR_mips_cond_move_tf_ps,
14479 4, ops, true);
14480 }
14481
14482 /* Move VALUE_IF_TRUE into TARGET if CONDITION is true; move VALUE_IF_FALSE
14483 into TARGET otherwise. Return TARGET. */
14484
14485 static rtx
14486 mips_builtin_branch_and_move (rtx condition, rtx target,
14487 rtx value_if_true, rtx value_if_false)
14488 {
14489 rtx_code_label *true_label, *done_label;
14490
14491 true_label = gen_label_rtx ();
14492 done_label = gen_label_rtx ();
14493
14494 /* First assume that CONDITION is false. */
14495 mips_emit_move (target, value_if_false);
14496
14497 /* Branch to TRUE_LABEL if CONDITION is true and DONE_LABEL otherwise. */
14498 emit_jump_insn (gen_condjump (condition, true_label));
14499 emit_jump_insn (gen_jump (done_label));
14500 emit_barrier ();
14501
14502 /* Fix TARGET if CONDITION is true. */
14503 emit_label (true_label);
14504 mips_emit_move (target, value_if_true);
14505
14506 emit_label (done_label);
14507 return target;
14508 }
14509
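/* Editorial sketch of the sequence emitted above, in pseudo-assembly:

        move    target, value_if_false
        bCOND   true_label
        j       done_label
     true_label:
        move    target, value_if_true
     done_label:  */
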
14510 /* Expand a comparison built-in function of type BUILTIN_TYPE. EXP is
14511 the CALL_EXPR that calls the function, ICODE is the code of the
14512 comparison instruction, and COND is the condition it should test.
14513 TARGET, if nonnull, suggests a good place to put the boolean result. */
14514
14515 static rtx
14516 mips_expand_builtin_compare (enum mips_builtin_type builtin_type,
14517 enum insn_code icode, enum mips_fp_condition cond,
14518 rtx target, tree exp)
14519 {
14520 rtx offset, condition, cmp_result;
14521
14522 if (target == 0 || GET_MODE (target) != SImode)
14523 target = gen_reg_rtx (SImode);
14524 cmp_result = mips_expand_builtin_compare_1 (icode, cond, exp,
14525 call_expr_nargs (exp));
14526
14527 /* If the comparison sets more than one register, we define the result
14528 to be 0 if all registers are false and -1 if all registers are true.
14529 The value of the complete result is indeterminate otherwise. */
14530 switch (builtin_type)
14531 {
14532 case MIPS_BUILTIN_CMP_ALL:
14533 condition = gen_rtx_NE (VOIDmode, cmp_result, constm1_rtx);
14534 return mips_builtin_branch_and_move (condition, target,
14535 const0_rtx, const1_rtx);
14536
14537 case MIPS_BUILTIN_CMP_UPPER:
14538 case MIPS_BUILTIN_CMP_LOWER:
14539 offset = GEN_INT (builtin_type == MIPS_BUILTIN_CMP_UPPER);
14540 condition = gen_single_cc (cmp_result, offset);
14541 return mips_builtin_branch_and_move (condition, target,
14542 const1_rtx, const0_rtx);
14543
14544 default:
14545 condition = gen_rtx_NE (VOIDmode, cmp_result, const0_rtx);
14546 return mips_builtin_branch_and_move (condition, target,
14547 const1_rtx, const0_rtx);
14548 }
14549 }
14550
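/* Editorial usage sketch (assumes -mips3d, with v2sf arguments A-D):
   the MIPS_BUILTIN_CMP_ALL case above means that

     int r = __builtin_mips_all_c_eq_4s (a, b, c, d);

   yields 1 only when CMP_RESULT is -1, i.e. when all four element
   comparisons are true.  */
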
14551 /* Expand a bposge built-in function of type BUILTIN_TYPE. TARGET,
14552 if nonnull, suggests a good place to put the boolean result. */
14553
14554 static rtx
14555 mips_expand_builtin_bposge (enum mips_builtin_type builtin_type, rtx target)
14556 {
14557 rtx condition, cmp_result;
14558 int cmp_value;
14559
14560 if (target == 0 || GET_MODE (target) != SImode)
14561 target = gen_reg_rtx (SImode);
14562
14563 cmp_result = gen_rtx_REG (CCDSPmode, CCDSP_PO_REGNUM);
14564
14565 if (builtin_type == MIPS_BUILTIN_BPOSGE32)
14566 cmp_value = 32;
14567 else
14568 gcc_unreachable ();
14569
14570 condition = gen_rtx_GE (VOIDmode, cmp_result, GEN_INT (cmp_value));
14571 return mips_builtin_branch_and_move (condition, target,
14572 const1_rtx, const0_rtx);
14573 }
14574
14575 /* Implement TARGET_EXPAND_BUILTIN. */
14576
14577 static rtx
14578 mips_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED,
14579 enum machine_mode mode, int ignore)
14580 {
14581 tree fndecl;
14582 unsigned int fcode, avail;
14583 const struct mips_builtin_description *d;
14584
14585 fndecl = TREE_OPERAND (CALL_EXPR_FN (exp), 0);
14586 fcode = DECL_FUNCTION_CODE (fndecl);
14587 gcc_assert (fcode < ARRAY_SIZE (mips_builtins));
14588 d = &mips_builtins[fcode];
14589 avail = d->avail ();
14590 gcc_assert (avail != 0);
14591 if (TARGET_MIPS16 && !(avail & BUILTIN_AVAIL_MIPS16))
14592 {
14593 error ("built-in function %qE not supported for MIPS16",
14594 DECL_NAME (fndecl));
14595 return ignore ? const0_rtx : CONST0_RTX (mode);
14596 }
14597 switch (d->builtin_type)
14598 {
14599 case MIPS_BUILTIN_DIRECT:
14600 return mips_expand_builtin_direct (d->icode, target, exp, true);
14601
14602 case MIPS_BUILTIN_DIRECT_NO_TARGET:
14603 return mips_expand_builtin_direct (d->icode, target, exp, false);
14604
14605 case MIPS_BUILTIN_MOVT:
14606 case MIPS_BUILTIN_MOVF:
14607 return mips_expand_builtin_movtf (d->builtin_type, d->icode,
14608 d->cond, target, exp);
14609
14610 case MIPS_BUILTIN_CMP_ANY:
14611 case MIPS_BUILTIN_CMP_ALL:
14612 case MIPS_BUILTIN_CMP_UPPER:
14613 case MIPS_BUILTIN_CMP_LOWER:
14614 case MIPS_BUILTIN_CMP_SINGLE:
14615 return mips_expand_builtin_compare (d->builtin_type, d->icode,
14616 d->cond, target, exp);
14617
14618 case MIPS_BUILTIN_BPOSGE32:
14619 return mips_expand_builtin_bposge (d->builtin_type, target);
14620 }
14621 gcc_unreachable ();
14622 }
14623 \f
14624 /* An entry in the MIPS16 constant pool. VALUE is the pool constant,
14625 MODE is its mode, and LABEL is the CODE_LABEL associated with it. */
14626 struct mips16_constant {
14627 struct mips16_constant *next;
14628 rtx value;
14629 rtx_code_label *label;
14630 enum machine_mode mode;
14631 };
14632
14633 /* Information about an incomplete MIPS16 constant pool. FIRST is the
14634 first constant, HIGHEST_ADDRESS is the highest address that the first
14635 byte of the pool can have, and INSN_ADDRESS is the current instruction
14636 address. */
14637 struct mips16_constant_pool {
14638 struct mips16_constant *first;
14639 int highest_address;
14640 int insn_address;
14641 };
14642
14643 /* Add constant VALUE to POOL and return its label. MODE is the
14644 value's mode (used for CONST_INTs, etc.). */
14645
14646 static rtx_code_label *
14647 mips16_add_constant (struct mips16_constant_pool *pool,
14648 rtx value, enum machine_mode mode)
14649 {
14650 struct mips16_constant **p, *c;
14651 bool first_of_size_p;
14652
14653 /* See whether the constant is already in the pool. If so, return the
14654 existing label, otherwise leave P pointing to the place where the
14655 constant should be added.
14656
14657 Keep the pool sorted in increasing order of mode size so that we can
14658 reduce the number of alignments needed. */
14659 first_of_size_p = true;
14660 for (p = &pool->first; *p != 0; p = &(*p)->next)
14661 {
14662 if (mode == (*p)->mode && rtx_equal_p (value, (*p)->value))
14663 return (*p)->label;
14664 if (GET_MODE_SIZE (mode) < GET_MODE_SIZE ((*p)->mode))
14665 break;
14666 if (GET_MODE_SIZE (mode) == GET_MODE_SIZE ((*p)->mode))
14667 first_of_size_p = false;
14668 }
14669
14670 /* In the worst case, the constant needed by the earliest instruction
14671 will end up at the end of the pool. The entire pool must then be
14672 accessible from that instruction.
14673
14674 When adding the first constant, set the pool's highest address to
14675 the address of the first out-of-range byte. Adjust this address
14676 downwards each time a new constant is added. */
14677 if (pool->first == 0)
14678 /* For LWPC, ADDIUPC and DADDIUPC, the base PC value is the address
14679 of the instruction with the lowest two bits clear. The base PC
14680 value for LDPC has the lowest three bits clear. Assume the worst
14681 case here; namely that the PC-relative instruction occupies the
14682 last 2 bytes in an aligned word. */
14683 pool->highest_address = pool->insn_address - (UNITS_PER_WORD - 2) + 0x8000;
14684 pool->highest_address -= GET_MODE_SIZE (mode);
14685 if (first_of_size_p)
14686 /* Take into account the worst possible padding due to alignment. */
14687 pool->highest_address -= GET_MODE_SIZE (mode) - 1;
14688
14689 /* Create a new entry. */
14690 c = XNEW (struct mips16_constant);
14691 c->value = value;
14692 c->mode = mode;
14693 c->label = gen_label_rtx ();
14694 c->next = *p;
14695 *p = c;
14696
14697 return c->label;
14698 }
14699
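/* Editorial worked example: on a 32-bit target (UNITS_PER_WORD == 4),
   adding the first constant, an 8-byte DFmode value, at INSN_ADDRESS 100
   gives

     highest_address = 100 - (4 - 2) + 0x8000    (= 32866)
     highest_address -= 8                        (the constant itself)
     highest_address -= 8 - 1                    (worst-case padding)

   leaving 32851; each later constant lowers the bound further.  */
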
14700 /* Output constant VALUE after instruction INSN and return the last
14701 instruction emitted. MODE is the mode of the constant. */
14702
14703 static rtx_insn *
14704 mips16_emit_constants_1 (enum machine_mode mode, rtx value, rtx_insn *insn)
14705 {
14706 if (SCALAR_INT_MODE_P (mode) || ALL_SCALAR_FIXED_POINT_MODE_P (mode))
14707 {
14708 rtx size = GEN_INT (GET_MODE_SIZE (mode));
14709 return emit_insn_after (gen_consttable_int (value, size), insn);
14710 }
14711
14712 if (SCALAR_FLOAT_MODE_P (mode))
14713 return emit_insn_after (gen_consttable_float (value), insn);
14714
14715 if (VECTOR_MODE_P (mode))
14716 {
14717 int i;
14718
14719 for (i = 0; i < CONST_VECTOR_NUNITS (value); i++)
14720 insn = mips16_emit_constants_1 (GET_MODE_INNER (mode),
14721 CONST_VECTOR_ELT (value, i), insn);
14722 return insn;
14723 }
14724
14725 gcc_unreachable ();
14726 }
14727
14728 /* Dump out the constants in CONSTANTS after INSN. */
14729
14730 static void
14731 mips16_emit_constants (struct mips16_constant *constants, rtx_insn *insn)
14732 {
14733 struct mips16_constant *c, *next;
14734 int align;
14735
14736 align = 0;
14737 for (c = constants; c != NULL; c = next)
14738 {
14739 /* If necessary, increase the alignment of PC. */
14740 if (align < GET_MODE_SIZE (c->mode))
14741 {
14742 int align_log = floor_log2 (GET_MODE_SIZE (c->mode));
14743 insn = emit_insn_after (gen_align (GEN_INT (align_log)), insn);
14744 }
14745 align = GET_MODE_SIZE (c->mode);
14746
14747 insn = emit_label_after (c->label, insn);
14748 insn = mips16_emit_constants_1 (c->mode, c->value, insn);
14749
14750 next = c->next;
14751 free (c);
14752 }
14753
14754 emit_barrier_after (insn);
14755 }
14756
14757 /* Return the length of instruction INSN. */
14758
14759 static int
14760 mips16_insn_length (rtx_insn *insn)
14761 {
14762 if (JUMP_TABLE_DATA_P (insn))
14763 {
14764 rtx body = PATTERN (insn);
14765 if (GET_CODE (body) == ADDR_VEC)
14766 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 0);
14767 else if (GET_CODE (body) == ADDR_DIFF_VEC)
14768 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 1);
14769 else
14770 gcc_unreachable ();
14771 }
14772 return get_attr_length (insn);
14773 }
14774
14775 /* If *X is a symbolic constant that refers to the constant pool, add
14776 the constant to POOL and rewrite *X to use the constant's label. */
14777
14778 static void
14779 mips16_rewrite_pool_constant (struct mips16_constant_pool *pool, rtx *x)
14780 {
14781 rtx base, offset;
14782 rtx_code_label *label;
14783
14784 split_const (*x, &base, &offset);
14785 if (GET_CODE (base) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (base))
14786 {
14787 label = mips16_add_constant (pool, copy_rtx (get_pool_constant (base)),
14788 get_pool_mode (base));
14789 base = gen_rtx_LABEL_REF (Pmode, label);
14790 *x = mips_unspec_address_offset (base, offset, SYMBOL_PC_RELATIVE);
14791 }
14792 }
14793
14794 /* This structure is used to communicate with mips16_rewrite_pool_refs.
14795 INSN is the instruction we're rewriting and POOL points to the current
14796 constant pool. */
14797 struct mips16_rewrite_pool_refs_info {
14798 rtx_insn *insn;
14799 struct mips16_constant_pool *pool;
14800 };
14801
14802 /* Rewrite *X so that constant pool references refer to the constant's
14803 label instead. DATA points to a mips16_rewrite_pool_refs_info
14804 structure. */
14805
14806 static int
14807 mips16_rewrite_pool_refs (rtx *x, void *data)
14808 {
14809 struct mips16_rewrite_pool_refs_info *info =
14810 (struct mips16_rewrite_pool_refs_info *) data;
14811
14812 if (force_to_mem_operand (*x, Pmode))
14813 {
14814 rtx mem = force_const_mem (GET_MODE (*x), *x);
14815 validate_change (info->insn, x, mem, false);
14816 }
14817
14818 if (MEM_P (*x))
14819 {
14820 mips16_rewrite_pool_constant (info->pool, &XEXP (*x, 0));
14821 return -1;
14822 }
14823
14824 /* Don't rewrite the __mips16_rdwr symbol. */
14825 if (GET_CODE (*x) == UNSPEC && XINT (*x, 1) == UNSPEC_TLS_GET_TP)
14826 return -1;
14827
14828 if (TARGET_MIPS16_TEXT_LOADS)
14829 mips16_rewrite_pool_constant (info->pool, x);
14830
14831 return GET_CODE (*x) == CONST ? -1 : 0;
14832 }
14833
14834 /* Return whether CFG is used in mips_reorg. */
14835
14836 static bool
14837 mips_cfg_in_reorg (void)
14838 {
14839 return (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE
14840 || TARGET_RELAX_PIC_CALLS);
14841 }
14842
14843 /* Build MIPS16 constant pools. Split the instructions if SPLIT_P,
14844 otherwise assume that they are already split. */
14845
14846 static void
14847 mips16_lay_out_constants (bool split_p)
14848 {
14849 struct mips16_constant_pool pool;
14850 struct mips16_rewrite_pool_refs_info info;
14851 rtx_insn *insn, *barrier;
14852
14853 if (!TARGET_MIPS16_PCREL_LOADS)
14854 return;
14855
14856 if (split_p)
14857 {
14858 if (mips_cfg_in_reorg ())
14859 split_all_insns ();
14860 else
14861 split_all_insns_noflow ();
14862 }
14863 barrier = 0;
14864 memset (&pool, 0, sizeof (pool));
14865 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
14866 {
14867 /* Rewrite constant pool references in INSN. */
14868 if (USEFUL_INSN_P (insn))
14869 {
14870 info.insn = insn;
14871 info.pool = &pool;
14872 for_each_rtx (&PATTERN (insn), mips16_rewrite_pool_refs, &info);
14873 }
14874
14875 pool.insn_address += mips16_insn_length (insn);
14876
14877 if (pool.first != NULL)
14878 {
14879 /* If there are no natural barriers between the first user of
14880 the pool and the highest acceptable address, we'll need to
14881 create a new instruction to jump around the constant pool.
14882 In the worst case, this instruction will be 4 bytes long.
14883
14884 If it's too late to do this transformation after INSN,
14885 do it immediately before INSN. */
14886 if (barrier == 0 && pool.insn_address + 4 > pool.highest_address)
14887 {
14888 rtx_code_label *label;
14889 rtx_insn *jump;
14890
14891 label = gen_label_rtx ();
14892
14893 jump = emit_jump_insn_before (gen_jump (label), insn);
14894 JUMP_LABEL (jump) = label;
14895 LABEL_NUSES (label) = 1;
14896 barrier = emit_barrier_after (jump);
14897
14898 emit_label_after (label, barrier);
14899 pool.insn_address += 4;
14900 }
14901
14902 /* See whether the constant pool is now out of range of the first
14903 user. If so, output the constants after the previous barrier.
14904 Note that any instructions between BARRIER and INSN (inclusive)
14905 will use negative offsets to refer to the pool. */
14906 if (pool.insn_address > pool.highest_address)
14907 {
14908 mips16_emit_constants (pool.first, barrier);
14909 pool.first = NULL;
14910 barrier = 0;
14911 }
14912 else if (BARRIER_P (insn))
14913 barrier = insn;
14914 }
14915 }
14916 mips16_emit_constants (pool.first, get_last_insn ());
14917 }
14918 \f
14919 /* Return true if it is worth r10k_simplify_address's while replacing
14920 an address with X. We are looking for constants, and for addresses
14921 at a known offset from the incoming stack pointer. */
14922
14923 static bool
14924 r10k_simplified_address_p (rtx x)
14925 {
14926 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1)))
14927 x = XEXP (x, 0);
14928 return x == virtual_incoming_args_rtx || CONSTANT_P (x);
14929 }
14930
14931 /* X is an expression that appears in INSN. Try to use the UD chains
14932 to simplify it, returning the simplified form on success and the
14933 original form otherwise. Replace the incoming value of $sp with
14934 virtual_incoming_args_rtx (which should never occur in X otherwise). */
14935
14936 static rtx
14937 r10k_simplify_address (rtx x, rtx_insn *insn)
14938 {
14939 rtx newx, op0, op1, set, note;
14940 rtx_insn *def_insn;
14941 df_ref use, def;
14942 struct df_link *defs;
14943
14944 newx = NULL_RTX;
14945 if (UNARY_P (x))
14946 {
14947 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14948 if (op0 != XEXP (x, 0))
14949 newx = simplify_gen_unary (GET_CODE (x), GET_MODE (x),
14950 op0, GET_MODE (XEXP (x, 0)));
14951 }
14952 else if (BINARY_P (x))
14953 {
14954 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14955 op1 = r10k_simplify_address (XEXP (x, 1), insn);
14956 if (op0 != XEXP (x, 0) || op1 != XEXP (x, 1))
14957 newx = simplify_gen_binary (GET_CODE (x), GET_MODE (x), op0, op1);
14958 }
14959 else if (GET_CODE (x) == LO_SUM)
14960 {
14961 /* LO_SUMs can be offset from HIGHs, if we know they won't
14962 overflow. See mips_classify_address for the rationale behind
14963 the lax check. */
14964 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14965 if (GET_CODE (op0) == HIGH)
14966 newx = XEXP (x, 1);
14967 }
14968 else if (REG_P (x))
14969 {
14970 /* Uses are recorded by regno_reg_rtx, not X itself. */
14971 use = df_find_use (insn, regno_reg_rtx[REGNO (x)]);
14972 gcc_assert (use);
14973 defs = DF_REF_CHAIN (use);
14974
14975 /* Require a single definition. */
14976 if (defs && defs->next == NULL)
14977 {
14978 def = defs->ref;
14979 if (DF_REF_IS_ARTIFICIAL (def))
14980 {
14981 /* Replace the incoming value of $sp with
14982 virtual_incoming_args_rtx. */
14983 if (x == stack_pointer_rtx
14984 && DF_REF_BB (def) == ENTRY_BLOCK_PTR_FOR_FN (cfun))
14985 newx = virtual_incoming_args_rtx;
14986 }
14987 else if (dominated_by_p (CDI_DOMINATORS, DF_REF_BB (use),
14988 DF_REF_BB (def)))
14989 {
14990 /* Make sure that DEF_INSN is a single set of REG. */
14991 def_insn = DF_REF_INSN (def);
14992 if (NONJUMP_INSN_P (def_insn))
14993 {
14994 set = single_set (def_insn);
14995 if (set && rtx_equal_p (SET_DEST (set), x))
14996 {
14997 /* Prefer to use notes, since the def-use chains
14998 are often shorter. */
14999 note = find_reg_equal_equiv_note (def_insn);
15000 if (note)
15001 newx = XEXP (note, 0);
15002 else
15003 newx = SET_SRC (set);
15004 newx = r10k_simplify_address (newx, def_insn);
15005 }
15006 }
15007 }
15008 }
15009 }
15010 if (newx && r10k_simplified_address_p (newx))
15011 return newx;
15012 return x;
15013 }
15014
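/* Editorial illustration: if the only definition of $4 that reaches INSN
   is "$4 = $sp + 16" in the entry block, then an address such as $4 + 8
   simplifies to virtual_incoming_args_rtx + 24, which r10k_safe_address_p
   below can test against the frame bounds.  */
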
15015 /* Return true if ADDRESS is known to be an uncached address
15016 on R10K systems. */
15017
15018 static bool
15019 r10k_uncached_address_p (unsigned HOST_WIDE_INT address)
15020 {
15021 unsigned HOST_WIDE_INT upper;
15022
15023 /* Check for KSEG1. */
15024 if (address + 0x60000000 < 0x20000000)
15025 return true;
15026
15027 /* Check for uncached XKPHYS addresses. */
15028 if (Pmode == DImode)
15029 {
15030 upper = (address >> 40) & 0xf9ffff;
15031 if (upper == 0x900000 || upper == 0xb80000)
15032 return true;
15033 }
15034 return false;
15035 }
15036
15037 /* Return true if we can prove that an access to address X in instruction
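/* Editorial note on the KSEG1 check above: a sign-extended 32-bit KSEG1
   address such as 0xffffffffa4000000 becomes 0x04000000 after the
   unsigned addition wraps, which is below 0x20000000 and so classified
   as uncached; a cached KSEG0 address such as 0xffffffff80000000 becomes
   0xffffffffe0000000 and fails the test.  */
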
15038 INSN would be safe from R10K speculation. This X is a general
15039 expression; it might not be a legitimate address. */
15040
15041 static bool
15042 r10k_safe_address_p (rtx x, rtx_insn *insn)
15043 {
15044 rtx base, offset;
15045 HOST_WIDE_INT offset_val;
15046
15047 x = r10k_simplify_address (x, insn);
15048
15049 /* Check for references to the stack frame. It doesn't really matter
15050 how much of the frame has been allocated at INSN; -mr10k-cache-barrier
15051 allows us to assume that accesses to any part of the eventual frame
15052 are safe from speculation at any point in the function. */
15053 mips_split_plus (x, &base, &offset_val);
15054 if (base == virtual_incoming_args_rtx
15055 && offset_val >= -cfun->machine->frame.total_size
15056 && offset_val < cfun->machine->frame.args_size)
15057 return true;
15058
15059 /* Check for uncached addresses. */
15060 if (CONST_INT_P (x))
15061 return r10k_uncached_address_p (INTVAL (x));
15062
15063 /* Check for accesses to a static object. */
15064 split_const (x, &base, &offset);
15065 return offset_within_block_p (base, INTVAL (offset));
15066 }
15067
15068 /* Return true if a MEM with MEM_EXPR EXPR and MEM_OFFSET OFFSET is
15069 an in-range access to an automatic variable, or to an object with
15070 a link-time-constant address. */
15071
15072 static bool
15073 r10k_safe_mem_expr_p (tree expr, unsigned HOST_WIDE_INT offset)
15074 {
15075 HOST_WIDE_INT bitoffset, bitsize;
15076 tree inner, var_offset;
15077 enum machine_mode mode;
15078 int unsigned_p, volatile_p;
15079
15080 inner = get_inner_reference (expr, &bitsize, &bitoffset, &var_offset, &mode,
15081 &unsigned_p, &volatile_p, false);
15082 if (!DECL_P (inner) || !DECL_SIZE_UNIT (inner) || var_offset)
15083 return false;
15084
15085 offset += bitoffset / BITS_PER_UNIT;
15086 return offset < tree_to_uhwi (DECL_SIZE_UNIT (inner));
15087 }
15088
15089 /* A for_each_rtx callback for which DATA points to the instruction
15090 containing *X. Stop the search if we find a MEM that is not safe
15091 from R10K speculation. */
15092
15093 static int
15094 r10k_needs_protection_p_1 (rtx *loc, void *data)
15095 {
15096 rtx mem;
15097
15098 mem = *loc;
15099 if (!MEM_P (mem))
15100 return 0;
15101
15102 if (MEM_EXPR (mem)
15103 && MEM_OFFSET_KNOWN_P (mem)
15104 && r10k_safe_mem_expr_p (MEM_EXPR (mem), MEM_OFFSET (mem)))
15105 return -1;
15106
15107 if (r10k_safe_address_p (XEXP (mem, 0), (rtx_insn *) data))
15108 return -1;
15109
15110 return 1;
15111 }
15112
15113 /* A note_stores callback for which DATA points to an instruction pointer.
15114 If *DATA is nonnull, make it null if X contains a MEM that is not
15115 safe from R10K speculation. */
15116
15117 static void
15118 r10k_needs_protection_p_store (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
15119 void *data)
15120 {
15121 rtx_insn **insn_ptr;
15122
15123 insn_ptr = (rtx_insn **) data;
15124 if (*insn_ptr && for_each_rtx (&x, r10k_needs_protection_p_1, *insn_ptr))
15125 *insn_ptr = NULL;
15126 }
15127
15128 /* A for_each_rtx callback that iterates over the pattern of a CALL_INSN.
15129 Return nonzero if the call is not to a declared function. */
15130
15131 static int
15132 r10k_needs_protection_p_call (rtx *loc, void *data ATTRIBUTE_UNUSED)
15133 {
15134 rtx x;
15135
15136 x = *loc;
15137 if (!MEM_P (x))
15138 return 0;
15139
15140 x = XEXP (x, 0);
15141 if (GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_DECL (x))
15142 return -1;
15143
15144 return 1;
15145 }
15146
15147 /* Return true if instruction INSN needs to be protected by an R10K
15148 cache barrier. */
15149
15150 static bool
15151 r10k_needs_protection_p (rtx_insn *insn)
15152 {
15153 if (CALL_P (insn))
15154 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_call, NULL);
15155
15156 if (mips_r10k_cache_barrier == R10K_CACHE_BARRIER_STORE)
15157 {
15158 note_stores (PATTERN (insn), r10k_needs_protection_p_store, &insn);
15159 return insn == NULL_RTX;
15160 }
15161
15162 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_1, insn);
15163 }
15164
15165 /* Return true if BB is only reached by blocks in PROTECTED_BBS and if every
15166 edge is unconditional. */
15167
15168 static bool
15169 r10k_protected_bb_p (basic_block bb, sbitmap protected_bbs)
15170 {
15171 edge_iterator ei;
15172 edge e;
15173
15174 FOR_EACH_EDGE (e, ei, bb->preds)
15175 if (!single_succ_p (e->src)
15176 || !bitmap_bit_p (protected_bbs, e->src->index)
15177 || (e->flags & EDGE_COMPLEX) != 0)
15178 return false;
15179 return true;
15180 }
15181
15182 /* Implement -mr10k-cache-barrier= for the current function. */
15183
15184 static void
15185 r10k_insert_cache_barriers (void)
15186 {
15187 int *rev_post_order;
15188 unsigned int i, n;
15189 basic_block bb;
15190 sbitmap protected_bbs;
15191 rtx_insn *insn, *end;
15192 rtx unprotected_region;
15193
15194 if (TARGET_MIPS16)
15195 {
15196 sorry ("%qs does not support MIPS16 code", "-mr10k-cache-barrier");
15197 return;
15198 }
15199
15200 /* Calculate dominators. */
15201 calculate_dominance_info (CDI_DOMINATORS);
15202
15203 /* Bit X of PROTECTED_BBS is set if the last operation in basic block
15204 X is protected by a cache barrier. */
15205 protected_bbs = sbitmap_alloc (last_basic_block_for_fn (cfun));
15206 bitmap_clear (protected_bbs);
15207
15208 /* Iterate over the basic blocks in reverse post-order. */
15209 rev_post_order = XNEWVEC (int, last_basic_block_for_fn (cfun));
15210 n = pre_and_rev_post_order_compute (NULL, rev_post_order, false);
15211 for (i = 0; i < n; i++)
15212 {
15213 bb = BASIC_BLOCK_FOR_FN (cfun, rev_post_order[i]);
15214
15215 /* If this block is only reached by unconditional edges, and if the
15216 source of every edge is protected, the beginning of the block is
15217 also protected. */
15218 if (r10k_protected_bb_p (bb, protected_bbs))
15219 unprotected_region = NULL_RTX;
15220 else
15221 unprotected_region = pc_rtx;
15222 end = NEXT_INSN (BB_END (bb));
15223
15224 /* UNPROTECTED_REGION is:
15225
15226 - null if we are processing a protected region,
15227 - pc_rtx if we are processing an unprotected region but have
15228 not yet found the first instruction in it,
15229 - the first instruction in an unprotected region otherwise. */
15230 for (insn = BB_HEAD (bb); insn != end; insn = NEXT_INSN (insn))
15231 {
15232 if (unprotected_region && USEFUL_INSN_P (insn))
15233 {
15234 if (recog_memoized (insn) == CODE_FOR_mips_cache)
15235 /* This CACHE instruction protects the following code. */
15236 unprotected_region = NULL_RTX;
15237 else
15238 {
15239 /* See if INSN is the first instruction in this
15240 unprotected region. */
15241 if (unprotected_region == pc_rtx)
15242 unprotected_region = insn;
15243
15244 /* See if INSN needs to be protected. If so,
15245 we must insert a cache barrier somewhere between
15246 PREV_INSN (UNPROTECTED_REGION) and INSN. It isn't
15247 clear which position is better performance-wise,
15248 but as a tie-breaker, we assume that it is better
15249 to allow delay slots to be back-filled where
15250 possible, and that it is better not to insert
15251 barriers in the middle of already-scheduled code.
15252 We therefore insert the barrier at the beginning
15253 of the region. */
15254 if (r10k_needs_protection_p (insn))
15255 {
15256 emit_insn_before (gen_r10k_cache_barrier (),
15257 unprotected_region);
15258 unprotected_region = NULL_RTX;
15259 }
15260 }
15261 }
15262
15263 if (CALL_P (insn))
15264 /* The called function is not required to protect the exit path.
15265 The code that follows a call is therefore unprotected. */
15266 unprotected_region = pc_rtx;
15267 }
15268
15269 /* Record whether the end of this block is protected. */
15270 if (unprotected_region == NULL_RTX)
15271 bitmap_set_bit (protected_bbs, bb->index);
15272 }
15273 XDELETEVEC (rev_post_order);
15274
15275 sbitmap_free (protected_bbs);
15276
15277 free_dominance_info (CDI_DOMINATORS);
15278 }
15279 \f
15280 /* If INSN is a call, return the underlying CALL expr. Return NULL_RTX
15281 otherwise. If INSN has two call rtx, then store the second one in
15282 SECOND_CALL. */
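/* A sketch of the two-CALL PARALLEL case (operand details are
   illustrative, not taken from a specific pattern):

	(parallel [(set (reg A) (call (mem ...) ...))
		   (set (reg B) (call (mem ...) ...))
		   ...])

   where the two SETs load the two parts (such as the real and
   imaginary halves) of the complex return value.  */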
15283
15284 static rtx
15285 mips_call_expr_from_insn (rtx_insn *insn, rtx *second_call)
15286 {
15287 rtx x;
15288 rtx x2;
15289
15290 if (!CALL_P (insn))
15291 return NULL_RTX;
15292
15293 x = PATTERN (insn);
15294 if (GET_CODE (x) == PARALLEL)
15295 {
15296 /* Calls returning complex values have two CALL rtx. Look for the second
15297 one here, and return it via the SECOND_CALL arg. */
15298 x2 = XVECEXP (x, 0, 1);
15299 if (GET_CODE (x2) == SET)
15300 x2 = XEXP (x2, 1);
15301 if (GET_CODE (x2) == CALL)
15302 *second_call = x2;
15303
15304 x = XVECEXP (x, 0, 0);
15305 }
15306 if (GET_CODE (x) == SET)
15307 x = XEXP (x, 1);
15308 gcc_assert (GET_CODE (x) == CALL);
15309
15310 return x;
15311 }
15312
15313 /* REG is set in DEF. See if the definition is one of the ways we load a
15314 register with a symbol address for a mips_use_pic_fn_addr_reg_p call.
15315 If it is, return the symbol reference of the function, otherwise return
15316 NULL_RTX.
15317
15318 If RECURSE_P is true, use mips_find_pic_call_symbol to interpret
15319 the values of source registers, otherwise treat such registers as
15320 having an unknown value. */
15321
15322 static rtx
15323 mips_pic_call_symbol_from_set (df_ref def, rtx reg, bool recurse_p)
15324 {
15325 rtx_insn *def_insn;
15326 rtx set;
15327
15328 if (DF_REF_IS_ARTIFICIAL (def))
15329 return NULL_RTX;
15330
15331 def_insn = DF_REF_INSN (def);
15332 set = single_set (def_insn);
15333 if (set && rtx_equal_p (SET_DEST (set), reg))
15334 {
15335 rtx note, src, symbol;
15336
15337 /* First see whether the source is a plain symbol. This is used
15338 when calling symbols that are not lazily bound. */
15339 src = SET_SRC (set);
15340 if (GET_CODE (src) == SYMBOL_REF)
15341 return src;
15342
15343 /* Handle %call16 references. */
15344 symbol = mips_strip_unspec_call (src);
15345 if (symbol)
15346 {
15347 gcc_assert (GET_CODE (symbol) == SYMBOL_REF);
15348 return symbol;
15349 }
15350
15351 /* If we have something more complicated, look for a
15352 REG_EQUAL or REG_EQUIV note. */
15353 note = find_reg_equal_equiv_note (def_insn);
15354 if (note && GET_CODE (XEXP (note, 0)) == SYMBOL_REF)
15355 return XEXP (note, 0);
15356
15357 /* Follow at most one simple register copy. Such copies are
15358 interesting in cases like:
15359
15360 for (...)
15361 {
15362 locally_binding_fn (...);
15363 }
15364
15365 and:
15366
15367 locally_binding_fn (...);
15368 ...
15369 locally_binding_fn (...);
15370
15371 where the load of locally_binding_fn can legitimately be
15372 hoisted or shared. However, we do not expect to see complex
15373 chains of copies, so a full worklist solution to the problem
15374 would probably be overkill. */
15375 if (recurse_p && REG_P (src))
15376 return mips_find_pic_call_symbol (def_insn, src, false);
15377 }
15378
15379 return NULL_RTX;
15380 }
15381
15382 /* Find the definition of the use of REG in INSN. See if the definition
15383 is one of the ways we load a register with a symbol address for a
15384 mips_use_pic_fn_addr_reg_p call. If it is return the symbol reference
15385 of the function, otherwise return NULL_RTX. RECURSE_P is as for
15386 mips_pic_call_symbol_from_set. */
15387
15388 static rtx
15389 mips_find_pic_call_symbol (rtx_insn *insn, rtx reg, bool recurse_p)
15390 {
15391 df_ref use;
15392 struct df_link *defs;
15393 rtx symbol;
15394
15395 use = df_find_use (insn, regno_reg_rtx[REGNO (reg)]);
15396 if (!use)
15397 return NULL_RTX;
15398 defs = DF_REF_CHAIN (use);
15399 if (!defs)
15400 return NULL_RTX;
15401 symbol = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p);
15402 if (!symbol)
15403 return NULL_RTX;
15404
15405 /* If we have more than one definition, they need to be identical. */
15406 for (defs = defs->next; defs; defs = defs->next)
15407 {
15408 rtx other;
15409
15410 other = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p);
15411 if (!rtx_equal_p (symbol, other))
15412 return NULL_RTX;
15413 }
15414
15415 return symbol;
15416 }
15417
15418 /* Replace the args_size operand of the call expression CALL with the
15419 call-attribute UNSPEC and fill in SYMBOL as the function symbol. */
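/* For example (operands illustrative, "foo" a stand-in symbol),
   this rewrites

	(call (mem (reg $25)) (const_int 16))

   as

	(call (mem (reg $25))
	      (unspec [(const_int 16) (symbol_ref "foo")]
		      UNSPEC_CALL_ATTR))

   so that the symbol survives until mips_get_pic_call_symbol
   extracts it again.  */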
15420
15421 static void
15422 mips_annotate_pic_call_expr (rtx call, rtx symbol)
15423 {
15424 rtx args_size;
15425
15426 args_size = XEXP (call, 1);
15427 XEXP (call, 1) = gen_rtx_UNSPEC (GET_MODE (args_size),
15428 gen_rtvec (2, args_size, symbol),
15429 UNSPEC_CALL_ATTR);
15430 }
15431
15432 /* OPERANDS[ARGS_SIZE_OPNO] is the args_size operand of a CALL expression.
15433 See whether it contains the call attributes instead of the args_size
15434 argument. If it does, set OPERANDS[ARGS_SIZE_OPNO] to the function
15435 symbol from the call attributes and return true. Return false
15436 otherwise, or if ARGS_SIZE_OPNO is -1. */
15437
15438 bool
15439 mips_get_pic_call_symbol (rtx *operands, int args_size_opno)
15440 {
15441 rtx args_size, symbol;
15442
15443 if (!TARGET_RELAX_PIC_CALLS || args_size_opno == -1)
15444 return false;
15445
15446 args_size = operands[args_size_opno];
15447 if (GET_CODE (args_size) != UNSPEC)
15448 return false;
15449 gcc_assert (XINT (args_size, 1) == UNSPEC_CALL_ATTR);
15450
15451 symbol = XVECEXP (args_size, 0, 1);
15452 gcc_assert (GET_CODE (symbol) == SYMBOL_REF);
15453
15454 operands[args_size_opno] = symbol;
15455 return true;
15456 }
15457
15458 /* Use DF to annotate PIC indirect calls with the function symbol they
15459 dispatch to. */
15460
15461 static void
15462 mips_annotate_pic_calls (void)
15463 {
15464 basic_block bb;
15465 rtx_insn *insn;
15466
15467 FOR_EACH_BB_FN (bb, cfun)
15468 FOR_BB_INSNS (bb, insn)
15469 {
15470 rtx call, reg, symbol, second_call;
15471
15472 second_call = 0;
15473 call = mips_call_expr_from_insn (insn, &second_call);
15474 if (!call)
15475 continue;
15476 gcc_assert (MEM_P (XEXP (call, 0)));
15477 reg = XEXP (XEXP (call, 0), 0);
15478 if (!REG_P (reg))
15479 continue;
15480
15481 symbol = mips_find_pic_call_symbol (insn, reg, true);
15482 if (symbol)
15483 {
15484 mips_annotate_pic_call_expr (call, symbol);
15485 if (second_call)
15486 mips_annotate_pic_call_expr (second_call, symbol);
15487 }
15488 }
15489 }
15490 \f
15491 /* A temporary variable used by for_each_rtx callbacks, etc. */
15492 static rtx_insn *mips_sim_insn;
15493
15494 /* A structure representing the state of the processor pipeline.
15495 Used by the mips_sim_* family of functions. */
15496 struct mips_sim {
15497 /* The maximum number of instructions that can be issued in a cycle.
15498 (Caches mips_issue_rate.) */
15499 unsigned int issue_rate;
15500
15501 /* The current simulation time. */
15502 unsigned int time;
15503
15504 /* How many more instructions can be issued in the current cycle. */
15505 unsigned int insns_left;
15506
15507 /* LAST_SET[X].INSN is the last instruction to set register X.
15508 LAST_SET[X].TIME is the time at which that instruction was issued.
15509 INSN is null if no instruction has yet set register X. */
15510 struct {
15511 rtx_insn *insn;
15512 unsigned int time;
15513 } last_set[FIRST_PSEUDO_REGISTER];
15514
15515 /* The pipeline's current DFA state. */
15516 state_t dfa_state;
15517 };
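/* A typical simulation loop, as used by mips_seq_time below
   (pseudo-code sketch):

     struct mips_sim state;
     mips_sim_init (&state, alloca (state_size ()));
     for each instruction INSN in the sequence:
       mips_sim_wait_insn (&state, INSN);
       mips_sim_issue_insn (&state, INSN);
     ...state.time now gives the cycle count...  */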
15518
15519 /* Reset STATE to the initial simulation state. */
15520
15521 static void
15522 mips_sim_reset (struct mips_sim *state)
15523 {
15524 curr_state = state->dfa_state;
15525
15526 state->time = 0;
15527 state->insns_left = state->issue_rate;
15528 memset (&state->last_set, 0, sizeof (state->last_set));
15529 state_reset (curr_state);
15530
15531 targetm.sched.init (0, false, 0);
15532 advance_state (curr_state);
15533 }
15534
15535 /* Initialize STATE before its first use. DFA_STATE points to an
15536 allocated but uninitialized DFA state. */
15537
15538 static void
15539 mips_sim_init (struct mips_sim *state, state_t dfa_state)
15540 {
15541 if (targetm.sched.init_dfa_pre_cycle_insn)
15542 targetm.sched.init_dfa_pre_cycle_insn ();
15543
15544 if (targetm.sched.init_dfa_post_cycle_insn)
15545 targetm.sched.init_dfa_post_cycle_insn ();
15546
15547 state->issue_rate = mips_issue_rate ();
15548 state->dfa_state = dfa_state;
15549 mips_sim_reset (state);
15550 }
15551
15552 /* Advance STATE by one clock cycle. */
15553
15554 static void
15555 mips_sim_next_cycle (struct mips_sim *state)
15556 {
15557 curr_state = state->dfa_state;
15558
15559 state->time++;
15560 state->insns_left = state->issue_rate;
15561 advance_state (curr_state);
15562 }
15563
15564 /* Advance simulation state STATE until instruction INSN can read
15565 register REG. */
15566
15567 static void
15568 mips_sim_wait_reg (struct mips_sim *state, rtx_insn *insn, rtx reg)
15569 {
15570 unsigned int regno, end_regno;
15571
15572 end_regno = END_REGNO (reg);
15573 for (regno = REGNO (reg); regno < end_regno; regno++)
15574 if (state->last_set[regno].insn != 0)
15575 {
15576 unsigned int t;
15577
15578 t = (state->last_set[regno].time
15579 + insn_latency (state->last_set[regno].insn, insn));
15580 while (state->time < t)
15581 mips_sim_next_cycle (state);
15582 }
15583 }
15584
15585 /* A for_each_rtx callback. If *X is a register, advance simulation state
15586 DATA until mips_sim_insn can read the register's value. */
15587
15588 static int
15589 mips_sim_wait_regs_2 (rtx *x, void *data)
15590 {
15591 if (REG_P (*x))
15592 mips_sim_wait_reg ((struct mips_sim *) data, mips_sim_insn, *x);
15593 return 0;
15594 }
15595
15596 /* Call mips_sim_wait_regs_2 (R, DATA) for each register R mentioned in *X. */
15597
15598 static void
15599 mips_sim_wait_regs_1 (rtx *x, void *data)
15600 {
15601 for_each_rtx (x, mips_sim_wait_regs_2, data);
15602 }
15603
15604 /* Advance simulation state STATE until all of INSN's register
15605 dependencies are satisfied. */
15606
15607 static void
15608 mips_sim_wait_regs (struct mips_sim *state, rtx_insn *insn)
15609 {
15610 mips_sim_insn = insn;
15611 note_uses (&PATTERN (insn), mips_sim_wait_regs_1, state);
15612 }
15613
15614 /* Advance simulation state STATE until the units required by
15615 instruction INSN are available. */
15616
15617 static void
15618 mips_sim_wait_units (struct mips_sim *state, rtx_insn *insn)
15619 {
15620 state_t tmp_state;
15621
15622 tmp_state = alloca (state_size ());
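/* state_transition is specified to return a negative value when the
insn can issue from the given DFA state, so keep advancing cycles
while the trial copy of the state rejects INSN or no issue slots
remain in the current cycle. */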
15623 while (state->insns_left == 0
15624 || (memcpy (tmp_state, state->dfa_state, state_size ()),
15625 state_transition (tmp_state, insn) >= 0))
15626 mips_sim_next_cycle (state);
15627 }
15628
15629 /* Advance simulation state STATE until INSN is ready to issue. */
15630
15631 static void
15632 mips_sim_wait_insn (struct mips_sim *state, rtx_insn *insn)
15633 {
15634 mips_sim_wait_regs (state, insn);
15635 mips_sim_wait_units (state, insn);
15636 }
15637
15638 /* mips_sim_insn has just set X. Update the LAST_SET array
15639 in simulation state DATA. */
15640
15641 static void
15642 mips_sim_record_set (rtx x, const_rtx pat ATTRIBUTE_UNUSED, void *data)
15643 {
15644 struct mips_sim *state;
15645
15646 state = (struct mips_sim *) data;
15647 if (REG_P (x))
15648 {
15649 unsigned int regno, end_regno;
15650
15651 end_regno = END_REGNO (x);
15652 for (regno = REGNO (x); regno < end_regno; regno++)
15653 {
15654 state->last_set[regno].insn = mips_sim_insn;
15655 state->last_set[regno].time = state->time;
15656 }
15657 }
15658 }
15659
15660 /* Issue instruction INSN in scheduler state STATE. Assume that INSN
15661 can issue immediately (i.e., that mips_sim_wait_insn has already
15662 been called). */
15663
15664 static void
15665 mips_sim_issue_insn (struct mips_sim *state, rtx_insn *insn)
15666 {
15667 curr_state = state->dfa_state;
15668
15669 state_transition (curr_state, insn);
15670 state->insns_left = targetm.sched.variable_issue (0, false, insn,
15671 state->insns_left);
15672
15673 mips_sim_insn = insn;
15674 note_stores (PATTERN (insn), mips_sim_record_set, state);
15675 }
15676
15677 /* Simulate issuing a NOP in state STATE. */
15678
15679 static void
15680 mips_sim_issue_nop (struct mips_sim *state)
15681 {
15682 if (state->insns_left == 0)
15683 mips_sim_next_cycle (state);
15684 state->insns_left--;
15685 }
15686
15687 /* Update simulation state STATE so that it's ready to accept the instruction
15688 after INSN. INSN should be part of the main rtl chain, not a member of a
15689 SEQUENCE. */
15690
15691 static void
15692 mips_sim_finish_insn (struct mips_sim *state, rtx_insn *insn)
15693 {
15694 /* If INSN is a jump with an implicit delay slot, simulate a nop. */
15695 if (JUMP_P (insn))
15696 mips_sim_issue_nop (state);
15697
15698 switch (GET_CODE (SEQ_BEGIN (insn)))
15699 {
15700 case CODE_LABEL:
15701 case CALL_INSN:
15702 /* We can't predict the processor state after a call or label. */
15703 mips_sim_reset (state);
15704 break;
15705
15706 case JUMP_INSN:
15707 /* The delay slots of branch likely instructions are only executed
15708 when the branch is taken. Therefore, if the caller has simulated
15709 the delay slot instruction, STATE does not really reflect the state
15710 of the pipeline for the instruction after the delay slot. Also,
15711 branch likely instructions tend to incur a penalty when not taken,
15712 so there will probably be an extra delay between the branch and
15713 the instruction after the delay slot. */
15714 if (INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (insn)))
15715 mips_sim_reset (state);
15716 break;
15717
15718 default:
15719 break;
15720 }
15721 }
15722
15723 /* Use simulator state STATE to calculate the execution time of
15724 instruction sequence SEQ. */
15725
15726 static unsigned int
15727 mips_seq_time (struct mips_sim *state, rtx_insn *seq)
15728 {
15729 mips_sim_reset (state);
15730 for (rtx_insn *insn = seq; insn; insn = NEXT_INSN (insn))
15731 {
15732 mips_sim_wait_insn (state, insn);
15733 mips_sim_issue_insn (state, insn);
15734 }
15735 return state->time;
15736 }
15737 \f
15738 /* Return the execution-time cost of mips_tuning_info.fast_mult_zero_zero_p
15739 setting SETTING, using STATE to simulate instruction sequences. */
15740
15741 static unsigned int
15742 mips_mult_zero_zero_cost (struct mips_sim *state, bool setting)
15743 {
15744 mips_tuning_info.fast_mult_zero_zero_p = setting;
15745 start_sequence ();
15746
15747 enum machine_mode dword_mode = TARGET_64BIT ? TImode : DImode;
15748 rtx hilo = gen_rtx_REG (dword_mode, MD_REG_FIRST);
15749 mips_emit_move_or_split (hilo, const0_rtx, SPLIT_FOR_SPEED);
15750
15751 /* If the target provides maddsidi4 then a multiply-add is the most
15752 likely consumer of the result. Test for bypasses. */
15753 if (dword_mode == DImode && HAVE_maddsidi4)
15754 {
15755 rtx gpr = gen_rtx_REG (SImode, GP_REG_FIRST + 4);
15756 emit_insn (gen_maddsidi4 (hilo, gpr, gpr, hilo));
15757 }
15758
15759 unsigned int time = mips_seq_time (state, get_insns ());
15760 end_sequence ();
15761 return time;
15762 }
15763
15764 /* Check the relative speeds of "MULT $0,$0" and "MTLO $0; MTHI $0"
15765 and set up mips_tuning_info.fast_mult_zero_zero_p accordingly.
15766 Prefer MULT -- which is shorter -- in the event of a tie. */
15767
15768 static void
15769 mips_set_fast_mult_zero_zero_p (struct mips_sim *state)
15770 {
15771 if (TARGET_MIPS16)
15772 /* No MTLO or MTHI available. */
15773 mips_tuning_info.fast_mult_zero_zero_p = true;
15774 else
15775 {
15776 unsigned int true_time = mips_mult_zero_zero_cost (state, true);
15777 unsigned int false_time = mips_mult_zero_zero_cost (state, false);
15778 mips_tuning_info.fast_mult_zero_zero_p = (true_time <= false_time);
15779 }
15780 }
15781
15782 /* Set up costs based on the current architecture and tuning settings. */
15783
15784 static void
15785 mips_set_tuning_info (void)
15786 {
15787 if (mips_tuning_info.initialized_p
15788 && mips_tuning_info.arch == mips_arch
15789 && mips_tuning_info.tune == mips_tune
15790 && mips_tuning_info.mips16_p == TARGET_MIPS16)
15791 return;
15792
15793 mips_tuning_info.arch = mips_arch;
15794 mips_tuning_info.tune = mips_tune;
15795 mips_tuning_info.mips16_p = TARGET_MIPS16;
15796 mips_tuning_info.initialized_p = true;
15797
15798 dfa_start ();
15799
15800 struct mips_sim state;
15801 mips_sim_init (&state, alloca (state_size ()));
15802
15803 mips_set_fast_mult_zero_zero_p (&state);
15804
15805 dfa_finish ();
15806 }
15807
15808 /* Implement TARGET_EXPAND_TO_RTL_HOOK. */
15809
15810 static void
15811 mips_expand_to_rtl_hook (void)
15812 {
15813 /* We need to call this at a point where we can safely create sequences
15814 of instructions, so TARGET_OVERRIDE_OPTIONS is too early. We also
15815 need to call it at a point where the DFA infrastructure is not
15816 already in use, so we can't just call it lazily on demand.
15817
15818 At present, mips_tuning_info is only needed during post-expand
15819 RTL passes such as split_insns, so this hook should be early enough.
15820 We may need to move the call elsewhere if mips_tuning_info starts
15821 to be used for other things (such as rtx_costs, or expanders that
15822 could be called during gimple optimization). */
15823 mips_set_tuning_info ();
15824 }
15825 \f
15826 /* The VR4130 pipeline issues aligned pairs of instructions together,
15827 but it stalls the second instruction if it depends on the first.
15828 In order to cut down the amount of logic required, this dependence
15829 check is not based on a full instruction decode. Instead, any non-SPECIAL
15830 instruction is assumed to modify the register specified by bits 20-16
15831 (which is usually the "rt" field).
15832
15833 In BEQ, BEQL, BNE and BNEL instructions, the rt field is actually an
15834 input, so we can end up with a false dependence between the branch
15835 and its delay slot. If this situation occurs in instruction INSN,
15836 try to avoid it by swapping rs and rt. */
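/* For example (registers illustrative), in the pair

	beq	$4,$5,foo
	move	$2,$5

   the pipeline's dependence check assumes the BEQ writes $5 (its rt
   field), so the delay-slot instruction appears to depend on the
   branch and the pair would stall.  Swapping the operands to give
   "beq $5,$4,foo" moves $5 into the rs field and removes the false
   dependence.  */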
15837
15838 static void
15839 vr4130_avoid_branch_rt_conflict (rtx_insn *insn)
15840 {
15841 rtx_insn *first, *second;
15842
15843 first = SEQ_BEGIN (insn);
15844 second = SEQ_END (insn);
15845 if (JUMP_P (first)
15846 && NONJUMP_INSN_P (second)
15847 && GET_CODE (PATTERN (first)) == SET
15848 && GET_CODE (SET_DEST (PATTERN (first))) == PC
15849 && GET_CODE (SET_SRC (PATTERN (first))) == IF_THEN_ELSE)
15850 {
15851 /* Check for the right kind of condition. */
15852 rtx cond = XEXP (SET_SRC (PATTERN (first)), 0);
15853 if ((GET_CODE (cond) == EQ || GET_CODE (cond) == NE)
15854 && REG_P (XEXP (cond, 0))
15855 && REG_P (XEXP (cond, 1))
15856 && reg_referenced_p (XEXP (cond, 1), PATTERN (second))
15857 && !reg_referenced_p (XEXP (cond, 0), PATTERN (second)))
15858 {
15859 /* SECOND mentions the rt register but not the rs register. */
15860 rtx tmp = XEXP (cond, 0);
15861 XEXP (cond, 0) = XEXP (cond, 1);
15862 XEXP (cond, 1) = tmp;
15863 }
15864 }
15865 }
15866
15867 /* Implement -mvr4130-align. Go through each basic block and simulate the
15868 processor pipeline. If we find that a pair of instructions could execute
15869 in parallel, and the first of those instructions is not 8-byte aligned,
15870 insert a nop to make it aligned. */
15871
15872 static void
15873 vr4130_align_insns (void)
15874 {
15875 struct mips_sim state;
15876 rtx_insn *insn, *subinsn, *last, *last2, *next;
15877 bool aligned_p;
15878
15879 dfa_start ();
15880
15881 /* LAST is the last instruction before INSN to have a nonzero length.
15882 LAST2 is the last such instruction before LAST. */
15883 last = 0;
15884 last2 = 0;
15885
15886 /* ALIGNED_P is true if INSN is known to be at an aligned address. */
15887 aligned_p = true;
15888
15889 mips_sim_init (&state, alloca (state_size ()));
15890 for (insn = get_insns (); insn != 0; insn = next)
15891 {
15892 unsigned int length;
15893
15894 next = NEXT_INSN (insn);
15895
15896 /* See the comment above vr4130_avoid_branch_rt_conflict for details.
15897 This isn't really related to the alignment pass, but we do it on
15898 the fly to avoid a separate instruction walk. */
15899 vr4130_avoid_branch_rt_conflict (insn);
15900
15901 length = get_attr_length (insn);
15902 if (length > 0 && USEFUL_INSN_P (insn))
15903 FOR_EACH_SUBINSN (subinsn, insn)
15904 {
15905 mips_sim_wait_insn (&state, subinsn);
15906
15907 /* If we want this instruction to issue in parallel with the
15908 previous one, make sure that the previous instruction is
15909 aligned. There are several reasons why this isn't worthwhile
15910 when the second instruction is a call:
15911
15912 - Calls are less likely to be performance critical,
15913 - There's a good chance that the delay slot can execute
15914 in parallel with the call, and
15915 - The return address would then be unaligned.
15916
15917 In general, if we're going to insert a nop between instructions
15918 X and Y, it's better to insert it immediately after X. That
15919 way, if the nop makes Y aligned, it will also align any labels
15920 between X and Y. */
15921 if (state.insns_left != state.issue_rate
15922 && !CALL_P (subinsn))
15923 {
15924 if (subinsn == SEQ_BEGIN (insn) && aligned_p)
15925 {
15926 /* SUBINSN is the first instruction in INSN and INSN is
15927 aligned. We want to align the previous instruction
15928 instead, so insert a nop between LAST2 and LAST.
15929
15930 Note that LAST could be either a single instruction
15931 or a branch with a delay slot. In the latter case,
15932 LAST, like INSN, is already aligned, but the delay
15933 slot must have some extra delay that stops it from
15934 issuing at the same time as the branch. We therefore
15935 insert a nop before the branch in order to align its
15936 delay slot. */
15937 gcc_assert (last2);
15938 emit_insn_after (gen_nop (), last2);
15939 aligned_p = false;
15940 }
15941 else if (subinsn != SEQ_BEGIN (insn) && !aligned_p)
15942 {
15943 /* SUBINSN is the delay slot of INSN, but INSN is
15944 currently unaligned. Insert a nop between
15945 LAST and INSN to align it. */
15946 gcc_assert (last);
15947 emit_insn_after (gen_nop (), last);
15948 aligned_p = true;
15949 }
15950 }
15951 mips_sim_issue_insn (&state, subinsn);
15952 }
15953 mips_sim_finish_insn (&state, insn);
15954
15955 /* Update LAST, LAST2 and ALIGNED_P for the next instruction. */
15956 length = get_attr_length (insn);
15957 if (length > 0)
15958 {
15959 /* If the instruction is an asm statement or multi-instruction
15960 mips.md pattern, the length is only an estimate. Insert an
15961 8-byte alignment after it so that the following instructions
15962 can be handled correctly. */
15963 if (NONJUMP_INSN_P (SEQ_BEGIN (insn))
15964 && (recog_memoized (insn) < 0 || length >= 8))
15965 {
15966 next = emit_insn_after (gen_align (GEN_INT (3)), insn);
15967 next = NEXT_INSN (next);
15968 mips_sim_next_cycle (&state);
15969 aligned_p = true;
15970 }
15971 else if (length & 4)
15972 aligned_p = !aligned_p;
15973 last2 = last;
15974 last = insn;
15975 }
15976
15977 /* See whether INSN is an aligned label. */
15978 if (LABEL_P (insn) && label_to_alignment (insn) >= 3)
15979 aligned_p = true;
15980 }
15981 dfa_finish ();
15982 }
15983 \f
15984 /* This structure records that the current function has a LO_SUM
15985 involving SYMBOL_REF or LABEL_REF BASE and that OFFSET is
15986 the largest offset applied to BASE by all such LO_SUMs. */
15987 struct mips_lo_sum_offset {
15988 rtx base;
15989 HOST_WIDE_INT offset;
15990 };
15991
15992 /* Return a hash value for SYMBOL_REF or LABEL_REF BASE. */
15993
15994 static hashval_t
15995 mips_hash_base (rtx base)
15996 {
15997 int do_not_record_p;
15998
15999 return hash_rtx (base, GET_MODE (base), &do_not_record_p, NULL, false);
16000 }
16001
16002 /* Hashtable helpers. */
16003
16004 struct mips_lo_sum_offset_hasher : typed_free_remove <mips_lo_sum_offset>
16005 {
16006 typedef mips_lo_sum_offset value_type;
16007 typedef rtx_def compare_type;
16008 static inline hashval_t hash (const value_type *);
16009 static inline bool equal (const value_type *, const compare_type *);
16010 };
16011
16012 /* Hash-table callbacks for mips_lo_sum_offsets. */
16013
16014 inline hashval_t
16015 mips_lo_sum_offset_hasher::hash (const value_type *entry)
16016 {
16017 return mips_hash_base (entry->base);
16018 }
16019
16020 inline bool
16021 mips_lo_sum_offset_hasher::equal (const value_type *entry,
16022 const compare_type *value)
16023 {
16024 return rtx_equal_p (entry->base, value);
16025 }
16026
16027 typedef hash_table<mips_lo_sum_offset_hasher> mips_offset_table;
16028
16029 /* Look up symbolic constant X in HTAB, which is a hash table of
16030 mips_lo_sum_offsets. If OPTION is NO_INSERT, return true if X can be
16031 paired with a recorded LO_SUM; if OPTION is INSERT, record X and return true. */
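/* For example, if LO_SUMs for sym and sym+8 have been recorded, a
   NO_INSERT lookup of sym+4 succeeds (4 <= 8) while a lookup of
   sym+12 fails.  */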
16032
16033 static bool
16034 mips_lo_sum_offset_lookup (mips_offset_table *htab, rtx x,
16035 enum insert_option option)
16036 {
16037 rtx base, offset;
16038 mips_lo_sum_offset **slot;
16039 struct mips_lo_sum_offset *entry;
16040
16041 /* Split X into a base and offset. */
16042 split_const (x, &base, &offset);
16043 if (UNSPEC_ADDRESS_P (base))
16044 base = UNSPEC_ADDRESS (base);
16045
16046 /* Look up the base in the hash table. */
16047 slot = htab->find_slot_with_hash (base, mips_hash_base (base), option);
16048 if (slot == NULL)
16049 return false;
16050
16051 entry = (struct mips_lo_sum_offset *) *slot;
16052 if (option == INSERT)
16053 {
16054 if (entry == NULL)
16055 {
16056 entry = XNEW (struct mips_lo_sum_offset);
16057 entry->base = base;
16058 entry->offset = INTVAL (offset);
16059 *slot = entry;
16060 }
16061 else
16062 {
16063 if (INTVAL (offset) > entry->offset)
16064 entry->offset = INTVAL (offset);
16065 }
16066 }
16067 return INTVAL (offset) <= entry->offset;
16068 }
16069
16070 /* A for_each_rtx callback for which DATA is a mips_lo_sum_offset hash table.
16071 Record every LO_SUM in *LOC. */
16072
16073 static int
16074 mips_record_lo_sum (rtx *loc, void *data)
16075 {
16076 if (GET_CODE (*loc) == LO_SUM)
16077 mips_lo_sum_offset_lookup ((mips_offset_table*) data,
16078 XEXP (*loc, 1), INSERT);
16079 return 0;
16080 }
16081
16082 /* Return true if INSN is a SET of an orphaned high-part relocation.
16083 HTAB is a hash table of mips_lo_sum_offsets that describes all the
16084 LO_SUMs in the current function. */
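/* For instance (register and symbol illustrative), a

	lui	$2,%hi(sym)

   whose partnering "addiu $2,$2,%lo(sym)" has been optimized away is
   orphaned: it computes a value with no remaining use, and
   mips_reorg_process_insns deletes it or turns it into a nop.  */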
16085
16086 static bool
16087 mips_orphaned_high_part_p (mips_offset_table *htab, rtx insn)
16088 {
16089 enum mips_symbol_type type;
16090 rtx x, set;
16091
16092 set = single_set (insn);
16093 if (set)
16094 {
16095 /* Check for %his. */
16096 x = SET_SRC (set);
16097 if (GET_CODE (x) == HIGH
16098 && absolute_symbolic_operand (XEXP (x, 0), VOIDmode))
16099 return !mips_lo_sum_offset_lookup (htab, XEXP (x, 0), NO_INSERT);
16100
16101 /* Check for local %gots (and %got_pages, which is redundant but OK). */
16102 if (GET_CODE (x) == UNSPEC
16103 && XINT (x, 1) == UNSPEC_LOAD_GOT
16104 && mips_symbolic_constant_p (XVECEXP (x, 0, 1),
16105 SYMBOL_CONTEXT_LEA, &type)
16106 && type == SYMBOL_GOTOFF_PAGE)
16107 return !mips_lo_sum_offset_lookup (htab, XVECEXP (x, 0, 1), NO_INSERT);
16108 }
16109 return false;
16110 }
16111
16112 /* Subroutine of mips_reorg_process_insns. If there is a hazard between
16113 INSN and a previous instruction, avoid it by inserting nops after
16114 instruction AFTER.
16115
16116 *DELAYED_REG and *HILO_DELAY describe the hazards that apply at
16117 this point. If *DELAYED_REG is non-null, INSN must wait a cycle
16118 before using the value of that register. *HILO_DELAY counts the
16119 number of instructions since the last hilo hazard (that is,
16120 the number of instructions since the last MFLO or MFHI).
16121
16122 After inserting nops for INSN, update *DELAYED_REG and *HILO_DELAY
16123 for the next instruction.
16124
16125 LO_REG is an rtx for the LO register, used in dependence checking. */
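/* For example (registers illustrative), on targets with the HI/LO
   hazard, the sequence

	mflo	$2
	mult	$4,$5

   needs two nops between the MFLO and the MULT, because the MULT
   writes LO within two instructions of the MFLO.  */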
16126
16127 static void
16128 mips_avoid_hazard (rtx_insn *after, rtx_insn *insn, int *hilo_delay,
16129 rtx *delayed_reg, rtx lo_reg)
16130 {
16131 rtx pattern, set;
16132 int nops, ninsns;
16133
16134 pattern = PATTERN (insn);
16135
16136 /* Do not put the whole function in .set noreorder if it contains
16137 an asm statement. We don't know whether there will be hazards
16138 between the asm statement and the gcc-generated code. */
16139 if (GET_CODE (pattern) == ASM_INPUT || asm_noperands (pattern) >= 0)
16140 cfun->machine->all_noreorder_p = false;
16141
16142 /* Ignore zero-length instructions (barriers and the like). */
16143 ninsns = get_attr_length (insn) / 4;
16144 if (ninsns == 0)
16145 return;
16146
16147 /* Work out how many nops are needed. Note that we only care about
16148 registers that are explicitly mentioned in the instruction's pattern.
16149 It doesn't matter that calls use the argument registers or that they
16150 clobber hi and lo. */
16151 if (*hilo_delay < 2 && reg_set_p (lo_reg, pattern))
16152 nops = 2 - *hilo_delay;
16153 else if (*delayed_reg != 0 && reg_referenced_p (*delayed_reg, pattern))
16154 nops = 1;
16155 else
16156 nops = 0;
16157
16158 /* Insert the nops between this instruction and the previous one.
16159 Each new nop takes us further from the last hilo hazard. */
16160 *hilo_delay += nops;
16161 while (nops-- > 0)
16162 emit_insn_after (gen_hazard_nop (), after);
16163
16164 /* Set up the state for the next instruction. */
16165 *hilo_delay += ninsns;
16166 *delayed_reg = 0;
16167 if (INSN_CODE (insn) >= 0)
16168 switch (get_attr_hazard (insn))
16169 {
16170 case HAZARD_NONE:
16171 break;
16172
16173 case HAZARD_HILO:
16174 *hilo_delay = 0;
16175 break;
16176
16177 case HAZARD_DELAY:
16178 set = single_set (insn);
16179 gcc_assert (set);
16180 *delayed_reg = SET_DEST (set);
16181 break;
16182 }
16183 }
16184
16185 /* Go through the instruction stream and insert nops where necessary.
16186 Also delete any high-part relocations whose partnering low parts
16187 are now all dead. See if the whole function can then be put into
16188 .set noreorder and .set nomacro. */
16189
16190 static void
16191 mips_reorg_process_insns (void)
16192 {
16193 rtx_insn *insn, *last_insn, *subinsn, *next_insn;
16194 rtx lo_reg, delayed_reg;
16195 int hilo_delay;
16196
16197 /* Force all instructions to be split into their final form. */
16198 split_all_insns_noflow ();
16199
16200 /* Recalculate instruction lengths without taking nops into account. */
16201 cfun->machine->ignore_hazard_length_p = true;
16202 shorten_branches (get_insns ());
16203
16204 cfun->machine->all_noreorder_p = true;
16205
16206 /* We don't track MIPS16 PC-relative offsets closely enough to do
16207 a good job of ".set noreorder" code in MIPS16 mode. */
16208 if (TARGET_MIPS16)
16209 cfun->machine->all_noreorder_p = false;
16210
16211 /* Code that doesn't use explicit relocs can't be ".set nomacro". */
16212 if (!TARGET_EXPLICIT_RELOCS)
16213 cfun->machine->all_noreorder_p = false;
16214
16215 /* Profiled functions can't be all noreorder because the profiler
16216 support uses assembler macros. */
16217 if (crtl->profile)
16218 cfun->machine->all_noreorder_p = false;
16219
16220 /* Code compiled with -mfix-vr4120, -mfix-rm7000 or -mfix-24k can't be
16221 all noreorder because we rely on the assembler to work around some
16222 errata. The R5900 likewise has several such errata. */
16223 if (TARGET_FIX_VR4120
16224 || TARGET_FIX_RM7000
16225 || TARGET_FIX_24K
16226 || TARGET_MIPS5900)
16227 cfun->machine->all_noreorder_p = false;
16228
16229 /* The same is true for -mfix-vr4130 if we might generate MFLO or
16230 MFHI instructions. Note that we avoid using MFLO and MFHI if
16231 the VR4130 MACC and DMACC instructions are available instead;
16232 see the *mfhilo_{si,di}_macc patterns. */
16233 if (TARGET_FIX_VR4130 && !ISA_HAS_MACCHI)
16234 cfun->machine->all_noreorder_p = false;
16235
16236 mips_offset_table htab (37);
16237
16238 /* Make a first pass over the instructions, recording all the LO_SUMs. */
16239 for (insn = get_insns (); insn != 0; insn = NEXT_INSN (insn))
16240 FOR_EACH_SUBINSN (subinsn, insn)
16241 if (USEFUL_INSN_P (subinsn))
16242 {
16243 rtx body = PATTERN (insn);
16244 int noperands = asm_noperands (body);
16245 if (noperands >= 0)
16246 {
16247 rtx *ops = XALLOCAVEC (rtx, noperands);
16248 bool *used = XALLOCAVEC (bool, noperands);
16249 const char *string = decode_asm_operands (body, ops, NULL, NULL,
16250 NULL, NULL);
16251 get_referenced_operands (string, used, noperands);
16252 for (int i = 0; i < noperands; ++i)
16253 if (used[i])
16254 for_each_rtx (&ops[i], mips_record_lo_sum, &htab);
16255 }
16256 else
16257 for_each_rtx (&PATTERN (subinsn), mips_record_lo_sum, &htab);
16258 }
16259
16260 last_insn = 0;
16261 hilo_delay = 2;
16262 delayed_reg = 0;
16263 lo_reg = gen_rtx_REG (SImode, LO_REGNUM);
16264
16265 /* Make a second pass over the instructions. Delete orphaned
16266 high-part relocations or turn them into NOPs. Avoid hazards
16267 by inserting NOPs. */
16268 for (insn = get_insns (); insn != 0; insn = next_insn)
16269 {
16270 next_insn = NEXT_INSN (insn);
16271 if (USEFUL_INSN_P (insn))
16272 {
16273 if (GET_CODE (PATTERN (insn)) == SEQUENCE)
16274 {
16275 /* If we find an orphaned high-part relocation in a delay
16276 slot, it's easier to turn that instruction into a NOP than
16277 to delete it. The delay slot will be a NOP either way. */
16278 FOR_EACH_SUBINSN (subinsn, insn)
16279 if (INSN_P (subinsn))
16280 {
16281 if (mips_orphaned_high_part_p (&htab, subinsn))
16282 {
16283 PATTERN (subinsn) = gen_nop ();
16284 INSN_CODE (subinsn) = CODE_FOR_nop;
16285 }
16286 mips_avoid_hazard (last_insn, subinsn, &hilo_delay,
16287 &delayed_reg, lo_reg);
16288 }
16289 last_insn = insn;
16290 }
16291 else
16292 {
16293 /* INSN is a single instruction. Delete it if it's an
16294 orphaned high-part relocation. */
16295 if (mips_orphaned_high_part_p (&htab, insn))
16296 delete_insn (insn);
16297 /* Also delete cache barriers if the last instruction
16298 was an annulled branch. INSN will not be speculatively
16299 executed. */
16300 else if (recog_memoized (insn) == CODE_FOR_r10k_cache_barrier
16301 && last_insn
16302 && JUMP_P (SEQ_BEGIN (last_insn))
16303 && INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (last_insn)))
16304 delete_insn (insn);
16305 else
16306 {
16307 mips_avoid_hazard (last_insn, insn, &hilo_delay,
16308 &delayed_reg, lo_reg);
16309 last_insn = insn;
16310 }
16311 }
16312 }
16313 }
16314 }
16315
16316 /* Return true if the function has a long branch instruction. */
16317
16318 static bool
16319 mips_has_long_branch_p (void)
16320 {
16321 rtx_insn *insn, *subinsn;
16322 int normal_length;
16323
16324 /* We need up-to-date instruction lengths. */
16325 shorten_branches (get_insns ());
16326
16327 /* Look for a branch that is longer than normal. The normal length for
16328 non-MIPS16 branches is 8, because the length includes the delay slot.
16329 It is 4 for MIPS16, because MIPS16 branches are extended instructions,
16330 but they have no delay slot. */
16331 normal_length = (TARGET_MIPS16 ? 4 : 8);
16332 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
16333 FOR_EACH_SUBINSN (subinsn, insn)
16334 if (JUMP_P (subinsn)
16335 && get_attr_length (subinsn) > normal_length
16336 && (any_condjump_p (subinsn) || any_uncondjump_p (subinsn)))
16337 return true;
16338
16339 return false;
16340 }
16341
16342 /* If we are using a GOT, but have not decided to use a global pointer yet,
16343 see whether we need one to implement long branches. Convert the ghost
16344 global-pointer instructions into real ones if so. */
16345
16346 static bool
16347 mips_expand_ghost_gp_insns (void)
16348 {
16349 /* Quick exit if we already know that we will or won't need a
16350 global pointer. */
16351 if (!TARGET_USE_GOT
16352 || cfun->machine->global_pointer == INVALID_REGNUM
16353 || mips_must_initialize_gp_p ())
16354 return false;
16355
16356 /* Run a full check for long branches. */
16357 if (!mips_has_long_branch_p ())
16358 return false;
16359
16360 /* We've now established that we need $gp. */
16361 cfun->machine->must_initialize_gp_p = true;
16362 split_all_insns_noflow ();
16363
16364 return true;
16365 }
16366
16367 /* Subroutine of mips_reorg to manage passes that require DF. */
16368
16369 static void
16370 mips_df_reorg (void)
16371 {
16372 /* Create def-use chains. */
16373 df_set_flags (DF_EQ_NOTES);
16374 df_chain_add_problem (DF_UD_CHAIN);
16375 df_analyze ();
16376
16377 if (TARGET_RELAX_PIC_CALLS)
16378 mips_annotate_pic_calls ();
16379
16380 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE)
16381 r10k_insert_cache_barriers ();
16382
16383 df_finish_pass (false);
16384 }
16385
16386 /* Emit code to load LABEL_REF SRC into MIPS16 register DEST. This is
16387 called very late in mips_reorg, but the caller is required to run
16388 mips16_lay_out_constants on the result. */
16389
16390 static void
16391 mips16_load_branch_target (rtx dest, rtx src)
16392 {
16393 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS)
16394 {
16395 rtx page, low;
16396
16397 if (mips_cfun_has_cprestore_slot_p ())
16398 mips_emit_move (dest, mips_cprestore_slot (dest, true));
16399 else
16400 mips_emit_move (dest, pic_offset_table_rtx);
16401 page = mips_unspec_address (src, SYMBOL_GOTOFF_PAGE);
16402 low = mips_unspec_address (src, SYMBOL_GOT_PAGE_OFST);
16403 emit_insn (gen_rtx_SET (VOIDmode, dest,
16404 PMODE_INSN (gen_unspec_got, (dest, page))));
16405 emit_insn (gen_rtx_SET (VOIDmode, dest,
16406 gen_rtx_LO_SUM (Pmode, dest, low)));
16407 }
16408 else
16409 {
16410 src = mips_unspec_address (src, SYMBOL_ABSOLUTE);
16411 mips_emit_move (dest, src);
16412 }
16413 }
16414
16415 /* If we're compiling a MIPS16 function, look for and split any long branches.
16416 This must be called after all other instruction modifications in
16417 mips_reorg. */
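/* Each out-of-range branch is rewritten along these lines (register
   numbers illustrative):

	bnez	$4,1f		# inverted original "beqz $4,far"
	move	$1,$2		# free $2 by saving it in $1
	<load the address of "far" into $2>
	jr	$2		# jump, restoring $2 from $1
   1:

   A simple unconditional jump gets the same long form but no
   branch-around label.  */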
16418
16419 static void
16420 mips16_split_long_branches (void)
16421 {
16422 bool something_changed;
16423
16424 if (!TARGET_MIPS16)
16425 return;
16426
16427 /* Loop until the alignments for all targets are sufficient. */
16428 do
16429 {
16430 rtx_insn *insn;
16431
16432 shorten_branches (get_insns ());
16433 something_changed = false;
16434 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
16435 if (JUMP_P (insn)
16436 && get_attr_length (insn) > 4
16437 && (any_condjump_p (insn) || any_uncondjump_p (insn)))
16438 {
16439 rtx old_label, new_label, temp, saved_temp;
16440 rtx target;
16441 rtx_insn *jump, *jump_sequence;
16442
16443 start_sequence ();
16444
16445 /* Free up a MIPS16 register by saving it in $1. */
16446 saved_temp = gen_rtx_REG (Pmode, AT_REGNUM);
16447 temp = gen_rtx_REG (Pmode, GP_REG_FIRST + 2);
16448 emit_move_insn (saved_temp, temp);
16449
16450 /* Load the branch target into TEMP. */
16451 old_label = JUMP_LABEL (insn);
16452 target = gen_rtx_LABEL_REF (Pmode, old_label);
16453 mips16_load_branch_target (temp, target);
16454
16455 /* Jump to the target and restore the register's
16456 original value. */
16457 jump = emit_jump_insn (PMODE_INSN (gen_indirect_jump_and_restore,
16458 (temp, temp, saved_temp)));
16459 JUMP_LABEL (jump) = old_label;
16460 LABEL_NUSES (old_label)++;
16461
16462 /* Rewrite any symbolic references that are supposed to use
16463 a PC-relative constant pool. */
16464 mips16_lay_out_constants (false);
16465
16466 if (simplejump_p (insn))
16467 /* We're going to replace INSN with a longer form. */
16468 new_label = NULL_RTX;
16469 else
16470 {
16471 /* Create a branch-around label for the original
16472 instruction. */
16473 new_label = gen_label_rtx ();
16474 emit_label (new_label);
16475 }
16476
16477 jump_sequence = get_insns ();
16478 end_sequence ();
16479
16480 emit_insn_after (jump_sequence, insn);
16481 if (new_label)
16482 invert_jump (insn, new_label, false);
16483 else
16484 delete_insn (insn);
16485 something_changed = true;
16486 }
16487 }
16488 while (something_changed);
16489 }
16490
16491 /* Implement TARGET_MACHINE_DEPENDENT_REORG. */
16492
16493 static void
16494 mips_reorg (void)
16495 {
16496 /* Restore the BLOCK_FOR_INSN pointers, which are needed by DF. Also during
16497 insn splitting in mips16_lay_out_constants, DF insn info is only kept up
16498 to date if the CFG is available. */
16499 if (mips_cfg_in_reorg ())
16500 compute_bb_for_insn ();
16501 mips16_lay_out_constants (true);
16502 if (mips_cfg_in_reorg ())
16503 {
16504 mips_df_reorg ();
16505 free_bb_for_insn ();
16506 }
16507 }
16508
16509 /* We use a machine specific pass to do a second machine dependent reorg
16510 pass after delay branch scheduling. */
16511
16512 static unsigned int
16513 mips_machine_reorg2 (void)
16514 {
16515 mips_reorg_process_insns ();
16516 if (!TARGET_MIPS16
16517 && TARGET_EXPLICIT_RELOCS
16518 && TUNE_MIPS4130
16519 && TARGET_VR4130_ALIGN)
16520 vr4130_align_insns ();
16521 if (mips_expand_ghost_gp_insns ())
16522 /* The expansion could invalidate some of the VR4130 alignment
16523 optimizations, but this should be an extremely rare case anyhow. */
16524 mips_reorg_process_insns ();
16525 mips16_split_long_branches ();
16526 return 0;
16527 }
16528
16529 namespace {
16530
16531 const pass_data pass_data_mips_machine_reorg2 =
16532 {
16533 RTL_PASS, /* type */
16534 "mach2", /* name */
16535 OPTGROUP_NONE, /* optinfo_flags */
16536 TV_MACH_DEP, /* tv_id */
16537 0, /* properties_required */
16538 0, /* properties_provided */
16539 0, /* properties_destroyed */
16540 0, /* todo_flags_start */
16541 0, /* todo_flags_finish */
16542 };
16543
16544 class pass_mips_machine_reorg2 : public rtl_opt_pass
16545 {
16546 public:
16547 pass_mips_machine_reorg2(gcc::context *ctxt)
16548 : rtl_opt_pass(pass_data_mips_machine_reorg2, ctxt)
16549 {}
16550
16551 /* opt_pass methods: */
16552 virtual unsigned int execute (function *) { return mips_machine_reorg2 (); }
16553
16554 }; // class pass_mips_machine_reorg2
16555
16556 } // anon namespace
16557
16558 rtl_opt_pass *
16559 make_pass_mips_machine_reorg2 (gcc::context *ctxt)
16560 {
16561 return new pass_mips_machine_reorg2 (ctxt);
16562 }
16563
16564 \f
16565 /* Implement TARGET_ASM_OUTPUT_MI_THUNK. Generate rtl rather than asm text
16566 in order to avoid duplicating too much logic from elsewhere. */
16567
16568 static void
16569 mips_output_mi_thunk (FILE *file, tree thunk_fndecl ATTRIBUTE_UNUSED,
16570 HOST_WIDE_INT delta, HOST_WIDE_INT vcall_offset,
16571 tree function)
16572 {
16573 rtx this_rtx, temp1, temp2, fnaddr;
16574 rtx_insn *insn;
16575 bool use_sibcall_p;
16576
16577 /* Pretend to be a post-reload pass while generating rtl. */
16578 reload_completed = 1;
16579
16580 /* Mark the end of the (empty) prologue. */
16581 emit_note (NOTE_INSN_PROLOGUE_END);
16582
16583 /* Determine if we can use a sibcall to call FUNCTION directly. */
16584 fnaddr = XEXP (DECL_RTL (function), 0);
16585 use_sibcall_p = (mips_function_ok_for_sibcall (function, NULL)
16586 && const_call_insn_operand (fnaddr, Pmode));
16587
16588 /* Determine if we need to load FNADDR from the GOT. */
16589 if (!use_sibcall_p
16590 && (mips_got_symbol_type_p
16591 (mips_classify_symbol (fnaddr, SYMBOL_CONTEXT_LEA))))
16592 {
16593 /* Pick a global pointer. Use a call-clobbered register if
16594 TARGET_CALL_SAVED_GP. */
16595 cfun->machine->global_pointer
16596 = TARGET_CALL_SAVED_GP ? 15 : GLOBAL_POINTER_REGNUM;
16597 cfun->machine->must_initialize_gp_p = true;
16598 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
16599
16600 /* Set up the global pointer for n32 or n64 abicalls. */
16601 mips_emit_loadgp ();
16602 }
16603
16604 /* We need two temporary registers in some cases. */
16605 temp1 = gen_rtx_REG (Pmode, 2);
16606 temp2 = gen_rtx_REG (Pmode, 3);
16607
16608 /* Find out which register contains the "this" pointer. */
16609 if (aggregate_value_p (TREE_TYPE (TREE_TYPE (function)), function))
16610 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST + 1);
16611 else
16612 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST);
16613
16614 /* Add DELTA to THIS_RTX. */
16615 if (delta != 0)
16616 {
16617 rtx offset = GEN_INT (delta);
16618 if (!SMALL_OPERAND (delta))
16619 {
16620 mips_emit_move (temp1, offset);
16621 offset = temp1;
16622 }
16623 emit_insn (gen_add3_insn (this_rtx, this_rtx, offset));
16624 }
16625
16626 /* If needed, add *(*THIS_RTX + VCALL_OFFSET) to THIS_RTX. */
16627 if (vcall_offset != 0)
16628 {
16629 rtx addr;
16630
16631 /* Set TEMP1 to *THIS_RTX. */
16632 mips_emit_move (temp1, gen_rtx_MEM (Pmode, this_rtx));
16633
16634 /* Set ADDR to a legitimate address for *THIS_RTX + VCALL_OFFSET. */
16635 addr = mips_add_offset (temp2, temp1, vcall_offset);
16636
16637 /* Load the offset and add it to THIS_RTX. */
16638 mips_emit_move (temp1, gen_rtx_MEM (Pmode, addr));
16639 emit_insn (gen_add3_insn (this_rtx, this_rtx, temp1));
16640 }
16641
16642 /* Jump to the target function. Use a sibcall if direct jumps are
16643 allowed, otherwise load the address into a register first. */
16644 if (use_sibcall_p)
16645 {
16646 insn = emit_call_insn (gen_sibcall_internal (fnaddr, const0_rtx));
16647 SIBLING_CALL_P (insn) = 1;
16648 }
16649 else
16650 {
16651 /* This is messy. GAS treats "la $25,foo" as part of a call
16652 sequence and may allow a global "foo" to be lazily bound.
16653 The general move patterns therefore reject this combination.
16654
16655 In this context, lazy binding would actually be OK
16656 for TARGET_CALL_CLOBBERED_GP, but it's still wrong for
16657 TARGET_CALL_SAVED_GP; see mips_load_call_address.
16658 We must therefore load the address via a temporary
16659 register if mips_dangerous_for_la25_p.
16660
16661 If we jump to the temporary register rather than $25,
16662 the assembler can use the move insn to fill the jump's
16663 delay slot.
16664
16665 We can use the same technique for MIPS16 code, where $25
16666 is not a valid JR register. */
16667 if (TARGET_USE_PIC_FN_ADDR_REG
16668 && !TARGET_MIPS16
16669 && !mips_dangerous_for_la25_p (fnaddr))
16670 temp1 = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
16671 mips_load_call_address (MIPS_CALL_SIBCALL, temp1, fnaddr);
16672
16673 if (TARGET_USE_PIC_FN_ADDR_REG
16674 && REGNO (temp1) != PIC_FUNCTION_ADDR_REGNUM)
16675 mips_emit_move (gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM), temp1);
16676 emit_jump_insn (gen_indirect_jump (temp1));
16677 }
16678
16679 /* Run just enough of rest_of_compilation. This sequence was
16680 "borrowed" from alpha.c. */
16681 insn = get_insns ();
16682 split_all_insns_noflow ();
16683 mips16_lay_out_constants (true);
16684 shorten_branches (insn);
16685 final_start_function (insn, file, 1);
16686 final (insn, file, 1);
16687 final_end_function ();
16688
16689 /* Clean up the vars set above. Note that final_end_function resets
16690 the global pointer for us. */
16691 reload_completed = 0;
16692 }
16693 \f
16694
16695 /* The last argument passed to mips_set_compression_mode,
16696 or (unsigned int) -1 if the function hasn't been called yet. */
16697 static unsigned int old_compression_mode = -1;
16698
16699 /* Set up the target-dependent global state for ISA mode COMPRESSION_MODE,
16700 which is either MASK_MIPS16 or MASK_MICROMIPS. */
16701
16702 static void
16703 mips_set_compression_mode (unsigned int compression_mode)
16704 {
16706 if (compression_mode == old_compression_mode)
16707 return;
16708
16709 /* Restore base settings of various flags. */
16710 target_flags = mips_base_target_flags;
16711 flag_schedule_insns = mips_base_schedule_insns;
16712 flag_reorder_blocks_and_partition = mips_base_reorder_blocks_and_partition;
16713 flag_move_loop_invariants = mips_base_move_loop_invariants;
16714 align_loops = mips_base_align_loops;
16715 align_jumps = mips_base_align_jumps;
16716 align_functions = mips_base_align_functions;
16717 target_flags &= ~(MASK_MIPS16 | MASK_MICROMIPS);
16718 target_flags |= compression_mode;
16719
16720 if (compression_mode & MASK_MIPS16)
16721 {
16722 /* Switch to MIPS16 mode. */
16723 target_flags |= MASK_MIPS16;
16724
16725 /* Turn off SYNCI if it was on, MIPS16 doesn't support it. */
16726 target_flags &= ~MASK_SYNCI;
16727
16728 /* Don't run the scheduler before reload, since it tends to
16729 increase register pressure. */
16730 flag_schedule_insns = 0;
16731
16732 /* Don't do hot/cold partitioning. mips16_lay_out_constants expects
16733 the whole function to be in a single section. */
16734 flag_reorder_blocks_and_partition = 0;
16735
16736 /* Don't move loop invariants, because it tends to increase
16737 register pressure. It also introduces an extra move in cases
16738 where the constant is the first operand in a two-operand binary
16739 instruction, or when it forms a register argument to a function
16740 call. */
16741 flag_move_loop_invariants = 0;
16742
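/* The MIPS16 support relies on explicit relocation operators. */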
16743 target_flags |= MASK_EXPLICIT_RELOCS;
16744
16745 /* Experiments suggest we get the best overall section-anchor
16746 results from using the range of an unextended LW or SW. Code
16747 that makes heavy use of byte or short accesses can do better
16748 with ranges of 0...31 and 0...63 respectively, but most code is
16749 sensitive to the range of LW and SW instead. */
16750 targetm.min_anchor_offset = 0;
16751 targetm.max_anchor_offset = 127;
16752
16753 targetm.const_anchor = 0;
16754
16755 /* MIPS16 has no BAL instruction. */
16756 target_flags &= ~MASK_RELAX_PIC_CALLS;
16757
16758 /* The R4000 errata don't apply to any known MIPS16 cores.
16759 It's simpler to make the R4000 fixes and MIPS16 mode
16760 mutually exclusive. */
16761 target_flags &= ~MASK_FIX_R4000;
16762
16763 if (flag_pic && !TARGET_OLDABI)
16764 sorry ("MIPS16 PIC for ABIs other than o32 and o64");
16765
16766 if (TARGET_XGOT)
16767 sorry ("MIPS16 -mxgot code");
16768
16769 if (TARGET_HARD_FLOAT_ABI && !TARGET_OLDABI)
16770 sorry ("hard-float MIPS16 code for ABIs other than o32 and o64");
16771 }
16772 else
16773 {
16774 /* Switch to microMIPS or the standard encoding. */
16775
16776 if (TARGET_MICROMIPS)
16777 /* Avoid branch likely. */
16778 target_flags &= ~MASK_BRANCHLIKELY;
16779
16780 /* Provide default values for align_* for 64-bit targets. */
16781 if (TARGET_64BIT)
16782 {
16783 if (align_loops == 0)
16784 align_loops = 8;
16785 if (align_jumps == 0)
16786 align_jumps = 8;
16787 if (align_functions == 0)
16788 align_functions = 8;
16789 }
16790
16791 targetm.min_anchor_offset = -32768;
16792 targetm.max_anchor_offset = 32767;
16793
16794 targetm.const_anchor = 0x8000;
16795 }
16796
16797 /* (Re)initialize MIPS target internals for new ISA. */
16798 mips_init_relocs ();
16799
16800 if (compression_mode & MASK_MIPS16)
16801 {
16802 if (!mips16_globals)
16803 mips16_globals = save_target_globals_default_opts ();
16804 else
16805 restore_target_globals (mips16_globals);
16806 }
16807 else
16808 restore_target_globals (&default_target_globals);
16809
16810 old_compression_mode = compression_mode;
16811 }
16812
16813 /* Implement TARGET_SET_CURRENT_FUNCTION. Decide whether the current
16814 function should use the MIPS16 or microMIPS ISA and switch modes
16815 accordingly. */
16816
16817 static void
16818 mips_set_current_function (tree fndecl)
16819 {
16820 mips_set_compression_mode (mips_get_compress_mode (fndecl));
16821 }
16822 \f
16823 /* Allocate a chunk of memory for per-function machine-dependent data. */
16824
16825 static struct machine_function *
16826 mips_init_machine_status (void)
16827 {
16828 return ggc_cleared_alloc<machine_function> ();
16829 }
16830
16831 /* Return the processor associated with the given ISA level, or null
16832 if the ISA isn't valid. */
16833
16834 static const struct mips_cpu_info *
16835 mips_cpu_info_from_isa (int isa)
16836 {
16837 unsigned int i;
16838
16839 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
16840 if (mips_cpu_info_table[i].isa == isa)
16841 return mips_cpu_info_table + i;
16842
16843 return NULL;
16844 }
16845
16846 /* Return a mips_cpu_info entry determined by an option valued
16847 OPT. */
16848
16849 static const struct mips_cpu_info *
16850 mips_cpu_info_from_opt (int opt)
16851 {
16852 switch (opt)
16853 {
16854 case MIPS_ARCH_OPTION_FROM_ABI:
16855 /* 'from-abi' selects the most compatible architecture for the
16856 given ABI: MIPS I for 32-bit ABIs and MIPS III for 64-bit
16857 ABIs. For the EABIs, we have to decide whether we're using
16858 the 32-bit or 64-bit version. */
16859 return mips_cpu_info_from_isa (ABI_NEEDS_32BIT_REGS ? 1
16860 : ABI_NEEDS_64BIT_REGS ? 3
16861 : (TARGET_64BIT ? 3 : 1));
16862
16863 case MIPS_ARCH_OPTION_NATIVE:
16864 gcc_unreachable ();
16865
16866 default:
16867 return &mips_cpu_info_table[opt];
16868 }
16869 }
16870
16871 /* Return a default mips_cpu_info entry, given that no -march= option
16872 was explicitly specified. */
16873
16874 static const struct mips_cpu_info *
16875 mips_default_arch (void)
16876 {
16877 #if defined (MIPS_CPU_STRING_DEFAULT)
16878 unsigned int i;
16879 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
16880 if (strcmp (mips_cpu_info_table[i].name, MIPS_CPU_STRING_DEFAULT) == 0)
16881 return mips_cpu_info_table + i;
16882 gcc_unreachable ();
16883 #elif defined (MIPS_ISA_DEFAULT)
16884 return mips_cpu_info_from_isa (MIPS_ISA_DEFAULT);
16885 #else
16886 /* 'from-abi' makes a good default: you get whatever the ABI
16887 requires. */
16888 return mips_cpu_info_from_opt (MIPS_ARCH_OPTION_FROM_ABI);
16889 #endif
16890 }
16891
16892 /* Set up globals to generate code for the ISA or processor
16893 described by INFO. */
16894
16895 static void
16896 mips_set_architecture (const struct mips_cpu_info *info)
16897 {
16898 if (info != 0)
16899 {
16900 mips_arch_info = info;
16901 mips_arch = info->cpu;
16902 mips_isa = info->isa;
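/* ISA levels 32, 33, 64 and 65 encode MIPS32, MIPS32r2, MIPS64 and
MIPS64r2 respectively, so for them the low five bits hold the
release number minus one. */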
16903 if (mips_isa < 32)
16904 mips_isa_rev = 0;
16905 else
16906 mips_isa_rev = (mips_isa & 31) + 1;
16907 }
16908 }
16909
16910 /* Likewise for tuning. */
16911
16912 static void
16913 mips_set_tune (const struct mips_cpu_info *info)
16914 {
16915 if (info != 0)
16916 {
16917 mips_tune_info = info;
16918 mips_tune = info->cpu;
16919 }
16920 }
16921
16922 /* Implement TARGET_OPTION_OVERRIDE. */
16923
16924 static void
16925 mips_option_override (void)
16926 {
16927 int i, start, regno, mode;
16928
16929 if (global_options_set.x_mips_isa_option)
16930 mips_isa_option_info = &mips_cpu_info_table[mips_isa_option];
16931
16932 #ifdef SUBTARGET_OVERRIDE_OPTIONS
16933 SUBTARGET_OVERRIDE_OPTIONS;
16934 #endif
16935
16936 /* MIPS16 and microMIPS cannot coexist. */
16937 if (TARGET_MICROMIPS && TARGET_MIPS16)
16938 error ("unsupported combination: %s", "-mips16 -mmicromips");
16939
16940 /* Save the base compression state and process flags as though we
16941 were generating uncompressed code. */
16942 mips_base_compression_flags = TARGET_COMPRESSION;
16943 target_flags &= ~TARGET_COMPRESSION;
16944
16945 /* -mno-float overrides -mhard-float and -msoft-float. */
16946 if (TARGET_NO_FLOAT)
16947 {
16948 target_flags |= MASK_SOFT_FLOAT_ABI;
16949 target_flags_explicit |= MASK_SOFT_FLOAT_ABI;
16950 }
16951
16952 if (TARGET_FLIP_MIPS16)
16953 TARGET_INTERLINK_COMPRESSED = 1;
16954
16955 /* Set the small data limit. */
16956 mips_small_data_threshold = (global_options_set.x_g_switch_value
16957 ? g_switch_value
16958 : MIPS_DEFAULT_GVALUE);
16959
16960 /* The following code determines the architecture and register size.
16961 Similar code was added to GAS 2.14 (see tc-mips.c:md_after_parse_args()).
16962 The GAS and GCC code should be kept in sync as much as possible. */
16963
16964 if (global_options_set.x_mips_arch_option)
16965 mips_set_architecture (mips_cpu_info_from_opt (mips_arch_option));
16966
16967 if (mips_isa_option_info != 0)
16968 {
16969 if (mips_arch_info == 0)
16970 mips_set_architecture (mips_isa_option_info);
16971 else if (mips_arch_info->isa != mips_isa_option_info->isa)
16972 error ("%<-%s%> conflicts with the other architecture options, "
16973 "which specify a %s processor",
16974 mips_isa_option_info->name,
16975 mips_cpu_info_from_isa (mips_arch_info->isa)->name);
16976 }
16977
16978 if (mips_arch_info == 0)
16979 mips_set_architecture (mips_default_arch ());
16980
16981 if (ABI_NEEDS_64BIT_REGS && !ISA_HAS_64BIT_REGS)
16982 error ("%<-march=%s%> is not compatible with the selected ABI",
16983 mips_arch_info->name);
16984
16985 /* Optimize for mips_arch, unless -mtune selects a different processor. */
16986 if (global_options_set.x_mips_tune_option)
16987 mips_set_tune (mips_cpu_info_from_opt (mips_tune_option));
16988
16989 if (mips_tune_info == 0)
16990 mips_set_tune (mips_arch_info);
16991
16992 if ((target_flags_explicit & MASK_64BIT) != 0)
16993 {
16994 /* The user specified the size of the integer registers. Make sure
16995 it agrees with the ABI and ISA. */
16996 if (TARGET_64BIT && !ISA_HAS_64BIT_REGS)
16997 error ("%<-mgp64%> used with a 32-bit processor");
16998 else if (!TARGET_64BIT && ABI_NEEDS_64BIT_REGS)
16999 error ("%<-mgp32%> used with a 64-bit ABI");
17000 else if (TARGET_64BIT && ABI_NEEDS_32BIT_REGS)
17001 error ("%<-mgp64%> used with a 32-bit ABI");
17002 }
17003 else
17004 {
17005 /* Infer the integer register size from the ABI and processor.
17006 Restrict ourselves to 32-bit registers if that's all the
17007 processor has, or if the ABI cannot handle 64-bit registers. */
17008 if (ABI_NEEDS_32BIT_REGS || !ISA_HAS_64BIT_REGS)
17009 target_flags &= ~MASK_64BIT;
17010 else
17011 target_flags |= MASK_64BIT;
17012 }
17013
17014 if ((target_flags_explicit & MASK_FLOAT64) != 0)
17015 {
17016 if (TARGET_SINGLE_FLOAT && TARGET_FLOAT64)
17017 error ("unsupported combination: %s", "-mfp64 -msingle-float");
17018 else if (TARGET_64BIT && TARGET_DOUBLE_FLOAT && !TARGET_FLOAT64)
17019 error ("unsupported combination: %s", "-mgp64 -mfp32 -mdouble-float");
17020 else if (!TARGET_64BIT && TARGET_FLOAT64)
17021 {
17022 if (!ISA_HAS_MXHC1)
17023 error ("%<-mgp32%> and %<-mfp64%> can only be combined if"
17024 " the target supports the mfhc1 and mthc1 instructions");
17025 else if (mips_abi != ABI_32)
17026 error ("%<-mgp32%> and %<-mfp64%> can only be combined when using"
17027 " the o32 ABI");
17028 }
17029 }
17030 else
17031 {
17032 /* -msingle-float selects 32-bit float registers. Otherwise the
17033 float registers should be the same size as the integer ones. */
17034 if (TARGET_64BIT && TARGET_DOUBLE_FLOAT)
17035 target_flags |= MASK_FLOAT64;
17036 else
17037 target_flags &= ~MASK_FLOAT64;
17038 }
17039
17040 /* End of code shared with GAS. */
17041
17042 /* The R5900 FPU only supports single precision. */
17043 if (TARGET_MIPS5900 && TARGET_HARD_FLOAT_ABI && TARGET_DOUBLE_FLOAT)
17044 error ("unsupported combination: %s",
17045 "-march=r5900 -mhard-float -mdouble-float");
17046
17047 /* If a -mlong* option was given, check that it matches the ABI,
17048 otherwise infer the -mlong* setting from the other options. */
17049 if ((target_flags_explicit & MASK_LONG64) != 0)
17050 {
17051 if (TARGET_LONG64)
17052 {
17053 if (mips_abi == ABI_N32)
17054 error ("%qs is incompatible with %qs", "-mabi=n32", "-mlong64");
17055 else if (mips_abi == ABI_32)
17056 error ("%qs is incompatible with %qs", "-mabi=32", "-mlong64");
17057 else if (mips_abi == ABI_O64 && TARGET_ABICALLS)
17058 /* We have traditionally allowed non-abicalls code to use
17059 an LP64 form of o64. However, it would take a bit more
17060 effort to support the combination of 32-bit GOT entries
17061 and 64-bit pointers, so we treat the abicalls case as
17062 an error. */
17063 error ("the combination of %qs and %qs is incompatible with %qs",
17064 "-mabi=o64", "-mabicalls", "-mlong64");
17065 }
17066 else
17067 {
17068 if (mips_abi == ABI_64)
17069 error ("%qs is incompatible with %qs", "-mabi=64", "-mlong32");
17070 }
17071 }
17072 else
17073 {
17074 if ((mips_abi == ABI_EABI && TARGET_64BIT) || mips_abi == ABI_64)
17075 target_flags |= MASK_LONG64;
17076 else
17077 target_flags &= ~MASK_LONG64;
17078 }
17079
17080 if (!TARGET_OLDABI)
17081 flag_pcc_struct_return = 0;
17082
17083 /* Decide which rtx_costs structure to use. */
17084 if (optimize_size)
17085 mips_cost = &mips_rtx_cost_optimize_size;
17086 else
17087 mips_cost = &mips_rtx_cost_data[mips_tune];
17088
17089 /* If the user hasn't specified a branch cost, use the processor's
17090 default. */
17091 if (mips_branch_cost == 0)
17092 mips_branch_cost = mips_cost->branch_cost;
17093
17094 /* If neither -mbranch-likely nor -mno-branch-likely was given
17095 on the command line, set MASK_BRANCHLIKELY based on the target
17096 architecture and tuning flags. Annulled delay slots are a
17097 size win, so we only consider the processor-specific tuning
17098 for !optimize_size. */
17099 if ((target_flags_explicit & MASK_BRANCHLIKELY) == 0)
17100 {
17101 if (ISA_HAS_BRANCHLIKELY
17102 && (optimize_size
17103 || (mips_tune_info->tune_flags & PTF_AVOID_BRANCHLIKELY) == 0))
17104 target_flags |= MASK_BRANCHLIKELY;
17105 else
17106 target_flags &= ~MASK_BRANCHLIKELY;
17107 }
17108 else if (TARGET_BRANCHLIKELY && !ISA_HAS_BRANCHLIKELY)
17109 warning (0, "the %qs architecture does not support branch-likely"
17110 " instructions", mips_arch_info->name);
17111
17112 /* If the user hasn't specified -mimadd or -mno-imadd set
17113 MASK_IMADD based on the target architecture and tuning
17114 flags. */
17115 if ((target_flags_explicit & MASK_IMADD) == 0)
17116 {
17117 if (ISA_HAS_MADD_MSUB
17118 && (mips_tune_info->tune_flags & PTF_AVOID_IMADD) == 0)
17119 target_flags |= MASK_IMADD;
17120 else
17121 target_flags &= ~MASK_IMADD;
17122 }
17123 else if (TARGET_IMADD && !ISA_HAS_MADD_MSUB)
17124 warning (0, "the %qs architecture does not support madd or msub"
17125 " instructions", mips_arch_info->name);
17126
17127 /* The effect of -mabicalls isn't defined for the EABI. */
17128 if (mips_abi == ABI_EABI && TARGET_ABICALLS)
17129 {
17130 error ("unsupported combination: %s", "-mabicalls -mabi=eabi");
17131 target_flags &= ~MASK_ABICALLS;
17132 }
17133
17134 /* PIC requires -mabicalls. */
17135 if (flag_pic)
17136 {
17137 if (mips_abi == ABI_EABI)
17138 error ("cannot generate position-independent code for %qs",
17139 "-mabi=eabi");
17140 else if (!TARGET_ABICALLS)
17141 error ("position-independent code requires %qs", "-mabicalls");
17142 }
17143
17144 if (TARGET_ABICALLS_PIC2)
17145 /* We need to set flag_pic for executables as well as DSOs
17146 because we may reference symbols that are not defined in
17147 the final executable. (MIPS does not use things like
17148 copy relocs, for example.)
17149
17150 There is a body of code that uses __PIC__ to distinguish
17151 between -mabicalls and -mno-abicalls code. The non-__PIC__
17152 variant is usually appropriate for TARGET_ABICALLS_PIC0, as
17153 long as any indirect jumps use $25. */
17154 flag_pic = 1;
17155
17156 /* -mvr4130-align is a "speed over size" optimization: it usually produces
17157 faster code, but at the expense of more nops. Enable it at -O3 and
17158 above. */
17159 if (optimize > 2 && (target_flags_explicit & MASK_VR4130_ALIGN) == 0)
17160 target_flags |= MASK_VR4130_ALIGN;
17161
17162 /* Prefer a call to memcpy over inline code when optimizing for size,
17163 though see MOVE_RATIO in mips.h. */
17164 if (optimize_size && (target_flags_explicit & MASK_MEMCPY) == 0)
17165 target_flags |= MASK_MEMCPY;
17166
17167 /* If we have a nonzero small-data limit, check that the -mgpopt
17168 setting is consistent with the other target flags. */
17169 if (mips_small_data_threshold > 0)
17170 {
17171 if (!TARGET_GPOPT)
17172 {
17173 if (!TARGET_EXPLICIT_RELOCS)
17174 error ("%<-mno-gpopt%> needs %<-mexplicit-relocs%>");
17175
17176 TARGET_LOCAL_SDATA = false;
17177 TARGET_EXTERN_SDATA = false;
17178 }
17179 else
17180 {
17181 if (TARGET_VXWORKS_RTP)
17182 warning (0, "cannot use small-data accesses for %qs", "-mrtp");
17183
17184 if (TARGET_ABICALLS)
17185 warning (0, "cannot use small-data accesses for %qs",
17186 "-mabicalls");
17187 }
17188 }
17189
17190 /* Pre-IEEE 754-2008 MIPS hardware has a quirky almost-IEEE format
17191 for all its floating point. */
17192 if (mips_nan != MIPS_IEEE_754_2008)
17193 {
17194 REAL_MODE_FORMAT (SFmode) = &mips_single_format;
17195 REAL_MODE_FORMAT (DFmode) = &mips_double_format;
17196 REAL_MODE_FORMAT (TFmode) = &mips_quad_format;
17197 }
17198
17199 /* Make sure that the user didn't turn off paired single support when
17200 MIPS-3D support is requested. */
17201 if (TARGET_MIPS3D
17202 && (target_flags_explicit & MASK_PAIRED_SINGLE_FLOAT)
17203 && !TARGET_PAIRED_SINGLE_FLOAT)
17204 error ("%<-mips3d%> requires %<-mpaired-single%>");
17205
17206 /* If TARGET_MIPS3D, enable MASK_PAIRED_SINGLE_FLOAT. */
17207 if (TARGET_MIPS3D)
17208 target_flags |= MASK_PAIRED_SINGLE_FLOAT;
17209
17210 /* Make sure that when TARGET_PAIRED_SINGLE_FLOAT is true, TARGET_FLOAT64
17211 and TARGET_HARD_FLOAT_ABI are both true. */
17212 if (TARGET_PAIRED_SINGLE_FLOAT && !(TARGET_FLOAT64 && TARGET_HARD_FLOAT_ABI))
17213 {
17214 error ("%qs must be used with %qs",
17215 TARGET_MIPS3D ? "-mips3d" : "-mpaired-single",
17216 TARGET_HARD_FLOAT_ABI ? "-mfp64" : "-mhard-float");
17217 target_flags &= ~MASK_PAIRED_SINGLE_FLOAT;
17218 TARGET_MIPS3D = 0;
17219 }
17220
17221 /* Make sure that -mpaired-single is only used on ISAs that support it.
17222 We must disable it otherwise since it relies on other ISA properties
17223 like ISA_HAS_8CC having their normal values. */
17224 if (TARGET_PAIRED_SINGLE_FLOAT && !ISA_HAS_PAIRED_SINGLE)
17225 {
17226 error ("the %qs architecture does not support paired-single"
17227 " instructions", mips_arch_info->name);
17228 target_flags &= ~MASK_PAIRED_SINGLE_FLOAT;
17229 TARGET_MIPS3D = 0;
17230 }
17231
17232 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE
17233 && !TARGET_CACHE_BUILTIN)
17234 {
17235 error ("%qs requires a target that provides the %qs instruction",
17236 "-mr10k-cache-barrier", "cache");
17237 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE;
17238 }
17239
17240 /* If TARGET_DSPR2, enable TARGET_DSP. */
17241 if (TARGET_DSPR2)
17242 TARGET_DSP = true;
17243
17244 /* .eh_frame addresses should be the same width as a C pointer.
17245 Most MIPS ABIs support only one pointer size, so the assembler
17246 will usually know exactly how big an .eh_frame address is.
17247
17248 Unfortunately, this is not true of the 64-bit EABI. The ABI was
17249 originally defined to use 64-bit pointers (i.e. it is LP64), and
17250 this is still the default mode. However, we also support an n32-like
17251 ILP32 mode, which is selected by -mlong32. The problem is that the
17252 assembler has traditionally not had an -mlong option, so it has
17253 traditionally not known whether we're using the ILP32 or LP64 form.
17254
17255 As it happens, gas versions up to and including 2.19 use _32-bit_
17256 addresses for EABI64 .cfi_* directives. This is wrong for the
17257 default LP64 mode, so we can't use the directives by default.
17258 Moreover, since gas's current behavior is at odds with gcc's
17259 default behavior, it seems unwise to rely on future versions
17260 of gas behaving the same way. We therefore avoid using .cfi
17261 directives for -mlong32 as well. */
17262 if (mips_abi == ABI_EABI && TARGET_64BIT)
17263 flag_dwarf2_cfi_asm = 0;
17264
17265 /* .cfi_* directives generate a read-only section, so fall back on
17266 manual .eh_frame creation if we need the section to be writable. */
17267 if (TARGET_WRITABLE_EH_FRAME)
17268 flag_dwarf2_cfi_asm = 0;
17269
17270 mips_init_print_operand_punct ();
17271
17272 /* Set up array to map GCC register number to debug register number.
17273 Ignore the special purpose register numbers. */
17274
17275 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
17276 {
17277 mips_dbx_regno[i] = IGNORED_DWARF_REGNUM;
17278 if (GP_REG_P (i) || FP_REG_P (i) || ALL_COP_REG_P (i))
17279 mips_dwarf_regno[i] = i;
17280 else
17281 mips_dwarf_regno[i] = INVALID_REGNUM;
17282 }
17283
17284 start = GP_DBX_FIRST - GP_REG_FIRST;
17285 for (i = GP_REG_FIRST; i <= GP_REG_LAST; i++)
17286 mips_dbx_regno[i] = i + start;
17287
17288 start = FP_DBX_FIRST - FP_REG_FIRST;
17289 for (i = FP_REG_FIRST; i <= FP_REG_LAST; i++)
17290 mips_dbx_regno[i] = i + start;
17291
17292 /* Accumulator debug registers use big-endian ordering. */
17293 mips_dbx_regno[HI_REGNUM] = MD_DBX_FIRST + 0;
17294 mips_dbx_regno[LO_REGNUM] = MD_DBX_FIRST + 1;
17295 mips_dwarf_regno[HI_REGNUM] = MD_REG_FIRST + 0;
17296 mips_dwarf_regno[LO_REGNUM] = MD_REG_FIRST + 1;
17297 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
17298 {
17299 mips_dwarf_regno[i + TARGET_LITTLE_ENDIAN] = i;
17300 mips_dwarf_regno[i + TARGET_BIG_ENDIAN] = i + 1;
17301 }
17302
17303 /* Set up mips_hard_regno_mode_ok. */
17304 for (mode = 0; mode < MAX_MACHINE_MODE; mode++)
17305 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
17306 mips_hard_regno_mode_ok[mode][regno]
17307 = mips_hard_regno_mode_ok_p (regno, (enum machine_mode) mode);
17308
17309 /* Function to allocate machine-dependent function status. */
17310 init_machine_status = &mips_init_machine_status;
17311
17312 /* Default to working around R4000 errata only if the processor
17313 was selected explicitly. */
17314 if ((target_flags_explicit & MASK_FIX_R4000) == 0
17315 && strcmp (mips_arch_info->name, "r4000") == 0)
17316 target_flags |= MASK_FIX_R4000;
17317
17318 /* Default to working around R4400 errata only if the processor
17319 was selected explicitly. */
17320 if ((target_flags_explicit & MASK_FIX_R4400) == 0
17321 && strcmp (mips_arch_info->name, "r4400") == 0)
17322 target_flags |= MASK_FIX_R4400;
17323
17324 /* Default to working around R10000 errata only if the processor
17325 was selected explicitly. */
17326 if ((target_flags_explicit & MASK_FIX_R10000) == 0
17327 && strcmp (mips_arch_info->name, "r10000") == 0)
17328 target_flags |= MASK_FIX_R10000;
17329
17330 /* Make sure that branch-likely instructions are available when using
17331 -mfix-r10000. The instructions are not available if either:
17332
17333 1. -mno-branch-likely was passed.
17334 2. The selected ISA does not support branch-likely and
17335 the command line does not include -mbranch-likely. */
17336 if (TARGET_FIX_R10000
17337 && ((target_flags_explicit & MASK_BRANCHLIKELY) == 0
17338 ? !ISA_HAS_BRANCHLIKELY
17339 : !TARGET_BRANCHLIKELY))
17340 sorry ("%qs requires branch-likely instructions", "-mfix-r10000");
17341
17342 if (TARGET_SYNCI && !ISA_HAS_SYNCI)
17343 {
17344 warning (0, "the %qs architecture does not support the synci "
17345 "instruction", mips_arch_info->name);
17346 target_flags &= ~MASK_SYNCI;
17347 }
17348
17349 /* Only optimize PIC indirect calls if they are actually required. */
17350 if (!TARGET_USE_GOT || !TARGET_EXPLICIT_RELOCS)
17351 target_flags &= ~MASK_RELAX_PIC_CALLS;
17352
17353 /* Save base state of options. */
17354 mips_base_target_flags = target_flags;
17355 mips_base_schedule_insns = flag_schedule_insns;
17356 mips_base_reorder_blocks_and_partition = flag_reorder_blocks_and_partition;
17357 mips_base_move_loop_invariants = flag_move_loop_invariants;
17358 mips_base_align_loops = align_loops;
17359 mips_base_align_jumps = align_jumps;
17360 mips_base_align_functions = align_functions;
17361
17362 /* Now select the ISA mode.
17363
17364 Do all CPP-sensitive stuff in uncompressed mode; we'll switch modes
17365 later if required. */
17366 mips_set_compression_mode (0);
17367
17368 /* We register a second machine-specific reorg pass after delay slot
17369 filling. Registering the pass must be done at startup, so it's
17370 convenient to do it here. */
17371 opt_pass *new_pass = make_pass_mips_machine_reorg2 (g);
17372 struct register_pass_info insert_pass_mips_machine_reorg2 =
17373 {
17374 new_pass, /* pass */
17375 "dbr", /* reference_pass_name */
17376 1, /* ref_pass_instance_number */
17377 PASS_POS_INSERT_AFTER /* pos_op */
17378 };
17379 register_pass (&insert_pass_mips_machine_reorg2);
17380
17381 if (TARGET_HARD_FLOAT_ABI && TARGET_MIPS5900)
17382 REAL_MODE_FORMAT (SFmode) = &spu_single_format;
17383 }
17384
17385 /* Swap the register information for registers I and I + 1, which
17386 currently have the wrong endianness. Note that the registers'
17387 fixedness and call-clobberedness might have been set on the
17388 command line. */
17389
17390 static void
17391 mips_swap_registers (unsigned int i)
17392 {
17393 int tmpi;
17394 const char *tmps;
17395
17396 #define SWAP_INT(X, Y) (tmpi = (X), (X) = (Y), (Y) = tmpi)
17397 #define SWAP_STRING(X, Y) (tmps = (X), (X) = (Y), (Y) = tmps)
17398
17399 SWAP_INT (fixed_regs[i], fixed_regs[i + 1]);
17400 SWAP_INT (call_used_regs[i], call_used_regs[i + 1]);
17401 SWAP_INT (call_really_used_regs[i], call_really_used_regs[i + 1]);
17402 SWAP_STRING (reg_names[i], reg_names[i + 1]);
17403
17404 #undef SWAP_STRING
17405 #undef SWAP_INT
17406 }
17407
17408 /* Implement TARGET_CONDITIONAL_REGISTER_USAGE. */
17409
17410 static void
17411 mips_conditional_register_usage (void)
17412 {
17413
17414 if (ISA_HAS_DSP)
17415 {
17416 /* These DSP control register fields are global. */
17417 global_regs[CCDSP_PO_REGNUM] = 1;
17418 global_regs[CCDSP_SC_REGNUM] = 1;
17419 }
17420 else
17421 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17422 reg_class_contents[(int) DSP_ACC_REGS]);
17423
17424 if (!TARGET_HARD_FLOAT)
17425 {
17426 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17427 reg_class_contents[(int) FP_REGS]);
17428 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17429 reg_class_contents[(int) ST_REGS]);
17430 }
17431 else if (!ISA_HAS_8CC)
17432 {
17433 /* We only have a single condition-code register. We implement
17434 this by fixing all the condition-code registers and generating
17435 RTL that refers directly to ST_REG_FIRST. */
17436 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17437 reg_class_contents[(int) ST_REGS]);
17438 SET_HARD_REG_BIT (accessible_reg_set, FPSW_REGNUM);
17439 fixed_regs[FPSW_REGNUM] = call_used_regs[FPSW_REGNUM] = 1;
17440 }
17441 if (TARGET_MIPS16)
17442 {
17443 /* In MIPS16 mode, we prohibit the unused $s registers, since they
17444 are call-saved, and saving them via a MIPS16 register would
17445 probably waste more time than just reloading the value.
17446
17447 We permit the $t temporary registers when optimizing for speed
17448 but not when optimizing for space because using them results in
17449 code that is larger (but faster) than not using them. We do
17450 allow $24 (t8) because it is used in CMP and CMPI instructions
17451 and $25 (t9) because it is used as the function call address in
17452 SVR4 PIC code. */
17453
17454 fixed_regs[18] = call_used_regs[18] = 1;
17455 fixed_regs[19] = call_used_regs[19] = 1;
17456 fixed_regs[20] = call_used_regs[20] = 1;
17457 fixed_regs[21] = call_used_regs[21] = 1;
17458 fixed_regs[22] = call_used_regs[22] = 1;
17459 fixed_regs[23] = call_used_regs[23] = 1;
17460 fixed_regs[26] = call_used_regs[26] = 1;
17461 fixed_regs[27] = call_used_regs[27] = 1;
17462 fixed_regs[30] = call_used_regs[30] = 1;
17463 if (optimize_size)
17464 {
17465 fixed_regs[8] = call_used_regs[8] = 1;
17466 fixed_regs[9] = call_used_regs[9] = 1;
17467 fixed_regs[10] = call_used_regs[10] = 1;
17468 fixed_regs[11] = call_used_regs[11] = 1;
17469 fixed_regs[12] = call_used_regs[12] = 1;
17470 fixed_regs[13] = call_used_regs[13] = 1;
17471 fixed_regs[14] = call_used_regs[14] = 1;
17472 fixed_regs[15] = call_used_regs[15] = 1;
17473 }
17474
17475 /* Do not allow HI and LO to be treated as register operands.
17476 There are no MTHI or MTLO instructions (or any real need
17477 for them) and one-way registers cannot easily be reloaded. */
17478 AND_COMPL_HARD_REG_SET (operand_reg_set,
17479 reg_class_contents[(int) MD_REGS]);
17480 }
17481 /* $f20-$f23 are call-clobbered for n64. */
17482 if (mips_abi == ABI_64)
17483 {
17484 int regno;
17485 for (regno = FP_REG_FIRST + 20; regno < FP_REG_FIRST + 24; regno++)
17486 call_really_used_regs[regno] = call_used_regs[regno] = 1;
17487 }
17488 /* Odd registers in the range $f21-$f31 (inclusive) are call-clobbered
17489 for n32. */
17490 if (mips_abi == ABI_N32)
17491 {
17492 int regno;
17493 for (regno = FP_REG_FIRST + 21; regno <= FP_REG_FIRST + 31; regno += 2)
17494 call_really_used_regs[regno] = call_used_regs[regno] = 1;
17495 }
17496 /* Make sure that double-register accumulator values are correctly
17497 ordered for the current endianness. */
17498 if (TARGET_LITTLE_ENDIAN)
17499 {
17500 unsigned int regno;
17501
17502 mips_swap_registers (MD_REG_FIRST);
17503 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno += 2)
17504 mips_swap_registers (regno);
17505 }
17506 }
17507
17508 /* Implement EH_USES. */
17509
17510 bool
17511 mips_eh_uses (unsigned int regno)
17512 {
17513 if (reload_completed && !TARGET_ABSOLUTE_JUMPS)
17514 {
17515 /* We need to force certain registers to be live in order to handle
17516 PIC long branches correctly. See mips_must_initialize_gp_p for
17517 details. */
17518 if (mips_cfun_has_cprestore_slot_p ())
17519 {
17520 if (regno == CPRESTORE_SLOT_REGNUM)
17521 return true;
17522 }
17523 else
17524 {
17525 if (cfun->machine->global_pointer == regno)
17526 return true;
17527 }
17528 }
17529
17530 return false;
17531 }
17532
17533 /* Implement EPILOGUE_USES. */
17534
17535 bool
17536 mips_epilogue_uses (unsigned int regno)
17537 {
17538 /* Say that the epilogue uses the return address register. Note that
17539 in the case of sibcalls, the values "used by the epilogue" are
17540 considered live at the start of the called function. */
17541 if (regno == RETURN_ADDR_REGNUM)
17542 return true;
17543
17544 /* If using a GOT, say that the epilogue also uses GOT_VERSION_REGNUM.
17545 See the comment above load_call<mode> for details. */
17546 if (TARGET_USE_GOT && regno == GOT_VERSION_REGNUM)
17547 return true;
17548
17549 /* An interrupt handler must preserve some registers that are
17550 ordinarily call-clobbered. */
17551 if (cfun->machine->interrupt_handler_p
17552 && mips_interrupt_extra_call_saved_reg_p (regno))
17553 return true;
17554
17555 return false;
17556 }
17557
17558 /* A for_each_rtx callback. Stop the search if *X is an AT register. */
17559
17560 static int
17561 mips_at_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
17562 {
17563 return REG_P (*x) && REGNO (*x) == AT_REGNUM;
17564 }
17565
17566 /* Return true if INSN needs to be wrapped in ".set noat".
17567 INSN has NOPERANDS operands, stored in OPVEC. */
17568
17569 static bool
17570 mips_need_noat_wrapper_p (rtx insn, rtx *opvec, int noperands)
17571 {
17572 int i;
17573
17574 if (recog_memoized (insn) >= 0)
17575 for (i = 0; i < noperands; i++)
17576 if (for_each_rtx (&opvec[i], mips_at_reg_p, NULL))
17577 return true;
17578 return false;
17579 }
17580
17581 /* Implement FINAL_PRESCAN_INSN. */
17582
17583 void
17584 mips_final_prescan_insn (rtx_insn *insn, rtx *opvec, int noperands)
17585 {
17586 if (mips_need_noat_wrapper_p (insn, opvec, noperands))
17587 mips_push_asm_switch (&mips_noat);
17588 }
17589
17590 /* Implement TARGET_ASM_FINAL_POSTSCAN_INSN. */
17591
17592 static void
17593 mips_final_postscan_insn (FILE *file ATTRIBUTE_UNUSED, rtx insn,
17594 rtx *opvec, int noperands)
17595 {
17596 if (mips_need_noat_wrapper_p (insn, opvec, noperands))
17597 mips_pop_asm_switch (&mips_noat);
17598 }
17599
17600 /* Return the function that is used to expand the <u>mulsidi3 pattern.
17601 EXT_CODE is the code of the extension used. Return NULL if widening
17602 multiplication shouldn't be used. */
17603
17604 mulsidi3_gen_fn
17605 mips_mulsidi3_gen_fn (enum rtx_code ext_code)
17606 {
17607 bool signed_p;
17608
17609 signed_p = ext_code == SIGN_EXTEND;
17610 if (TARGET_64BIT)
17611 {
17612 /* Don't use widening multiplication with MULT when we have DMUL. Even
17613 with the extension of its input operands, DMUL is faster. Note that
17614 the extension is not needed for signed multiplication. In order to
17615 ensure that we always remove the redundant sign-extension in this
17616 case we still expand mulsidi3 for DMUL. */
17617 if (ISA_HAS_DMUL3)
17618 return signed_p ? gen_mulsidi3_64bit_dmul : NULL;
17619 if (TARGET_MIPS16)
17620 return (signed_p
17621 ? gen_mulsidi3_64bit_mips16
17622 : gen_umulsidi3_64bit_mips16);
17623 if (TARGET_FIX_R4000)
17624 return NULL;
17625 return signed_p ? gen_mulsidi3_64bit : gen_umulsidi3_64bit;
17626 }
17627 else
17628 {
17629 if (TARGET_MIPS16)
17630 return (signed_p
17631 ? gen_mulsidi3_32bit_mips16
17632 : gen_umulsidi3_32bit_mips16);
17633 if (TARGET_FIX_R4000 && !ISA_HAS_DSP)
17634 return signed_p ? gen_mulsidi3_32bit_r4000 : gen_umulsidi3_32bit_r4000;
17635 return signed_p ? gen_mulsidi3_32bit : gen_umulsidi3_32bit;
17636 }
17637 }
17638
17639 /* Return true if PATTERN matches the kind of instruction generated by
17640 umips_build_save_restore. SAVE_P is true for store. */
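/* Illustrative example (assumed, not from the original source): a SWM
pattern that stores $16, $17 and $31 to consecutive stack slots
builds REGMASK as (1 << 16) | (1 << 17) | (1 << 31), which must
then match one of the canonical register sets in umips_swm_mask. */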
17641
17642 bool
17643 umips_save_restore_pattern_p (bool save_p, rtx pattern)
17644 {
17645 int n;
17646 unsigned int i;
17647 HOST_WIDE_INT first_offset = 0;
17648 rtx first_base = 0;
17649 unsigned int regmask = 0;
17650
17651 for (n = 0; n < XVECLEN (pattern, 0); n++)
17652 {
17653 rtx set, reg, mem, this_base;
17654 HOST_WIDE_INT this_offset;
17655
17656 /* Check that we have a SET. */
17657 set = XVECEXP (pattern, 0, n);
17658 if (GET_CODE (set) != SET)
17659 return false;
17660
17661 /* Check that the SET is a load (if restoring) or a store
17662 (if saving). */
17663 mem = save_p ? SET_DEST (set) : SET_SRC (set);
17664 if (!MEM_P (mem) || MEM_VOLATILE_P (mem))
17665 return false;
17666
17667 /* Check that the address is the sum of base and a possibly-zero
17668 constant offset. Determine if the offset is in range. */
17669 mips_split_plus (XEXP (mem, 0), &this_base, &this_offset);
17670 if (!REG_P (this_base))
17671 return false;
17672
17673 if (n == 0)
17674 {
17675 if (!UMIPS_12BIT_OFFSET_P (this_offset))
17676 return false;
17677 first_base = this_base;
17678 first_offset = this_offset;
17679 }
17680 else
17681 {
17682 /* Check that the save slots are consecutive. */
17683 if (REGNO (this_base) != REGNO (first_base)
17684 || this_offset != first_offset + UNITS_PER_WORD * n)
17685 return false;
17686 }
17687
17688 /* Check that SET's other operand is a register. */
17689 reg = save_p ? SET_SRC (set) : SET_DEST (set);
17690 if (!REG_P (reg))
17691 return false;
17692
17693 regmask |= 1 << REGNO (reg);
17694 }
17695
17696 for (i = 0; i < ARRAY_SIZE (umips_swm_mask); i++)
17697 if (regmask == umips_swm_mask[i])
17698 return true;
17699
17700 return false;
17701 }
17702
17703 /* Return the assembly instruction for microMIPS LWM or SWM.
17704 SAVE_P and PATTERN are as for umips_save_restore_pattern_p. */
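/* Illustrative output (assumed register naming): saving $16-$23, $30
and $31 at offset 16 from the stack pointer would be printed as
"swm $16-$23,$fp,$31,16($sp)". */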
17705
17706 const char *
17707 umips_output_save_restore (bool save_p, rtx pattern)
17708 {
17709 static char buffer[300];
17710 char *s;
17711 int n;
17712 HOST_WIDE_INT offset;
17713 rtx base, mem, set, last_set, last_reg;
17714
17715 /* Parse the pattern. */
17716 gcc_assert (umips_save_restore_pattern_p (save_p, pattern));
17717
17718 s = strcpy (buffer, save_p ? "swm\t" : "lwm\t");
17719 s += strlen (s);
17720 n = XVECLEN (pattern, 0);
17721
17722 set = XVECEXP (pattern, 0, 0);
17723 mem = save_p ? SET_DEST (set) : SET_SRC (set);
17724 mips_split_plus (XEXP (mem, 0), &base, &offset);
17725
17726 last_set = XVECEXP (pattern, 0, n - 1);
17727 last_reg = save_p ? SET_SRC (last_set) : SET_DEST (last_set);
17728
17729 if (REGNO (last_reg) == 31)
17730 n--;
17731
17732 gcc_assert (n <= 9);
17733 if (n == 0)
17734 ;
17735 else if (n == 1)
17736 s += sprintf (s, "%s,", reg_names[16]);
17737 else if (n < 9)
17738 s += sprintf (s, "%s-%s,", reg_names[16], reg_names[15 + n]);
17739 else if (n == 9)
17740 s += sprintf (s, "%s-%s,%s,", reg_names[16], reg_names[23],
17741 reg_names[30]);
17742
17743 if (REGNO (last_reg) == 31)
17744 s += sprintf (s, "%s,", reg_names[31]);
17745
17746 s += sprintf (s, "%d(%s)", (int) offset, reg_names[REGNO (base)]);
17747 return buffer;
17748 }
17749
17750 /* Return true if MEM1 and MEM2 use the same base register, and the
17751 offset of MEM2 equals the offset of MEM1 plus 4. FIRST_REG is the
17752 register into (from) which the contents of MEM1 will be loaded
17753 (stored), depending on the value of LOAD_P.
17754 SWAP_P is true when the 1st and 2nd instructions are swapped. */
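/* Illustrative example (not from the original source): "lw $2,0($4)"
followed by "lw $3,4($4)" passes these checks and is a candidate
for a single "lwp $2,0($4)". */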
17755
17756 static bool
17757 umips_load_store_pair_p_1 (bool load_p, bool swap_p,
17758 rtx first_reg, rtx mem1, rtx mem2)
17759 {
17760 rtx base1, base2;
17761 HOST_WIDE_INT offset1, offset2;
17762
17763 if (!MEM_P (mem1) || !MEM_P (mem2))
17764 return false;
17765
17766 mips_split_plus (XEXP (mem1, 0), &base1, &offset1);
17767 mips_split_plus (XEXP (mem2, 0), &base2, &offset2);
17768
17769 if (!REG_P (base1) || !rtx_equal_p (base1, base2))
17770 return false;
17771
17772 /* Avoid invalid load pair instructions. */
17773 if (load_p && REGNO (first_reg) == REGNO (base1))
17774 return false;
17775
17776 /* We must avoid this case for anti-dependence.
17777 Ex: lw $3, 4($3)
17778 lw $2, 0($3)
17779 first_reg is $2, but the base is $3. */
17780 if (load_p
17781 && swap_p
17782 && REGNO (first_reg) + 1 == REGNO (base1))
17783 return false;
17784
17785 if (offset2 != offset1 + 4)
17786 return false;
17787
17788 if (!UMIPS_12BIT_OFFSET_P (offset1))
17789 return false;
17790
17791 return true;
17792 }
17793
17794 /* OPERANDS describes the operands to a pair of SETs, in the order
17795 dest1, src1, dest2, src2. Return true if the operands can be used
17796 in an LWP or SWP instruction; LOAD_P says which. */
17797
17798 bool
17799 umips_load_store_pair_p (bool load_p, rtx *operands)
17800 {
17801 rtx reg1, reg2, mem1, mem2;
17802
17803 if (load_p)
17804 {
17805 reg1 = operands[0];
17806 reg2 = operands[2];
17807 mem1 = operands[1];
17808 mem2 = operands[3];
17809 }
17810 else
17811 {
17812 reg1 = operands[1];
17813 reg2 = operands[3];
17814 mem1 = operands[0];
17815 mem2 = operands[2];
17816 }
17817
17818 if (REGNO (reg2) == REGNO (reg1) + 1)
17819 return umips_load_store_pair_p_1 (load_p, false, reg1, mem1, mem2);
17820
17821 if (REGNO (reg1) == REGNO (reg2) + 1)
17822 return umips_load_store_pair_p_1 (load_p, true, reg2, mem2, mem1);
17823
17824 return false;
17825 }
17826
17827 /* Output the assembly instruction for a microMIPS LWP or SWP in which
17828 the first register is REG and the first memory slot is MEM.
17829 LOAD_P is true for LWP. */
17830
17831 static void
17832 umips_output_load_store_pair_1 (bool load_p, rtx reg, rtx mem)
17833 {
17834 rtx ops[] = {reg, mem};
17835
17836 if (load_p)
17837 output_asm_insn ("lwp\t%0,%1", ops);
17838 else
17839 output_asm_insn ("swp\t%0,%1", ops);
17840 }
17841
17842 /* Output the assembly instruction for a microMIPS LWP or SWP instruction.
17843 LOAD_P and OPERANDS are as for umips_load_store_pair_p. */
17844
17845 void
17846 umips_output_load_store_pair (bool load_p, rtx *operands)
17847 {
17848 rtx reg1, reg2, mem1, mem2;
17849 if (load_p)
17850 {
17851 reg1 = operands[0];
17852 reg2 = operands[2];
17853 mem1 = operands[1];
17854 mem2 = operands[3];
17855 }
17856 else
17857 {
17858 reg1 = operands[1];
17859 reg2 = operands[3];
17860 mem1 = operands[0];
17861 mem2 = operands[2];
17862 }
17863
17864 if (REGNO (reg2) == REGNO (reg1) + 1)
17865 {
17866 umips_output_load_store_pair_1 (load_p, reg1, mem1);
17867 return;
17868 }
17869
17870 gcc_assert (REGNO (reg1) == REGNO (reg2) + 1);
17871 umips_output_load_store_pair_1 (load_p, reg2, mem2);
17872 }
17873
17874 /* Return true if REG1 and REG2 match the criteria for a movep insn. */
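/* Illustrative example: $5 and $6 give the pair mask
(1 << 5) | (1 << 6) == 0x60, the first entry in MATCH below. */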
17875
17876 bool
17877 umips_movep_target_p (rtx reg1, rtx reg2)
17878 {
17879 int regno1, regno2, pair;
17880 unsigned int i;
17881 static const int match[8] = {
17882 0x00000060, /* 5, 6 */
17883 0x000000a0, /* 5, 7 */
17884 0x000000c0, /* 6, 7 */
17885 0x00200010, /* 4, 21 */
17886 0x00400010, /* 4, 22 */
17887 0x00000030, /* 4, 5 */
17888 0x00000050, /* 4, 6 */
17889 0x00000090 /* 4, 7 */
17890 };
17891
17892 if (!REG_P (reg1) || !REG_P (reg2))
17893 return false;
17894
17895 regno1 = REGNO (reg1);
17896 regno2 = REGNO (reg2);
17897
17898 if (!GP_REG_P (regno1) || !GP_REG_P (regno2))
17899 return false;
17900
17901 pair = (1 << regno1) | (1 << regno2);
17902
17903 for (i = 0; i < ARRAY_SIZE (match); i++)
17904 if (pair == match[i])
17905 return true;
17906
17907 return false;
17908 }
17909 \f
17910 /* Return the size in bytes of the trampoline code, padded to
17911 TRAMPOLINE_ALIGNMENT bits. The static chain pointer and target
17912 function address immediately follow. */
17913
17914 int
17915 mips_trampoline_code_size (void)
17916 {
17917 if (TARGET_USE_PIC_FN_ADDR_REG)
17918 return 4 * 4;
17919 else if (ptr_mode == DImode)
17920 return 8 * 4;
17921 else if (ISA_HAS_LOAD_DELAY)
17922 return 6 * 4;
17923 else
17924 return 4 * 4;
17925 }
17926
17927 /* Implement TARGET_TRAMPOLINE_INIT. */
17928
17929 static void
17930 mips_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value)
17931 {
17932 rtx addr, end_addr, high, low, opcode, mem;
17933 rtx trampoline[8];
17934 unsigned int i, j;
17935 HOST_WIDE_INT end_addr_offset, static_chain_offset, target_function_offset;
17936
17937 /* Work out the offsets of the pointers from the start of the
17938 trampoline code. */
17939 end_addr_offset = mips_trampoline_code_size ();
17940 static_chain_offset = end_addr_offset;
17941 target_function_offset = static_chain_offset + GET_MODE_SIZE (ptr_mode);
17942
17943 /* Get pointers to the beginning and end of the code block. */
17944 addr = force_reg (Pmode, XEXP (m_tramp, 0));
17945 end_addr = mips_force_binary (Pmode, PLUS, addr, GEN_INT (end_addr_offset));
17946
17947 #define OP(X) gen_int_mode (X, SImode)
17948
17949 /* Build up the code in TRAMPOLINE. */
17950 i = 0;
17951 if (TARGET_USE_PIC_FN_ADDR_REG)
17952 {
17953 /* $25 contains the address of the trampoline. Emit code of the form:
17954
17955 l[wd] $1, target_function_offset($25)
17956 l[wd] $static_chain, static_chain_offset($25)
17957 jr $1
17958 move $25,$1. */
17959 trampoline[i++] = OP (MIPS_LOAD_PTR (AT_REGNUM,
17960 target_function_offset,
17961 PIC_FUNCTION_ADDR_REGNUM));
17962 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
17963 static_chain_offset,
17964 PIC_FUNCTION_ADDR_REGNUM));
17965 trampoline[i++] = OP (MIPS_JR (AT_REGNUM));
17966 trampoline[i++] = OP (MIPS_MOVE (PIC_FUNCTION_ADDR_REGNUM, AT_REGNUM));
17967 }
17968 else if (ptr_mode == DImode)
17969 {
17970 /* It's too cumbersome to create the full 64-bit address, so let's
17971 instead use:
17972
17973 move $1, $31
17974 bal 1f
17975 nop
17976 1: l[wd] $25, target_function_offset - 12($31)
17977 l[wd] $static_chain, static_chain_offset - 12($31)
17978 jr $25
17979 move $31, $1
17980
17981 where 12 is the offset of "1:" from the start of the code block. */
17982 trampoline[i++] = OP (MIPS_MOVE (AT_REGNUM, RETURN_ADDR_REGNUM));
17983 trampoline[i++] = OP (MIPS_BAL (1));
17984 trampoline[i++] = OP (MIPS_NOP);
17985 trampoline[i++] = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM,
17986 target_function_offset - 12,
17987 RETURN_ADDR_REGNUM));
17988 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
17989 static_chain_offset - 12,
17990 RETURN_ADDR_REGNUM));
17991 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
17992 trampoline[i++] = OP (MIPS_MOVE (RETURN_ADDR_REGNUM, AT_REGNUM));
17993 }
17994 else
17995 {
17996 /* If the target has load delays, emit:
17997
17998 lui $1, %hi(end_addr)
17999 lw $25, %lo(end_addr + ...)($1)
18000 lw $static_chain, %lo(end_addr + ...)($1)
18001 jr $25
18002 nop
18003
18004 Otherwise emit:
18005
18006 lui $1, %hi(end_addr)
18007 lw $25, %lo(end_addr + ...)($1)
18008 jr $25
18009 lw $static_chain, %lo(end_addr + ...)($1). */
18010
18011 /* Split END_ADDR into %hi and %lo values. Trampolines are aligned
18012 to 64 bits, so the %lo value will have the bottom 3 bits clear. */
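/* Illustrative example of the +0x8000 rounding below: for an
end_addr of 0x10008678, the %lo part 0x8678 sign-extends to a
negative value when used as a load offset, so the %hi part must
round up to 0x1001 rather than truncate to 0x1000. */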
18013 high = expand_simple_binop (SImode, PLUS, end_addr, GEN_INT (0x8000),
18014 NULL, false, OPTAB_WIDEN);
18015 high = expand_simple_binop (SImode, LSHIFTRT, high, GEN_INT (16),
18016 NULL, false, OPTAB_WIDEN);
18017 low = convert_to_mode (SImode, gen_lowpart (HImode, end_addr), true);
18018
18019 /* Emit the LUI. */
18020 opcode = OP (MIPS_LUI (AT_REGNUM, 0));
18021 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, high,
18022 NULL, false, OPTAB_WIDEN);
18023
18024 /* Emit the load of the target function. */
18025 opcode = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM,
18026 target_function_offset - end_addr_offset,
18027 AT_REGNUM));
18028 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low,
18029 NULL, false, OPTAB_WIDEN);
18030
18031 /* Emit the JR here, if we can. */
18032 if (!ISA_HAS_LOAD_DELAY)
18033 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
18034
18035 /* Emit the load of the static chain register. */
18036 opcode = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
18037 static_chain_offset - end_addr_offset,
18038 AT_REGNUM));
18039 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low,
18040 NULL, false, OPTAB_WIDEN);
18041
18042 /* Emit the JR, if we couldn't above. */
18043 if (ISA_HAS_LOAD_DELAY)
18044 {
18045 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
18046 trampoline[i++] = OP (MIPS_NOP);
18047 }
18048 }
18049
18050 #undef OP
18051
18052 /* Copy the trampoline code. Leave any padding uninitialized. */
18053 for (j = 0; j < i; j++)
18054 {
18055 mem = adjust_address (m_tramp, SImode, j * GET_MODE_SIZE (SImode));
18056 mips_emit_move (mem, trampoline[j]);
18057 }
18058
18059 /* Set up the static chain pointer field. */
18060 mem = adjust_address (m_tramp, ptr_mode, static_chain_offset);
18061 mips_emit_move (mem, chain_value);
18062
18063 /* Set up the target function field. */
18064 mem = adjust_address (m_tramp, ptr_mode, target_function_offset);
18065 mips_emit_move (mem, XEXP (DECL_RTL (fndecl), 0));
18066
18067 /* Flush the code part of the trampoline. */
18068 emit_insn (gen_add3_insn (end_addr, addr, GEN_INT (TRAMPOLINE_SIZE)));
18069 emit_insn (gen_clear_cache (addr, end_addr));
18070 }
18071
18072 /* Implement FUNCTION_PROFILER. */
18073
18074 void
mips_function_profiler (FILE *file)
18075 {
18076 if (TARGET_MIPS16)
18077 sorry ("mips16 function profiling");
18078 if (TARGET_LONG_CALLS)
18079 {
18080 /* For TARGET_LONG_CALLS use $3 for the address of _mcount. */
18081 if (Pmode == DImode)
18082 fprintf (file, "\tdla\t%s,_mcount\n", reg_names[3]);
18083 else
18084 fprintf (file, "\tla\t%s,_mcount\n", reg_names[3]);
18085 }
18086 mips_push_asm_switch (&mips_noat);
18087 fprintf (file, "\tmove\t%s,%s\t\t# save current return address\n",
18088 reg_names[AT_REGNUM], reg_names[RETURN_ADDR_REGNUM]);
18089 /* _mcount treats $2 as the static chain register. */
18090 if (cfun->static_chain_decl != NULL)
18091 fprintf (file, "\tmove\t%s,%s\n", reg_names[2],
18092 reg_names[STATIC_CHAIN_REGNUM]);
18093 if (TARGET_MCOUNT_RA_ADDRESS)
18094 {
18095 /* If TARGET_MCOUNT_RA_ADDRESS load $12 with the address of the
18096 ra save location. */
18097 if (cfun->machine->frame.ra_fp_offset == 0)
18098 /* ra not saved, pass zero. */
18099 fprintf (file, "\tmove\t%s,%s\n", reg_names[12], reg_names[0]);
18100 else
18101 fprintf (file, "\t%s\t%s," HOST_WIDE_INT_PRINT_DEC "(%s)\n",
18102 Pmode == DImode ? "dla" : "la", reg_names[12],
18103 cfun->machine->frame.ra_fp_offset,
18104 reg_names[STACK_POINTER_REGNUM]);
18105 }
18106 if (!TARGET_NEWABI)
18107 fprintf (file,
18108 "\t%s\t%s,%s,%d\t\t# _mcount pops 2 words from stack\n",
18109 TARGET_64BIT ? "dsubu" : "subu",
18110 reg_names[STACK_POINTER_REGNUM],
18111 reg_names[STACK_POINTER_REGNUM],
18112 Pmode == DImode ? 16 : 8);
18113
18114 if (TARGET_LONG_CALLS)
18115 fprintf (file, "\tjalr\t%s\n", reg_names[3]);
18116 else
18117 fprintf (file, "\tjal\t_mcount\n");
18118 mips_pop_asm_switch (&mips_noat);
18119 /* _mcount treats $2 as the static chain register. */
18120 if (cfun->static_chain_decl != NULL)
18121 fprintf (file, "\tmove\t%s,%s\n", reg_names[STATIC_CHAIN_REGNUM],
18122 reg_names[2]);
18123 }
18124
18125 /* Implement TARGET_SHIFT_TRUNCATION_MASK. We want to keep the default
18126 behaviour of TARGET_SHIFT_TRUNCATION_MASK for non-vector modes even
18127 when TARGET_LOONGSON_VECTORS is true. */
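/* Illustrative: SImode returns a mask of 31, matching the 5-bit
shift amounts of the scalar ISA, while Loongson vector modes return
0 so that the middle end does not assume shift amounts are
truncated. */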
18128
18129 static unsigned HOST_WIDE_INT
18130 mips_shift_truncation_mask (enum machine_mode mode)
18131 {
18132 if (TARGET_LOONGSON_VECTORS && VECTOR_MODE_P (mode))
18133 return 0;
18134
18135 return GET_MODE_BITSIZE (mode) - 1;
18136 }
18137
18138 /* Implement TARGET_PREPARE_PCH_SAVE. */
18139
18140 static void
18141 mips_prepare_pch_save (void)
18142 {
18143 /* We are called in a context where the current MIPS16 vs. non-MIPS16
18144 setting should be irrelevant. The question then is: which setting
18145 makes most sense at load time?
18146
18147 The PCH is loaded before the first token is read. We should never
18148 have switched into MIPS16 mode by that point, and thus should not
18149 have populated mips16_globals. Nor can we load the entire contents
18150 of mips16_globals from the PCH file, because mips16_globals contains
18151 a combination of GGC and non-GGC data.
18152
18153 There is therefore no point in trying to save the GGC part of
18154 mips16_globals to the PCH file, or to preserve MIPS16ness across
18155 the PCH save and load. The loading compiler would not have access
18156 to the non-GGC parts of mips16_globals (either from the PCH file,
18157 or from a copy that the loading compiler generated itself) and would
18158 have to call target_reinit anyway.
18159
18160 It therefore seems best to switch back to non-MIPS16 mode at
18161 save time, and to ensure that mips16_globals remains null after
18162 a PCH load. */
18163 mips_set_compression_mode (0);
18164 mips16_globals = 0;
18165 }
18166 \f
18167 /* Generate or test for an insn that supports a constant permutation. */
18168
18169 #define MAX_VECT_LEN 8
18170
18171 struct expand_vec_perm_d
18172 {
18173 rtx target, op0, op1;
18174 unsigned char perm[MAX_VECT_LEN];
18175 enum machine_mode vmode;
18176 unsigned char nelt;
18177 bool one_vector_p;
18178 bool testing_p;
18179 };
18180
18181 /* Construct (set target (vec_select op0 (parallel perm))) and
18182 return true if that's a valid instruction in the active ISA. */
18183
18184 static bool
18185 mips_expand_vselect (rtx target, rtx op0,
18186 const unsigned char *perm, unsigned nelt)
18187 {
18188 rtx rperm[MAX_VECT_LEN], x;
18189 unsigned i;
18190
18191 for (i = 0; i < nelt; ++i)
18192 rperm[i] = GEN_INT (perm[i]);
18193
18194 x = gen_rtx_PARALLEL (VOIDmode, gen_rtvec_v (nelt, rperm));
18195 x = gen_rtx_VEC_SELECT (GET_MODE (target), op0, x);
18196 x = gen_rtx_SET (VOIDmode, target, x);
18197
18198 x = emit_insn (x);
18199 if (recog_memoized (x) < 0)
18200 {
18201 remove_insn (x);
18202 return false;
18203 }
18204 return true;
18205 }
18206
18207 /* Similar, but generate a vec_concat from op0 and op1 as well. */
18208
18209 static bool
18210 mips_expand_vselect_vconcat (rtx target, rtx op0, rtx op1,
18211 const unsigned char *perm, unsigned nelt)
18212 {
18213 enum machine_mode v2mode;
18214 rtx x;
18215
18216 v2mode = GET_MODE_2XWIDER_MODE (GET_MODE (op0));
18217 x = gen_rtx_VEC_CONCAT (v2mode, op0, op1);
18218 return mips_expand_vselect (target, x, perm, nelt);
18219 }
18220
18221 /* Recognize patterns for even-odd extraction. */
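/* Illustrative selectors (not from the original source): for a V4HI
pair, an even extraction uses { 0, 2, 4, 6 } and an odd extraction
{ 1, 3, 5, 7 }, i.e. perm[i] == i * 2 + odd. */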
18222
18223 static bool
18224 mips_expand_vpc_loongson_even_odd (struct expand_vec_perm_d *d)
18225 {
18226 unsigned i, odd, nelt = d->nelt;
18227 rtx t0, t1, t2, t3;
18228
18229 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18230 return false;
18231 /* Even-odd for V2SI/V2SFmode is matched by interleave directly. */
18232 if (nelt < 4)
18233 return false;
18234
18235 odd = d->perm[0];
18236 if (odd > 1)
18237 return false;
18238 for (i = 1; i < nelt; ++i)
18239 if (d->perm[i] != i * 2 + odd)
18240 return false;
18241
18242 if (d->testing_p)
18243 return true;
18244
18245 /* We need 2*log2(N)-1 operations to achieve odd/even with interleave. */
18246 t0 = gen_reg_rtx (d->vmode);
18247 t1 = gen_reg_rtx (d->vmode);
18248 switch (d->vmode)
18249 {
18250 case V4HImode:
18251 emit_insn (gen_loongson_punpckhhw (t0, d->op0, d->op1));
18252 emit_insn (gen_loongson_punpcklhw (t1, d->op0, d->op1));
18253 if (odd)
18254 emit_insn (gen_loongson_punpckhhw (d->target, t1, t0));
18255 else
18256 emit_insn (gen_loongson_punpcklhw (d->target, t1, t0));
18257 break;
18258
18259 case V8QImode:
18260 t2 = gen_reg_rtx (d->vmode);
18261 t3 = gen_reg_rtx (d->vmode);
18262 emit_insn (gen_loongson_punpckhbh (t0, d->op0, d->op1));
18263 emit_insn (gen_loongson_punpcklbh (t1, d->op0, d->op1));
18264 emit_insn (gen_loongson_punpckhbh (t2, t1, t0));
18265 emit_insn (gen_loongson_punpcklbh (t3, t1, t0));
18266 if (odd)
18267 emit_insn (gen_loongson_punpckhbh (d->target, t3, t2));
18268 else
18269 emit_insn (gen_loongson_punpcklbh (d->target, t3, t2));
18270 break;
18271
18272 default:
18273 gcc_unreachable ();
18274 }
18275 return true;
18276 }
18277
18278 /* Recognize patterns for the Loongson PSHUFH instruction. */
18279
18280 static bool
18281 mips_expand_vpc_loongson_pshufh (struct expand_vec_perm_d *d)
18282 {
18283 unsigned i, mask;
18284 rtx rmask;
18285
18286 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18287 return false;
18288 if (d->vmode != V4HImode)
18289 return false;
18290 if (d->testing_p)
18291 return true;
18292
18293 /* Convert the selector into the packed 8-bit form for pshufh.
18294 Recall that Loongson is little-endian only, so no big-endian
18295 adjustment is required. */
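/* Illustrative: the identity selector { 0, 1, 2, 3 } packs to
0xe4 (binary 11 10 01 00). */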
18296 for (i = mask = 0; i < 4; i++)
18297 mask |= (d->perm[i] & 3) << (i * 2);
18298 rmask = force_reg (SImode, GEN_INT (mask));
18299
18300 if (d->one_vector_p)
18301 emit_insn (gen_loongson_pshufh (d->target, d->op0, rmask));
18302 else
18303 {
18304 rtx t0, t1, x, merge, rmerge[4];
18305
18306 t0 = gen_reg_rtx (V4HImode);
18307 t1 = gen_reg_rtx (V4HImode);
18308 emit_insn (gen_loongson_pshufh (t1, d->op1, rmask));
18309 emit_insn (gen_loongson_pshufh (t0, d->op0, rmask));
18310
18311 for (i = 0; i < 4; ++i)
18312 rmerge[i] = (d->perm[i] & 4 ? constm1_rtx : const0_rtx);
18313 merge = gen_rtx_CONST_VECTOR (V4HImode, gen_rtvec_v (4, rmerge));
18314 merge = force_reg (V4HImode, merge);
18315
18316 x = gen_rtx_AND (V4HImode, merge, t1);
18317 emit_insn (gen_rtx_SET (VOIDmode, t1, x));
18318
18319 x = gen_rtx_NOT (V4HImode, merge);
18320 x = gen_rtx_AND (V4HImode, x, t0);
18321 emit_insn (gen_rtx_SET (VOIDmode, t0, x));
18322
18323 x = gen_rtx_IOR (V4HImode, t0, t1);
18324 emit_insn (gen_rtx_SET (VOIDmode, d->target, x));
18325 }
18326
18327 return true;
18328 }
18329
18330 /* Recognize broadcast patterns for the Loongson. */
18331
18332 static bool
18333 mips_expand_vpc_loongson_bcast (struct expand_vec_perm_d *d)
18334 {
18335 unsigned i, elt;
18336 rtx t0, t1;
18337
18338 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18339 return false;
18340 /* Note that we've already matched V2SI via punpck and V4HI via pshufh. */
18341 if (d->vmode != V8QImode)
18342 return false;
18343 if (!d->one_vector_p)
18344 return false;
18345
18346 elt = d->perm[0];
18347 for (i = 1; i < 8; ++i)
18348 if (d->perm[i] != elt)
18349 return false;
18350
18351 if (d->testing_p)
18352 return true;
18353
18354 /* With one interleave we put two copies of the desired element adjacent. */
18355 t0 = gen_reg_rtx (V8QImode);
18356 if (elt < 4)
18357 emit_insn (gen_loongson_punpcklbh (t0, d->op0, d->op0));
18358 else
18359 emit_insn (gen_loongson_punpckhbh (t0, d->op0, d->op0));
18360
18361 /* Shuffle that one HImode element into all locations. */
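/* Multiplying by 0x55 (binary 01010101) replicates the 2-bit
selector into all four pshufh fields; e.g. elt == 2 yields the
mask 0xaa, i.e. { 2, 2, 2, 2 }. */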
18362 elt &= 3;
18363 elt *= 0x55;
18364 t1 = gen_reg_rtx (V4HImode);
18365 emit_insn (gen_loongson_pshufh (t1, gen_lowpart (V4HImode, t0),
18366 force_reg (SImode, GEN_INT (elt))));
18367
18368 emit_move_insn (d->target, gen_lowpart (V8QImode, t1));
18369 return true;
18370 }
18371
18372 static bool
18373 mips_expand_vec_perm_const_1 (struct expand_vec_perm_d *d)
18374 {
18375 unsigned int i, nelt = d->nelt;
18376 unsigned char perm2[MAX_VECT_LEN];
18377
18378 if (d->one_vector_p)
18379 {
18380 /* Try interleave with alternating operands. */
18381 memcpy (perm2, d->perm, sizeof (perm2));
18382 for (i = 1; i < nelt; i += 2)
18383 perm2[i] += nelt;
18384 if (mips_expand_vselect_vconcat (d->target, d->op0, d->op1, perm2, nelt))
18385 return true;
18386 }
18387 else
18388 {
18389 if (mips_expand_vselect_vconcat (d->target, d->op0, d->op1,
18390 d->perm, nelt))
18391 return true;
18392
18393 /* Try again with swapped operands. */
18394 for (i = 0; i < nelt; ++i)
18395 perm2[i] = (d->perm[i] + nelt) & (2 * nelt - 1);
18396 if (mips_expand_vselect_vconcat (d->target, d->op1, d->op0, perm2, nelt))
18397 return true;
18398 }
18399
18400 if (mips_expand_vpc_loongson_even_odd (d))
18401 return true;
18402 if (mips_expand_vpc_loongson_pshufh (d))
18403 return true;
18404 if (mips_expand_vpc_loongson_bcast (d))
18405 return true;
18406 return false;
18407 }
18408
18409 /* Expand a vec_perm_const pattern. */
18410
18411 bool
18412 mips_expand_vec_perm_const (rtx operands[4])
18413 {
18414 struct expand_vec_perm_d d;
18415 int i, nelt, which;
18416 unsigned char orig_perm[MAX_VECT_LEN];
18417 rtx sel;
18418 bool ok;
18419
18420 d.target = operands[0];
18421 d.op0 = operands[1];
18422 d.op1 = operands[2];
18423 sel = operands[3];
18424
18425 d.vmode = GET_MODE (d.target);
18426 gcc_assert (VECTOR_MODE_P (d.vmode));
18427 d.nelt = nelt = GET_MODE_NUNITS (d.vmode);
18428 d.testing_p = false;
18429
18430 for (i = which = 0; i < nelt; ++i)
18431 {
18432 rtx e = XVECEXP (sel, 0, i);
18433 int ei = INTVAL (e) & (2 * nelt - 1);
18434 which |= (ei < nelt ? 1 : 2);
18435 orig_perm[i] = ei;
18436 }
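/* WHICH is now a bitmask: bit 0 is set if any selector element refers
to the first input and bit 1 if any refers to the second. E.g.
(illustrative) the V4HI selector { 0, 5, 2, 7 } gives WHICH == 3. */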
18437 memcpy (d.perm, orig_perm, MAX_VECT_LEN);
18438
18439 switch (which)
18440 {
18441 default:
18442 gcc_unreachable ();
18443
18444 case 3:
18445 d.one_vector_p = false;
18446 if (!rtx_equal_p (d.op0, d.op1))
18447 break;
18448 /* FALLTHRU */
18449
18450 case 2:
18451 for (i = 0; i < nelt; ++i)
18452 d.perm[i] &= nelt - 1;
18453 d.op0 = d.op1;
18454 d.one_vector_p = true;
18455 break;
18456
18457 case 1:
18458 d.op1 = d.op0;
18459 d.one_vector_p = true;
18460 break;
18461 }
18462
18463 ok = mips_expand_vec_perm_const_1 (&d);
18464
18465 /* If we were given a two-vector permutation which just happened to
18466 have both input vectors equal, we folded this into a one-vector
18467 permutation. There are several loongson patterns that are matched
18468 via direct vec_select+vec_concat expansion, but we do not have
18469 support in mips_expand_vec_perm_const_1 to guess the adjustment
18470 that should be made for a single operand. Just try again with
18471 the original permutation. */
18472 if (!ok && which == 3)
18473 {
18474 d.op0 = operands[1];
18475 d.op1 = operands[2];
18476 d.one_vector_p = false;
18477 memcpy (d.perm, orig_perm, MAX_VECT_LEN);
18478 ok = mips_expand_vec_perm_const_1 (&d);
18479 }
18480
18481 return ok;
18482 }
18483
18484 /* Implement TARGET_VECTORIZE_VEC_PERM_CONST_OK. */
18485
18486 static bool
18487 mips_vectorize_vec_perm_const_ok (enum machine_mode vmode,
18488 const unsigned char *sel)
18489 {
18490 struct expand_vec_perm_d d;
18491 unsigned int i, nelt, which;
18492 bool ret;
18493
18494 d.vmode = vmode;
18495 d.nelt = nelt = GET_MODE_NUNITS (d.vmode);
18496 d.testing_p = true;
18497 memcpy (d.perm, sel, nelt);
18498
18499 /* Categorize the set of elements in the selector. */
18500 for (i = which = 0; i < nelt; ++i)
18501 {
18502 unsigned char e = d.perm[i];
18503 gcc_assert (e < 2 * nelt);
18504 which |= (e < nelt ? 1 : 2);
18505 }
18506
18507 /* If all elements come from the second vector, fold them onto the first. */
18508 if (which == 2)
18509 for (i = 0; i < nelt; ++i)
18510 d.perm[i] -= nelt;
18511
18512 /* Check whether the mask can be applied to the vector type. */
18513 d.one_vector_p = (which != 3);
18514
18515 d.target = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 1);
18516 d.op1 = d.op0 = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 2);
18517 if (!d.one_vector_p)
18518 d.op1 = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 3);
18519
18520 start_sequence ();
18521 ret = mips_expand_vec_perm_const_1 (&d);
18522 end_sequence ();
18523
18524 return ret;
18525 }
18526
18527 /* Expand an integral vector unpack operation. */
18528
18529 void
18530 mips_expand_vec_unpack (rtx operands[2], bool unsigned_p, bool high_p)
18531 {
18532 enum machine_mode imode = GET_MODE (operands[1]);
18533 rtx (*unpack) (rtx, rtx, rtx);
18534 rtx (*cmpgt) (rtx, rtx, rtx);
18535 rtx tmp, dest, zero;
18536
18537 switch (imode)
18538 {
18539 case V8QImode:
18540 if (high_p)
18541 unpack = gen_loongson_punpckhbh;
18542 else
18543 unpack = gen_loongson_punpcklbh;
18544 cmpgt = gen_loongson_pcmpgtb;
18545 break;
18546 case V4HImode:
18547 if (high_p)
18548 unpack = gen_loongson_punpckhhw;
18549 else
18550 unpack = gen_loongson_punpcklhw;
18551 cmpgt = gen_loongson_pcmpgth;
18552 break;
18553 default:
18554 gcc_unreachable ();
18555 }
18556
18557 zero = force_reg (imode, CONST0_RTX (imode));
18558 if (unsigned_p)
18559 tmp = zero;
18560 else
18561 {
18562 tmp = gen_reg_rtx (imode);
18563 emit_insn (cmpgt (tmp, zero, operands[1]));
18564 }
18565
18566 dest = gen_reg_rtx (imode);
18567 emit_insn (unpack (dest, operands[1], tmp));
18568
18569 emit_move_insn (operands[0], gen_lowpart (GET_MODE (operands[0]), dest));
18570 }
18571
18572 /* A subroutine of mips_expand_vec_init, match constant vector elements. */
18573
18574 static inline bool
18575 mips_constant_elt_p (rtx x)
18576 {
18577 return CONST_INT_P (x) || GET_CODE (x) == CONST_DOUBLE;
18578 }
18579
18580 /* A subroutine of mips_expand_vec_init, expand via broadcast. */
18581
18582 static void
18583 mips_expand_vi_broadcast (enum machine_mode vmode, rtx target, rtx elt)
18584 {
18585 struct expand_vec_perm_d d;
18586 rtx t1;
18587 bool ok;
18588
18589 if (elt != const0_rtx)
18590 elt = force_reg (GET_MODE_INNER (vmode), elt);
18591 if (REG_P (elt))
18592 elt = gen_lowpart (DImode, elt);
18593
18594 t1 = gen_reg_rtx (vmode);
18595 switch (vmode)
18596 {
18597 case V8QImode:
18598 emit_insn (gen_loongson_vec_init1_v8qi (t1, elt));
18599 break;
18600 case V4HImode:
18601 emit_insn (gen_loongson_vec_init1_v4hi (t1, elt));
18602 break;
18603 default:
18604 gcc_unreachable ();
18605 }
18606
18607 memset (&d, 0, sizeof (d));
18608 d.target = target;
18609 d.op0 = t1;
18610 d.op1 = t1;
18611 d.vmode = vmode;
18612 d.nelt = GET_MODE_NUNITS (vmode);
18613 d.one_vector_p = true;
18614
18615 ok = mips_expand_vec_perm_const_1 (&d);
18616 gcc_assert (ok);
18617 }
18618
18619 /* A subroutine of mips_expand_vec_init, replacing all of the non-constant
18620 elements of VALS with zeros, copy the constant vector to TARGET. */
18621
18622 static void
18623 mips_expand_vi_constant (enum machine_mode vmode, unsigned nelt,
18624 rtx target, rtx vals)
18625 {
18626 rtvec vec = shallow_copy_rtvec (XVEC (vals, 0));
18627 unsigned i;
18628
18629 for (i = 0; i < nelt; ++i)
18630 {
18631 if (!mips_constant_elt_p (RTVEC_ELT (vec, i)))
18632 RTVEC_ELT (vec, i) = const0_rtx;
18633 }
18634
18635 emit_move_insn (target, gen_rtx_CONST_VECTOR (vmode, vec));
18636 }
18637
18638
18639 /* A subroutine of mips_expand_vec_init, expand via pinsrh. */
18640
18641 static void
18642 mips_expand_vi_loongson_one_pinsrh (rtx target, rtx vals, unsigned one_var)
18643 {
18644 mips_expand_vi_constant (V4HImode, 4, target, vals);
18645
18646 emit_insn (gen_vec_setv4hi (target, target, XVECEXP (vals, 0, one_var),
18647 GEN_INT (one_var)));
18648 }
18649
18650 /* A subroutine of mips_expand_vec_init, expand anything via memory. */
18651
18652 static void
18653 mips_expand_vi_general (enum machine_mode vmode, enum machine_mode imode,
18654 unsigned nelt, unsigned nvar, rtx target, rtx vals)
18655 {
18656 rtx mem = assign_stack_temp (vmode, GET_MODE_SIZE (vmode));
18657 unsigned int i, isize = GET_MODE_SIZE (imode);
18658
18659 if (nvar < nelt)
18660 mips_expand_vi_constant (vmode, nelt, mem, vals);
18661
18662 for (i = 0; i < nelt; ++i)
18663 {
18664 rtx x = XVECEXP (vals, 0, i);
18665 if (!mips_constant_elt_p (x))
18666 emit_move_insn (adjust_address (mem, imode, i * isize), x);
18667 }
18668
18669 emit_move_insn (target, mem);
18670 }
18671
18672 /* Expand a vector initialization. */
18673
18674 void
18675 mips_expand_vector_init (rtx target, rtx vals)
18676 {
18677 enum machine_mode vmode = GET_MODE (target);
18678 enum machine_mode imode = GET_MODE_INNER (vmode);
18679 unsigned i, nelt = GET_MODE_NUNITS (vmode);
18680 unsigned nvar = 0, one_var = -1u;
18681 bool all_same = true;
18682 rtx x;
18683
18684 for (i = 0; i < nelt; ++i)
18685 {
18686 x = XVECEXP (vals, 0, i);
18687 if (!mips_constant_elt_p (x))
18688 nvar++, one_var = i;
18689 if (i > 0 && !rtx_equal_p (x, XVECEXP (vals, 0, 0)))
18690 all_same = false;
18691 }
18692
18693 /* All-constant vector: load it in one go from the pool, or whatever's handy. */
18694 if (nvar == 0)
18695 {
18696 emit_move_insn (target, gen_rtx_CONST_VECTOR (vmode, XVEC (vals, 0)));
18697 return;
18698 }
18699
18700 /* For two-part initialization, always use CONCAT. */
18701 if (nelt == 2)
18702 {
18703 rtx op0 = force_reg (imode, XVECEXP (vals, 0, 0));
18704 rtx op1 = force_reg (imode, XVECEXP (vals, 0, 1));
18705 x = gen_rtx_VEC_CONCAT (vmode, op0, op1);
18706 emit_insn (gen_rtx_SET (VOIDmode, target, x));
18707 return;
18708 }
18709
18710 /* Loongson is the only CPU with vectors of more than two elements. */
18711 gcc_assert (TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS);
18712
18713 /* If all values are identical, broadcast the value. */
18714 if (all_same)
18715 {
18716 mips_expand_vi_broadcast (vmode, target, XVECEXP (vals, 0, 0));
18717 return;
18718 }
18719
18720 /* If only one element of a V4HImode vector is non-constant, use PINSRH. */
18721 if (nvar == 1 && vmode == V4HImode)
18722 {
18723 mips_expand_vi_loongson_one_pinsrh (target, vals, one_var);
18724 return;
18725 }
18726
18727 mips_expand_vi_general (vmode, imode, nelt, nvar, target, vals);
18728 }
18729
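/* Examples of the strategies chosen above, for V4HImode with variable
   elements X and Y:

     { 1, 2, 3, 4 } - all constant, loaded as one constant vector;
     { X, X, X, X } - broadcast of element 0;
     { X, 1, 2, 3 } - constant background plus a single PINSRH;
     { X, Y, 1, 2 } - built in a stack temporary and reloaded.

   Two-element modes such as V2SImode always go through VEC_CONCAT.  */
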
18730 /* Expand a vector reduction. */
18731
18732 void
18733 mips_expand_vec_reduc (rtx target, rtx in, rtx (*gen)(rtx, rtx, rtx))
18734 {
18735 enum machine_mode vmode = GET_MODE (in);
18736 unsigned char perm2[2];
18737 rtx last, next, fold, x;
18738 bool ok;
18739
18740 last = in;
18741 fold = gen_reg_rtx (vmode);
18742 switch (vmode)
18743 {
18744 case V2SFmode:
18745 /* Use PUL/PLU to produce { L, H } op { H, L }.
18746 By reversing the pair order, rather than a pure interleave high,
18747 we avoid erroneous exceptional conditions that we might otherwise
18748 produce from the computation of H op H. */
18749 perm2[0] = 1;
18750 perm2[1] = 2;
18751 ok = mips_expand_vselect_vconcat (fold, last, last, perm2, 2);
18752 gcc_assert (ok);
18753 break;
18754
18755 case V2SImode:
18756 /* Use interleave to produce { L, H } op { H, H }. */
18757 emit_insn (gen_loongson_punpckhwd (fold, last, last));
18758 break;
18759
18760 case V4HImode:
18761 /* Perform the first reduction with interleave,
18762 and subsequent reductions with shifts. */
18763 emit_insn (gen_loongson_punpckhwd_hi (fold, last, last));
18764
18765 next = gen_reg_rtx (vmode);
18766 emit_insn (gen (next, last, fold));
18767 last = next;
18768
18769 fold = gen_reg_rtx (vmode);
18770 x = force_reg (SImode, GEN_INT (16));
18771 emit_insn (gen_vec_shr_v4hi (fold, last, x));
18772 break;
18773
18774 case V8QImode:
18775 emit_insn (gen_loongson_punpckhwd_qi (fold, last, last));
18776
18777 next = gen_reg_rtx (vmode);
18778 emit_insn (gen (next, last, fold));
18779 last = next;
18780
18781 fold = gen_reg_rtx (vmode);
18782 x = force_reg (SImode, GEN_INT (16));
18783 emit_insn (gen_vec_shr_v8qi (fold, last, x));
18784
18785 next = gen_reg_rtx (vmode);
18786 emit_insn (gen (next, last, fold));
18787 last = next;
18788
18789 fold = gen_reg_rtx (vmode);
18790 x = force_reg (SImode, GEN_INT (8));
18791 emit_insn (gen_vec_shr_v8qi (fold, last, x));
18792 break;
18793
18794 default:
18795 gcc_unreachable ();
18796 }
18797
18798 emit_insn (gen (target, last, fold));
18799 }
18800
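/* A scalar sketch of the V4HImode schedule above: the interleave pairs
   each low lane with the corresponding high lane, and the 16-bit
   whole-register shift then lines up the two partial results.  Only
   element 0 of TARGET ends up holding the full reduction.  OP stands
   for the generator passed as GEN and is assumed to be associative and
   commutative; the helper is illustrative only.  */

static unsigned short
mips_reduc_v4hi_sketch (const unsigned short lane[4],
			unsigned short (*op) (unsigned short, unsigned short))
{
  /* Step 1: combine the lanes paired by the interleave.  */
  unsigned short a = op (lane[0], lane[2]);
  unsigned short b = op (lane[1], lane[3]);
  /* Step 2: combine the partial results lined up by the shift.  */
  return op (a, b);
}
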
18801 /* Expand a vector minimum/maximum. */
18802
18803 void
18804 mips_expand_vec_minmax (rtx target, rtx op0, rtx op1,
18805 rtx (*cmp) (rtx, rtx, rtx), bool min_p)
18806 {
18807 enum machine_mode vmode = GET_MODE (target);
18808 rtx tc, t0, t1, x;
18809
18810 tc = gen_reg_rtx (vmode);
18811 t0 = gen_reg_rtx (vmode);
18812 t1 = gen_reg_rtx (vmode);
18813
18814 /* tc = per-element mask: all ones where op0 > op1, all zeros elsewhere. */
18815 emit_insn (cmp (tc, op0, op1));
18816
18817 x = gen_rtx_AND (vmode, tc, (min_p ? op1 : op0));
18818 emit_insn (gen_rtx_SET (VOIDmode, t0, x));
18819
18820 x = gen_rtx_NOT (vmode, tc);
18821 x = gen_rtx_AND (vmode, x, (min_p ? op0 : op1));
18822 emit_insn (gen_rtx_SET (VOIDmode, t1, x));
18823
18824 x = gen_rtx_IOR (vmode, t0, t1);
18825 emit_insn (gen_rtx_SET (VOIDmode, target, x));
18826 }
18827
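/* A scalar sketch of one 32-bit lane of the select idiom above: the
   comparison yields an all-ones or all-zeros mask TC, and the result
   is (TC & winner) | (~TC & loser).  The helper is illustrative only.  */

static unsigned int
mips_minmax_lane_sketch (unsigned int a, unsigned int b, bool min_p)
{
  unsigned int tc = a > b ? 0xffffffffu : 0;	/* pcmpgt-style mask.  */
  unsigned int t0 = tc & (min_p ? b : a);	/* lanes where a > b.  */
  unsigned int t1 = ~tc & (min_p ? a : b);	/* lanes where a <= b.  */
  return t0 | t1;
}
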
18828 /* Implement TARGET_CASE_VALUES_THRESHOLD. */
18829
18830 unsigned int
18831 mips_case_values_threshold (void)
18832 {
18833 /* In MIPS16 mode, using a larger case threshold generates smaller code. */
18834 if (TARGET_MIPS16 && optimize_size)
18835 return 10;
18836 else
18837 return default_case_values_threshold ();
18838 }
18839
18840 /* Implement TARGET_ATOMIC_ASSIGN_EXPAND_FENV. */
18841
18842 static void
18843 mips_atomic_assign_expand_fenv (tree *hold, tree *clear, tree *update)
18844 {
18845 if (!TARGET_HARD_FLOAT_ABI)
18846 return;
18847 tree exceptions_var = create_tmp_var (MIPS_ATYPE_USI, NULL);
18848 tree fcsr_orig_var = create_tmp_var (MIPS_ATYPE_USI, NULL);
18849 tree fcsr_mod_var = create_tmp_var (MIPS_ATYPE_USI, NULL);
18850 tree get_fcsr = mips_builtin_decls[MIPS_GET_FCSR];
18851 tree set_fcsr = mips_builtin_decls[MIPS_SET_FCSR];
18852 tree get_fcsr_hold_call = build_call_expr (get_fcsr, 0);
18853 tree hold_assign_orig = build2 (MODIFY_EXPR, MIPS_ATYPE_USI,
18854 fcsr_orig_var, get_fcsr_hold_call);
18855 tree hold_mod_val = build2 (BIT_AND_EXPR, MIPS_ATYPE_USI, fcsr_orig_var,
18856 build_int_cst (MIPS_ATYPE_USI, 0xfffff003));
18857 tree hold_assign_mod = build2 (MODIFY_EXPR, MIPS_ATYPE_USI,
18858 fcsr_mod_var, hold_mod_val);
18859 tree set_fcsr_hold_call = build_call_expr (set_fcsr, 1, fcsr_mod_var);
18860 tree hold_all = build2 (COMPOUND_EXPR, MIPS_ATYPE_USI,
18861 hold_assign_orig, hold_assign_mod);
18862 *hold = build2 (COMPOUND_EXPR, void_type_node, hold_all,
18863 set_fcsr_hold_call);
18864
18865 *clear = build_call_expr (set_fcsr, 1, fcsr_mod_var);
18866
18867 tree get_fcsr_update_call = build_call_expr (get_fcsr, 0);
18868 *update = build2 (MODIFY_EXPR, MIPS_ATYPE_USI,
18869 exceptions_var, get_fcsr_update_call);
18870 tree set_fcsr_update_call = build_call_expr (set_fcsr, 1, fcsr_orig_var);
18871 *update = build2 (COMPOUND_EXPR, void_type_node, *update,
18872 set_fcsr_update_call);
18873 tree atomic_feraiseexcept
18874 = builtin_decl_implicit (BUILT_IN_ATOMIC_FERAISEEXCEPT);
18875 tree int_exceptions_var = fold_convert (integer_type_node,
18876 exceptions_var);
18877 tree atomic_feraiseexcept_call = build_call_expr (atomic_feraiseexcept,
18878 1, int_exceptions_var);
18879 *update = build2 (COMPOUND_EXPR, void_type_node, *update,
18880 atomic_feraiseexcept_call);
18881 }
18882
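/* The trees built above correspond to roughly the following C sequence,
   where get_fcsr/set_fcsr stand for the MIPS_GET_FCSR/MIPS_SET_FCSR
   builtins and the mask 0xfffff003 clears the FCSR flag bits (6:2) and
   enable bits (11:7):

     hold:    fcsr_orig = get_fcsr ();
	      fcsr_mod = fcsr_orig & 0xfffff003;
	      set_fcsr (fcsr_mod);
     clear:   set_fcsr (fcsr_mod);
     update:  exceptions = get_fcsr ();
	      set_fcsr (fcsr_orig);
	      __atomic_feraiseexcept ((int) exceptions);  */
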
18883 /* Implement TARGET_SPILL_CLASS. */
18884
18885 static reg_class_t
18886 mips_spill_class (reg_class_t rclass ATTRIBUTE_UNUSED,
18887 enum machine_mode mode ATTRIBUTE_UNUSED)
18888 {
18889 if (TARGET_MIPS16)
18890 return SPILL_REGS;
18891 return NO_REGS;
18892 }
18893
18894 /* Implement TARGET_LRA_P. */
18895
18896 static bool
18897 mips_lra_p (void)
18898 {
18899 return mips_lra_flag;
18900 }
18901 \f
18902 /* Initialize the GCC target structure. */
18903 #undef TARGET_ASM_ALIGNED_HI_OP
18904 #define TARGET_ASM_ALIGNED_HI_OP "\t.half\t"
18905 #undef TARGET_ASM_ALIGNED_SI_OP
18906 #define TARGET_ASM_ALIGNED_SI_OP "\t.word\t"
18907 #undef TARGET_ASM_ALIGNED_DI_OP
18908 #define TARGET_ASM_ALIGNED_DI_OP "\t.dword\t"
18909
18910 #undef TARGET_OPTION_OVERRIDE
18911 #define TARGET_OPTION_OVERRIDE mips_option_override
18912
18913 #undef TARGET_LEGITIMIZE_ADDRESS
18914 #define TARGET_LEGITIMIZE_ADDRESS mips_legitimize_address
18915
18916 #undef TARGET_ASM_FUNCTION_PROLOGUE
18917 #define TARGET_ASM_FUNCTION_PROLOGUE mips_output_function_prologue
18918 #undef TARGET_ASM_FUNCTION_EPILOGUE
18919 #define TARGET_ASM_FUNCTION_EPILOGUE mips_output_function_epilogue
18920 #undef TARGET_ASM_SELECT_RTX_SECTION
18921 #define TARGET_ASM_SELECT_RTX_SECTION mips_select_rtx_section
18922 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
18923 #define TARGET_ASM_FUNCTION_RODATA_SECTION mips_function_rodata_section
18924
18925 #undef TARGET_SCHED_INIT
18926 #define TARGET_SCHED_INIT mips_sched_init
18927 #undef TARGET_SCHED_REORDER
18928 #define TARGET_SCHED_REORDER mips_sched_reorder
18929 #undef TARGET_SCHED_REORDER2
18930 #define TARGET_SCHED_REORDER2 mips_sched_reorder2
18931 #undef TARGET_SCHED_VARIABLE_ISSUE
18932 #define TARGET_SCHED_VARIABLE_ISSUE mips_variable_issue
18933 #undef TARGET_SCHED_ADJUST_COST
18934 #define TARGET_SCHED_ADJUST_COST mips_adjust_cost
18935 #undef TARGET_SCHED_ISSUE_RATE
18936 #define TARGET_SCHED_ISSUE_RATE mips_issue_rate
18937 #undef TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN
18938 #define TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN mips_init_dfa_post_cycle_insn
18939 #undef TARGET_SCHED_DFA_POST_ADVANCE_CYCLE
18940 #define TARGET_SCHED_DFA_POST_ADVANCE_CYCLE mips_dfa_post_advance_cycle
18941 #undef TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD
18942 #define TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD \
18943 mips_multipass_dfa_lookahead
18944 #undef TARGET_SMALL_REGISTER_CLASSES_FOR_MODE_P
18945 #define TARGET_SMALL_REGISTER_CLASSES_FOR_MODE_P \
18946 mips_small_register_classes_for_mode_p
18947
18948 #undef TARGET_FUNCTION_OK_FOR_SIBCALL
18949 #define TARGET_FUNCTION_OK_FOR_SIBCALL mips_function_ok_for_sibcall
18950
18951 #undef TARGET_INSERT_ATTRIBUTES
18952 #define TARGET_INSERT_ATTRIBUTES mips_insert_attributes
18953 #undef TARGET_MERGE_DECL_ATTRIBUTES
18954 #define TARGET_MERGE_DECL_ATTRIBUTES mips_merge_decl_attributes
18955 #undef TARGET_CAN_INLINE_P
18956 #define TARGET_CAN_INLINE_P mips_can_inline_p
18957 #undef TARGET_SET_CURRENT_FUNCTION
18958 #define TARGET_SET_CURRENT_FUNCTION mips_set_current_function
18959
18960 #undef TARGET_VALID_POINTER_MODE
18961 #define TARGET_VALID_POINTER_MODE mips_valid_pointer_mode
18962 #undef TARGET_REGISTER_MOVE_COST
18963 #define TARGET_REGISTER_MOVE_COST mips_register_move_cost
18964 #undef TARGET_REGISTER_PRIORITY
18965 #define TARGET_REGISTER_PRIORITY mips_register_priority
18966 #undef TARGET_MEMORY_MOVE_COST
18967 #define TARGET_MEMORY_MOVE_COST mips_memory_move_cost
18968 #undef TARGET_RTX_COSTS
18969 #define TARGET_RTX_COSTS mips_rtx_costs
18970 #undef TARGET_ADDRESS_COST
18971 #define TARGET_ADDRESS_COST mips_address_cost
18972
18973 #undef TARGET_IN_SMALL_DATA_P
18974 #define TARGET_IN_SMALL_DATA_P mips_in_small_data_p
18975
18976 #undef TARGET_MACHINE_DEPENDENT_REORG
18977 #define TARGET_MACHINE_DEPENDENT_REORG mips_reorg
18978
18979 #undef TARGET_PREFERRED_RELOAD_CLASS
18980 #define TARGET_PREFERRED_RELOAD_CLASS mips_preferred_reload_class
18981
18982 #undef TARGET_EXPAND_TO_RTL_HOOK
18983 #define TARGET_EXPAND_TO_RTL_HOOK mips_expand_to_rtl_hook
18984 #undef TARGET_ASM_FILE_START
18985 #define TARGET_ASM_FILE_START mips_file_start
18986 #undef TARGET_ASM_FILE_START_FILE_DIRECTIVE
18987 #define TARGET_ASM_FILE_START_FILE_DIRECTIVE true
18988 #undef TARGET_ASM_CODE_END
18989 #define TARGET_ASM_CODE_END mips_code_end
18990
18991 #undef TARGET_INIT_LIBFUNCS
18992 #define TARGET_INIT_LIBFUNCS mips_init_libfuncs
18993
18994 #undef TARGET_BUILD_BUILTIN_VA_LIST
18995 #define TARGET_BUILD_BUILTIN_VA_LIST mips_build_builtin_va_list
18996 #undef TARGET_EXPAND_BUILTIN_VA_START
18997 #define TARGET_EXPAND_BUILTIN_VA_START mips_va_start
18998 #undef TARGET_GIMPLIFY_VA_ARG_EXPR
18999 #define TARGET_GIMPLIFY_VA_ARG_EXPR mips_gimplify_va_arg_expr
19000
19001 #undef TARGET_PROMOTE_FUNCTION_MODE
19002 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
19003 #undef TARGET_PROMOTE_PROTOTYPES
19004 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
19005
19006 #undef TARGET_FUNCTION_VALUE
19007 #define TARGET_FUNCTION_VALUE mips_function_value
19008 #undef TARGET_LIBCALL_VALUE
19009 #define TARGET_LIBCALL_VALUE mips_libcall_value
19010 #undef TARGET_FUNCTION_VALUE_REGNO_P
19011 #define TARGET_FUNCTION_VALUE_REGNO_P mips_function_value_regno_p
19012 #undef TARGET_RETURN_IN_MEMORY
19013 #define TARGET_RETURN_IN_MEMORY mips_return_in_memory
19014 #undef TARGET_RETURN_IN_MSB
19015 #define TARGET_RETURN_IN_MSB mips_return_in_msb
19016
19017 #undef TARGET_ASM_OUTPUT_MI_THUNK
19018 #define TARGET_ASM_OUTPUT_MI_THUNK mips_output_mi_thunk
19019 #undef TARGET_ASM_CAN_OUTPUT_MI_THUNK
19020 #define TARGET_ASM_CAN_OUTPUT_MI_THUNK hook_bool_const_tree_hwi_hwi_const_tree_true
19021
19022 #undef TARGET_PRINT_OPERAND
19023 #define TARGET_PRINT_OPERAND mips_print_operand
19024 #undef TARGET_PRINT_OPERAND_ADDRESS
19025 #define TARGET_PRINT_OPERAND_ADDRESS mips_print_operand_address
19026 #undef TARGET_PRINT_OPERAND_PUNCT_VALID_P
19027 #define TARGET_PRINT_OPERAND_PUNCT_VALID_P mips_print_operand_punct_valid_p
19028
19029 #undef TARGET_SETUP_INCOMING_VARARGS
19030 #define TARGET_SETUP_INCOMING_VARARGS mips_setup_incoming_varargs
19031 #undef TARGET_STRICT_ARGUMENT_NAMING
19032 #define TARGET_STRICT_ARGUMENT_NAMING mips_strict_argument_naming
19033 #undef TARGET_MUST_PASS_IN_STACK
19034 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
19035 #undef TARGET_PASS_BY_REFERENCE
19036 #define TARGET_PASS_BY_REFERENCE mips_pass_by_reference
19037 #undef TARGET_CALLEE_COPIES
19038 #define TARGET_CALLEE_COPIES mips_callee_copies
19039 #undef TARGET_ARG_PARTIAL_BYTES
19040 #define TARGET_ARG_PARTIAL_BYTES mips_arg_partial_bytes
19041 #undef TARGET_FUNCTION_ARG
19042 #define TARGET_FUNCTION_ARG mips_function_arg
19043 #undef TARGET_FUNCTION_ARG_ADVANCE
19044 #define TARGET_FUNCTION_ARG_ADVANCE mips_function_arg_advance
19045 #undef TARGET_FUNCTION_ARG_BOUNDARY
19046 #define TARGET_FUNCTION_ARG_BOUNDARY mips_function_arg_boundary
19047
19048 #undef TARGET_MODE_REP_EXTENDED
19049 #define TARGET_MODE_REP_EXTENDED mips_mode_rep_extended
19050
19051 #undef TARGET_VECTOR_MODE_SUPPORTED_P
19052 #define TARGET_VECTOR_MODE_SUPPORTED_P mips_vector_mode_supported_p
19053
19054 #undef TARGET_SCALAR_MODE_SUPPORTED_P
19055 #define TARGET_SCALAR_MODE_SUPPORTED_P mips_scalar_mode_supported_p
19056
19057 #undef TARGET_VECTORIZE_PREFERRED_SIMD_MODE
19058 #define TARGET_VECTORIZE_PREFERRED_SIMD_MODE mips_preferred_simd_mode
19059
19060 #undef TARGET_INIT_BUILTINS
19061 #define TARGET_INIT_BUILTINS mips_init_builtins
19062 #undef TARGET_BUILTIN_DECL
19063 #define TARGET_BUILTIN_DECL mips_builtin_decl
19064 #undef TARGET_EXPAND_BUILTIN
19065 #define TARGET_EXPAND_BUILTIN mips_expand_builtin
19066
19067 #undef TARGET_HAVE_TLS
19068 #define TARGET_HAVE_TLS HAVE_AS_TLS
19069
19070 #undef TARGET_CANNOT_FORCE_CONST_MEM
19071 #define TARGET_CANNOT_FORCE_CONST_MEM mips_cannot_force_const_mem
19072
19073 #undef TARGET_LEGITIMATE_CONSTANT_P
19074 #define TARGET_LEGITIMATE_CONSTANT_P mips_legitimate_constant_p
19075
19076 #undef TARGET_ENCODE_SECTION_INFO
19077 #define TARGET_ENCODE_SECTION_INFO mips_encode_section_info
19078
19079 #undef TARGET_ATTRIBUTE_TABLE
19080 #define TARGET_ATTRIBUTE_TABLE mips_attribute_table
19081 /* All our function attributes are related to how out-of-line copies should
19082 be compiled or called. They don't in themselves prevent inlining. */
19083 #undef TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P
19084 #define TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P hook_bool_const_tree_true
19085
19086 #undef TARGET_EXTRA_LIVE_ON_ENTRY
19087 #define TARGET_EXTRA_LIVE_ON_ENTRY mips_extra_live_on_entry
19088
19089 #undef TARGET_USE_BLOCKS_FOR_CONSTANT_P
19090 #define TARGET_USE_BLOCKS_FOR_CONSTANT_P mips_use_blocks_for_constant_p
19091 #undef TARGET_USE_ANCHORS_FOR_SYMBOL_P
19092 #define TARGET_USE_ANCHORS_FOR_SYMBOL_P mips_use_anchors_for_symbol_p
19093
19094 #undef TARGET_COMP_TYPE_ATTRIBUTES
19095 #define TARGET_COMP_TYPE_ATTRIBUTES mips_comp_type_attributes
19096
19097 #ifdef HAVE_AS_DTPRELWORD
19098 #undef TARGET_ASM_OUTPUT_DWARF_DTPREL
19099 #define TARGET_ASM_OUTPUT_DWARF_DTPREL mips_output_dwarf_dtprel
19100 #endif
19101 #undef TARGET_DWARF_REGISTER_SPAN
19102 #define TARGET_DWARF_REGISTER_SPAN mips_dwarf_register_span
19103
19104 #undef TARGET_ASM_FINAL_POSTSCAN_INSN
19105 #define TARGET_ASM_FINAL_POSTSCAN_INSN mips_final_postscan_insn
19106
19107 #undef TARGET_LEGITIMATE_ADDRESS_P
19108 #define TARGET_LEGITIMATE_ADDRESS_P mips_legitimate_address_p
19109
19110 #undef TARGET_FRAME_POINTER_REQUIRED
19111 #define TARGET_FRAME_POINTER_REQUIRED mips_frame_pointer_required
19112
19113 #undef TARGET_CAN_ELIMINATE
19114 #define TARGET_CAN_ELIMINATE mips_can_eliminate
19115
19116 #undef TARGET_CONDITIONAL_REGISTER_USAGE
19117 #define TARGET_CONDITIONAL_REGISTER_USAGE mips_conditional_register_usage
19118
19119 #undef TARGET_TRAMPOLINE_INIT
19120 #define TARGET_TRAMPOLINE_INIT mips_trampoline_init
19121
19122 #undef TARGET_ASM_OUTPUT_SOURCE_FILENAME
19123 #define TARGET_ASM_OUTPUT_SOURCE_FILENAME mips_output_filename
19124
19125 #undef TARGET_SHIFT_TRUNCATION_MASK
19126 #define TARGET_SHIFT_TRUNCATION_MASK mips_shift_truncation_mask
19127
19128 #undef TARGET_PREPARE_PCH_SAVE
19129 #define TARGET_PREPARE_PCH_SAVE mips_prepare_pch_save
19130
19131 #undef TARGET_VECTORIZE_VEC_PERM_CONST_OK
19132 #define TARGET_VECTORIZE_VEC_PERM_CONST_OK mips_vectorize_vec_perm_const_ok
19133
19134 #undef TARGET_CASE_VALUES_THRESHOLD
19135 #define TARGET_CASE_VALUES_THRESHOLD mips_case_values_threshold
19136
19137 #undef TARGET_ATOMIC_ASSIGN_EXPAND_FENV
19138 #define TARGET_ATOMIC_ASSIGN_EXPAND_FENV mips_atomic_assign_expand_fenv
19139
19140 #undef TARGET_CALL_FUSAGE_CONTAINS_NON_CALLEE_CLOBBERS
19141 #define TARGET_CALL_FUSAGE_CONTAINS_NON_CALLEE_CLOBBERS true
19142
19143 #undef TARGET_SPILL_CLASS
19144 #define TARGET_SPILL_CLASS mips_spill_class
19145 #undef TARGET_LRA_P
19146 #define TARGET_LRA_P mips_lra_p
19147
19148 struct gcc_target targetm = TARGET_INITIALIZER;
19149 \f
19150 #include "gt-mips.h"