/* ------------------------------------------------------------------------ */
-/* A helper function to check if this function should contain prologue. */
-static int
-nds32_have_prologue_p (void)
-{
- int i;
-
- for (i = 0; i < 28; i++)
- if (NDS32_REQUIRED_CALLEE_SAVED_P (i))
- return 1;
-
- return (flag_pic
- || NDS32_REQUIRED_CALLEE_SAVED_P (FP_REGNUM)
- || NDS32_REQUIRED_CALLEE_SAVED_P (LP_REGNUM));
-}
-
-/* Return true if is load/store with SYMBOL_REF addressing mode
- and memory mode is SImode. */
-static bool
-nds32_symbol_load_store_p (rtx_insn *insn)
-{
- rtx mem_src = NULL_RTX;
-
- switch (get_attr_type (insn))
- {
- case TYPE_LOAD:
- mem_src = SET_SRC (PATTERN (insn));
- break;
- case TYPE_STORE:
- mem_src = SET_DEST (PATTERN (insn));
- break;
- default:
- break;
- }
-
- /* Find load/store insn with addressing mode is SYMBOL_REF. */
- if (mem_src != NULL_RTX)
- {
- if ((GET_CODE (mem_src) == ZERO_EXTEND)
- || (GET_CODE (mem_src) == SIGN_EXTEND))
- mem_src = XEXP (mem_src, 0);
-
- if ((GET_CODE (XEXP (mem_src, 0)) == SYMBOL_REF)
- || (GET_CODE (XEXP (mem_src, 0)) == LO_SUM))
- return true;
- }
-
- return false;
-}
-
/* Function to determine whether it is worth to do fp_as_gp optimization.
Return 0: It is NOT worth to do fp_as_gp optimization.
Return 1: It is APPROXIMATELY worth to do fp_as_gp optimization.
int
nds32_fp_as_gp_check_available (void)
{
- /* If there exists ANY of following conditions,
- we DO NOT perform fp_as_gp optimization:
- 1. TARGET_FORBID_FP_AS_GP is set
- regardless of the TARGET_FORCE_FP_AS_GP.
- 2. User explicitly uses 'naked' attribute.
- 3. Not optimize for size.
- 4. Need frame pointer.
- 5. If $fp is already required to be saved,
- it means $fp is already choosen by register allocator.
- Thus we better not to use it for fp_as_gp optimization.
- 6. This function is a vararg function.
- DO NOT apply fp_as_gp optimization on this function
- because it may change and break stack frame.
- 7. The epilogue is empty.
- This happens when the function uses exit()
- or its attribute is no_return.
- In that case, compiler will not expand epilogue
- so that we have no chance to output .omit_fp_end directive. */
- if (TARGET_FORBID_FP_AS_GP
- || lookup_attribute ("naked", DECL_ATTRIBUTES (current_function_decl))
- || !optimize_size
- || frame_pointer_needed
- || NDS32_REQUIRED_CALLEE_SAVED_P (FP_REGNUM)
- || (cfun->stdarg == 1)
- || (find_fallthru_edge (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds) == NULL))
- return 0;
-
- /* Now we can check the possibility of using fp_as_gp optimization. */
- if (TARGET_FORCE_FP_AS_GP)
- {
- /* User explicitly issues -mforce-fp-as-gp option. */
- df_set_regs_ever_live (FP_REGNUM, 1);
- return 1;
- }
- else
- {
- /* In the following we are going to evaluate whether
- it is worth to do fp_as_gp optimization. */
- int good_gain = 0;
- int symbol_count = 0;
-
- int threshold;
- rtx_insn *insn;
-
- /* We check if there already requires prologue.
- Note that $gp will be saved in prologue for PIC code generation.
- After that, we can set threshold by the existence of prologue.
- Each fp-implied instruction will gain 2-byte code size
- from gp-aware instruction, so we have following heuristics. */
- if (flag_pic
- || nds32_have_prologue_p ())
- {
- /* Have-prologue:
- Compiler already intends to generate prologue content,
- so the fp_as_gp optimization will only insert
- 'la $fp,_FP_BASE_' instruction, which will be
- converted into 4-byte instruction at link time.
- The threshold is "3" symbol accesses, 2 + 2 + 2 > 4. */
- threshold = 3;
- }
- else
- {
- /* None-prologue:
- Compiler originally does not generate prologue content,
- so the fp_as_gp optimization will NOT ONLY insert
- 'la $fp,_FP_BASE' instruction, but also causes
- push/pop instructions.
- If we are using v3push (push25/pop25),
- the threshold is "5" symbol accesses, 5*2 > 4 + 2 + 2;
- If we are using normal push (smw/lmw),
- the threshold is "5+2" symbol accesses 7*2 > 4 + 4 + 4. */
- threshold = 5 + (TARGET_V3PUSH ? 0 : 2);
- }
-
- /* We would like to traverse every instruction in this function.
- So we need to have push_topmost_sequence()/pop_topmost_sequence()
- surrounding our for-loop evaluation. */
- push_topmost_sequence ();
- /* Counting the insn number which the addressing mode is symbol. */
- for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
- {
- if (single_set (insn) && nds32_symbol_load_store_p (insn))
- symbol_count++;
-
- if (symbol_count == threshold)
- {
- good_gain = 1;
- break;
- }
- }
- pop_topmost_sequence ();
-
- /* Enable fp_as_gp optimization when potential gain is good enough. */
- if (good_gain)
- {
- df_set_regs_ever_live (FP_REGNUM, 1);
- return 1;
- }
- }
-
/* By default we return 0. */
return 0;
}
"for checking inconsistency on interrupt handler\n");
fprintf (asm_out_file, "\t.vec_size\t%d\n", nds32_isr_vector_size);
- /* If user enables '-mforce-fp-as-gp' or compiles programs with -Os,
- the compiler may produce 'la $fp,_FP_BASE_' instruction
- at prologue for fp-as-gp optimization.
- We should emit weak reference of _FP_BASE_ to avoid undefined reference
- in case user does not pass '--relax' option to linker. */
- if (TARGET_FORCE_FP_AS_GP || optimize_size)
- {
- fprintf (asm_out_file, "\t! This weak reference is required to do "
- "fp-as-gp link time optimization\n");
- fprintf (asm_out_file, "\t.weak\t_FP_BASE_\n");
- }
- /* If user enables '-mex9', we should emit relaxation directive
- to tell linker that this file is allowed to do ex9 optimization. */
- if (TARGET_EX9)
- {
- fprintf (asm_out_file, "\t! This relaxation directive is required "
- "to do ex9 link time optimization\n");
- fprintf (asm_out_file, "\t.relax\tex9\n");
- }
-
fprintf (asm_out_file, "\t! ------------------------------------\n");
if (TARGET_ISA_V2)
fixed_regs[r] = call_used_regs[r] = 1;
}
- /* See if user explicitly would like to use fp-as-gp optimization.
- If so, we must prevent $fp from being allocated
- during register allocation. */
- if (TARGET_FORCE_FP_AS_GP)
- fixed_regs[FP_REGNUM] = call_used_regs[FP_REGNUM] = 1;
-
if (!TARGET_16_BIT)
{
/* Under no 16 bit ISA, we need to strictly disable TARGET_V3PUSH. */