re PR tree-optimization/42508 (wrong code with "-O1 -fipa-sra")
[gcc.git] / gcc / cgraphunit.c
1 /* Callgraph based interprocedural optimizations.
2 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010
3 Free Software Foundation, Inc.
4 Contributed by Jan Hubicka
5
6 This file is part of GCC.
7
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
12
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
17
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
21
22 /* This module implements main driver of compilation process as well as
23 few basic interprocedural optimizers.
24
25 The main scope of this file is to act as an interface in between
26 tree based frontends and the backend (and middle end)
27
28 The front-end is supposed to use following functionality:
29
30 - cgraph_finalize_function
31
32 This function is called once front-end has parsed whole body of function
33 and it is certain that neither the function body nor the declaration will change.
34
35 (There is one exception needed for implementing GCC extern inline
36 function.)
37
38 - varpool_finalize_variable
39
40 This function has same behavior as the above but is used for static
41 variables.
42
43 - cgraph_finalize_compilation_unit
44
45 This function is called once (source level) compilation unit is finalized
46 and it will no longer change.
47
48 The call-graph construction and local function
49 analysis take place here. Bodies of unreachable functions are released
50 to conserve memory usage.
51
52 The function can be called multiple times when multiple source level
53 compilation units are combined (such as in C frontend)
54
55 - cgraph_optimize
56
57 In this unit-at-a-time compilation the intra procedural analysis takes
58 place here. In particular the static functions whose address is never
59 taken are marked as local. Backend can then use this information to
60 modify calling conventions, do better inlining or similar optimizations.
61
62 - cgraph_mark_needed_node
63 - varpool_mark_needed_node
64
65 When function or variable is referenced by some hidden way the call-graph
66 data structure must be updated accordingly by this function.
67 There should be little need to call this function and all the references
68 should be made explicit to cgraph code. At present these functions are
69 used by C++ frontend to explicitly mark the keyed methods.
70
71 - analyze_expr callback
72
73 This function is responsible for lowering tree nodes not understood by
74 generic code into understandable ones or alternatively marking
75 callgraph and varpool nodes referenced by them as needed.
76
77 ??? On the tree-ssa genericizing should take place here and we will avoid
78 need for these hooks (replacing them by genericizing hook)
79
80 Analyzing of all functions is deferred
81 to cgraph_finalize_compilation_unit and expansion into cgraph_optimize.
82
83 In cgraph_finalize_compilation_unit the reachable functions are
84 analyzed. During analysis the call-graph edges from reachable
85 functions are constructed and their destinations are marked as
86 reachable. References to functions and variables are discovered too
87 and variables found to be needed output to the assembly file. Via
88 mark_referenced call in assemble_variable functions referenced by
89 static variables are noticed too.
90
91 The intra-procedural information is produced and its existence
92 indicated by global_info_ready. Once this flag is set it is impossible
93 to change function from !reachable to reachable and thus
94 assemble_variable no longer calls mark_referenced.
95
96 Finally the call-graph is topologically sorted and all reachable functions
97 that have not been completely inlined or are not external are output.
98
99 ??? It is possible that reference to function or variable is optimized
100 out. We can not deal with this nicely because topological order is not
101 suitable for it. For tree-ssa we may consider another pass doing
102 optimization and re-discovering reachable functions.
103
104 ??? Reorganize code so variables are output very last and only if they
105 really have been referenced by produced code, so we catch more cases
106 where reference has been optimized out. */
107
108
109 #include "config.h"
110 #include "system.h"
111 #include "coretypes.h"
112 #include "tm.h"
113 #include "tree.h"
114 #include "rtl.h"
115 #include "tree-flow.h"
116 #include "tree-inline.h"
117 #include "langhooks.h"
118 #include "pointer-set.h"
119 #include "toplev.h"
120 #include "flags.h"
121 #include "ggc.h"
122 #include "debug.h"
123 #include "target.h"
124 #include "cgraph.h"
125 #include "diagnostic.h"
126 #include "timevar.h"
127 #include "params.h"
128 #include "fibheap.h"
129 #include "intl.h"
130 #include "function.h"
131 #include "ipa-prop.h"
132 #include "gimple.h"
133 #include "tree-iterator.h"
134 #include "tree-pass.h"
135 #include "tree-dump.h"
136 #include "output.h"
137 #include "coverage.h"
138 #include "plugin.h"
139
140 static void cgraph_expand_all_functions (void);
141 static void cgraph_mark_functions_to_output (void);
142 static void cgraph_expand_function (struct cgraph_node *);
143 static void cgraph_output_pending_asms (void);
144 static void cgraph_analyze_function (struct cgraph_node *);
145
146 static FILE *cgraph_dump_file;
147
148 /* A vector of FUNCTION_DECLs declared as static constructors. */
149 static GTY (()) VEC(tree, gc) *static_ctors;
150 /* A vector of FUNCTION_DECLs declared as static destructors. */
151 static GTY (()) VEC(tree, gc) *static_dtors;
152
153 /* Used for vtable lookup in thunk adjusting. */
154 static GTY (()) tree vtable_entry_type;
155
156 /* When target does not have ctors and dtors, we call all constructor
157 and destructor by special initialization/destruction function
158 recognized by collect2.
159
160 When we are going to build this function, collect all constructors and
161 destructors and turn them into normal functions. */
162
163 static void
164 record_cdtor_fn (tree fndecl)
165 {
166 struct cgraph_node *node;
167 if (targetm.have_ctors_dtors
168 || (!DECL_STATIC_CONSTRUCTOR (fndecl)
169 && !DECL_STATIC_DESTRUCTOR (fndecl)))
170 return;
171
172 if (DECL_STATIC_CONSTRUCTOR (fndecl))
173 {
174 VEC_safe_push (tree, gc, static_ctors, fndecl);
175 DECL_STATIC_CONSTRUCTOR (fndecl) = 0;
176 }
177 if (DECL_STATIC_DESTRUCTOR (fndecl))
178 {
179 VEC_safe_push (tree, gc, static_dtors, fndecl);
180 DECL_STATIC_DESTRUCTOR (fndecl) = 0;
181 }
182 node = cgraph_node (fndecl);
183 node->local.disregard_inline_limits = 1;
184 cgraph_mark_reachable_node (node);
185 }
186
187 /* Define global constructors/destructor functions for the CDTORS, of
188 which they are LEN. The CDTORS are sorted by initialization
189 priority. If CTOR_P is true, these are constructors; otherwise,
190 they are destructors. */
191
192 static void
193 build_cdtor (bool ctor_p, tree *cdtors, size_t len)
194 {
195 size_t i;
196
197 i = 0;
198 while (i < len)
199 {
200 tree body;
201 tree fn;
202 priority_type priority;
203
204 priority = 0;
205 body = NULL_TREE;
206 /* Find the next batch of constructors/destructors with the same
207 initialization priority. */
208 do
209 {
210 priority_type p;
211 fn = cdtors[i];
212 p = ctor_p ? DECL_INIT_PRIORITY (fn) : DECL_FINI_PRIORITY (fn);
213 if (!body)
214 priority = p;
215 else if (p != priority)
216 break;
217 append_to_statement_list (build_function_call_expr (UNKNOWN_LOCATION,
218 fn, 0),
219 &body);
220 ++i;
221 }
222 while (i < len);
223 gcc_assert (body != NULL_TREE);
224 /* Generate a function to call all the function of like
225 priority. */
226 cgraph_build_static_cdtor (ctor_p ? 'I' : 'D', body, priority);
227 }
228 }
229
230 /* Comparison function for qsort. P1 and P2 are actually of type
231 "tree *" and point to static constructors. DECL_INIT_PRIORITY is
232 used to determine the sort order. */
233
234 static int
235 compare_ctor (const void *p1, const void *p2)
236 {
237 tree f1;
238 tree f2;
239 int priority1;
240 int priority2;
241
242 f1 = *(const tree *)p1;
243 f2 = *(const tree *)p2;
244 priority1 = DECL_INIT_PRIORITY (f1);
245 priority2 = DECL_INIT_PRIORITY (f2);
246
247 if (priority1 < priority2)
248 return -1;
249 else if (priority1 > priority2)
250 return 1;
251 else
252 /* Ensure a stable sort. */
253 return (const tree *)p1 - (const tree *)p2;
254 }
255
256 /* Comparison function for qsort. P1 and P2 are actually of type
257 "tree *" and point to static destructors. DECL_FINI_PRIORITY is
258 used to determine the sort order. */
259
260 static int
261 compare_dtor (const void *p1, const void *p2)
262 {
263 tree f1;
264 tree f2;
265 int priority1;
266 int priority2;
267
268 f1 = *(const tree *)p1;
269 f2 = *(const tree *)p2;
270 priority1 = DECL_FINI_PRIORITY (f1);
271 priority2 = DECL_FINI_PRIORITY (f2);
272
273 if (priority1 < priority2)
274 return -1;
275 else if (priority1 > priority2)
276 return 1;
277 else
278 /* Ensure a stable sort. */
279 return (const tree *)p1 - (const tree *)p2;
280 }
281
282 /* Generate functions to call static constructors and destructors
283 for targets that do not support .ctors/.dtors sections. These
284 functions have magic names which are detected by collect2. */
285
286 static void
287 cgraph_build_cdtor_fns (void)
288 {
289 if (!VEC_empty (tree, static_ctors))
290 {
291 gcc_assert (!targetm.have_ctors_dtors);
292 qsort (VEC_address (tree, static_ctors),
293 VEC_length (tree, static_ctors),
294 sizeof (tree),
295 compare_ctor);
296 build_cdtor (/*ctor_p=*/true,
297 VEC_address (tree, static_ctors),
298 VEC_length (tree, static_ctors));
299 VEC_truncate (tree, static_ctors, 0);
300 }
301
302 if (!VEC_empty (tree, static_dtors))
303 {
304 gcc_assert (!targetm.have_ctors_dtors);
305 qsort (VEC_address (tree, static_dtors),
306 VEC_length (tree, static_dtors),
307 sizeof (tree),
308 compare_dtor);
309 build_cdtor (/*ctor_p=*/false,
310 VEC_address (tree, static_dtors),
311 VEC_length (tree, static_dtors));
312 VEC_truncate (tree, static_dtors, 0);
313 }
314 }
315
316 /* Determine if function DECL is needed. That is, visible to something
317 either outside this translation unit, something magic in the system
318 configury. */
319
320 bool
321 cgraph_decide_is_function_needed (struct cgraph_node *node, tree decl)
322 {
323 /* If the user told us it is used, then it must be so. */
324 if (node->local.externally_visible)
325 return true;
326
327 /* ??? If the assembler name is set by hand, it is possible to assemble
328 the name later after finalizing the function and the fact is noticed
329 in assemble_name then. This is arguably a bug. */
330 if (DECL_ASSEMBLER_NAME_SET_P (decl)
331 && TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
332 return true;
333
334 /* With -fkeep-inline-functions we are keeping all inline functions except
335 for extern inline ones. */
336 if (flag_keep_inline_functions
337 && DECL_DECLARED_INLINE_P (decl)
338 && !DECL_EXTERNAL (decl)
339 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (decl)))
340 return true;
341
342 /* If we decided it was needed before, but at the time we didn't have
343 the body of the function available, then it's still needed. We have
344 to go back and re-check its dependencies now. */
345 if (node->needed)
346 return true;
347
348 /* Externally visible functions must be output. The exception is
349 COMDAT functions that must be output only when they are needed.
350
351 When not optimizing, also output the static functions. (see
352 PR24561), but don't do so for always_inline functions, functions
353 declared inline and nested functions. These was optimized out
354 in the original implementation and it is unclear whether we want
355 to change the behavior here. */
356 if (((TREE_PUBLIC (decl)
357 || (!optimize && !node->local.disregard_inline_limits
358 && !DECL_DECLARED_INLINE_P (decl)
359 && !node->origin))
360 && !flag_whole_program
361 && !flag_lto
362 && !flag_whopr)
363 && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl))
364 return true;
365
366 /* Constructors and destructors are reachable from the runtime by
367 some mechanism. */
368 if (DECL_STATIC_CONSTRUCTOR (decl) || DECL_STATIC_DESTRUCTOR (decl))
369 return true;
370
371 return false;
372 }
373
374 /* Process CGRAPH_NEW_FUNCTIONS and perform actions necessary to add these
375 functions into callgraph in a way so they look like ordinary reachable
376 functions inserted into callgraph already at construction time. */
377
378 bool
379 cgraph_process_new_functions (void)
380 {
381 bool output = false;
382 tree fndecl;
383 struct cgraph_node *node;
384
385 /* Note that this queue may grow as its being processed, as the new
386 functions may generate new ones. */
387 while (cgraph_new_nodes)
388 {
389 node = cgraph_new_nodes;
390 fndecl = node->decl;
391 cgraph_new_nodes = cgraph_new_nodes->next_needed;
392 switch (cgraph_state)
393 {
394 case CGRAPH_STATE_CONSTRUCTION:
395 /* At construction time we just need to finalize function and move
396 it into reachable functions list. */
397
398 node->next_needed = NULL;
399 cgraph_finalize_function (fndecl, false);
400 cgraph_mark_reachable_node (node);
401 output = true;
402 break;
403
404 case CGRAPH_STATE_IPA:
405 case CGRAPH_STATE_IPA_SSA:
406 /* When IPA optimization already started, do all essential
407 transformations that has been already performed on the whole
408 cgraph but not on this function. */
409
410 gimple_register_cfg_hooks ();
411 if (!node->analyzed)
412 cgraph_analyze_function (node);
413 push_cfun (DECL_STRUCT_FUNCTION (fndecl));
414 current_function_decl = fndecl;
415 compute_inline_parameters (node);
416 if ((cgraph_state == CGRAPH_STATE_IPA_SSA
417 && !gimple_in_ssa_p (DECL_STRUCT_FUNCTION (fndecl)))
418 /* When not optimizing, be sure we run early local passes anyway
419 to expand OMP. */
420 || !optimize)
421 execute_pass_list (pass_early_local_passes.pass.sub);
422 free_dominance_info (CDI_POST_DOMINATORS);
423 free_dominance_info (CDI_DOMINATORS);
424 pop_cfun ();
425 current_function_decl = NULL;
426 break;
427
428 case CGRAPH_STATE_EXPANSION:
429 /* Functions created during expansion shall be compiled
430 directly. */
431 node->process = 0;
432 cgraph_expand_function (node);
433 break;
434
435 default:
436 gcc_unreachable ();
437 break;
438 }
439 cgraph_call_function_insertion_hooks (node);
440 }
441 return output;
442 }
443
444 /* As an GCC extension we allow redefinition of the function. The
445 semantics when both copies of bodies differ is not well defined.
446 We replace the old body with new body so in unit at a time mode
447 we always use new body, while in normal mode we may end up with
448 old body inlined into some functions and new body expanded and
449 inlined in others.
450
451 ??? It may make more sense to use one body for inlining and other
452 body for expanding the function but this is difficult to do. */
453
454 static void
455 cgraph_reset_node (struct cgraph_node *node)
456 {
457 /* If node->process is set, then we have already begun whole-unit analysis.
458 This is *not* testing for whether we've already emitted the function.
459 That case can be sort-of legitimately seen with real function redefinition
460 errors. I would argue that the front end should never present us with
461 such a case, but don't enforce that for now. */
462 gcc_assert (!node->process);
463
464 /* Reset our data structures so we can analyze the function again. */
465 memset (&node->local, 0, sizeof (node->local));
466 memset (&node->global, 0, sizeof (node->global));
467 memset (&node->rtl, 0, sizeof (node->rtl));
468 node->analyzed = false;
469 node->local.redefined_extern_inline = true;
470 node->local.finalized = false;
471
472 cgraph_node_remove_callees (node);
473
474 /* We may need to re-queue the node for assembling in case
475 we already proceeded it and ignored as not needed or got
476 a re-declaration in IMA mode. */
477 if (node->reachable)
478 {
479 struct cgraph_node *n;
480
481 for (n = cgraph_nodes_queue; n; n = n->next_needed)
482 if (n == node)
483 break;
484 if (!n)
485 node->reachable = 0;
486 }
487 }
488
489 static void
490 cgraph_lower_function (struct cgraph_node *node)
491 {
492 if (node->lowered)
493 return;
494
495 if (node->nested)
496 lower_nested_functions (node->decl);
497 gcc_assert (!node->nested);
498
499 tree_lowering_passes (node->decl);
500 node->lowered = true;
501 }
502
503 /* DECL has been parsed. Take it, queue it, compile it at the whim of the
504 logic in effect. If NESTED is true, then our caller cannot stand to have
505 the garbage collector run at the moment. We would need to either create
506 a new GC context, or just not compile right now. */
507
508 void
509 cgraph_finalize_function (tree decl, bool nested)
510 {
511 struct cgraph_node *node = cgraph_node (decl);
512
513 if (node->local.finalized)
514 cgraph_reset_node (node);
515
516 node->pid = cgraph_max_pid ++;
517 notice_global_symbol (decl);
518 node->local.finalized = true;
519 node->lowered = DECL_STRUCT_FUNCTION (decl)->cfg != NULL;
520 node->finalized_by_frontend = true;
521 record_cdtor_fn (node->decl);
522
523 if (cgraph_decide_is_function_needed (node, decl))
524 cgraph_mark_needed_node (node);
525
526 /* Since we reclaim unreachable nodes at the end of every language
527 level unit, we need to be conservative about possible entry points
528 there. */
529 if ((TREE_PUBLIC (decl) && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl)))
530 cgraph_mark_reachable_node (node);
531
532 /* If we've not yet emitted decl, tell the debug info about it. */
533 if (!TREE_ASM_WRITTEN (decl))
534 (*debug_hooks->deferred_inline_function) (decl);
535
536 /* Possibly warn about unused parameters. */
537 if (warn_unused_parameter)
538 do_warn_unused_parameter (decl);
539
540 if (!nested)
541 ggc_collect ();
542 }
543
544 /* C99 extern inline keywords allow changing of declaration after function
545 has been finalized. We need to re-decide if we want to mark the function as
546 needed then. */
547
548 void
549 cgraph_mark_if_needed (tree decl)
550 {
551 struct cgraph_node *node = cgraph_node (decl);
552 if (node->local.finalized && cgraph_decide_is_function_needed (node, decl))
553 cgraph_mark_needed_node (node);
554 }
555
556 /* Return TRUE if NODE2 is equivalent to NODE or its clone. */
557 static bool
558 clone_of_p (struct cgraph_node *node, struct cgraph_node *node2)
559 {
560 while (node != node2 && node2)
561 node2 = node2->clone_of;
562 return node2 != NULL;
563 }
564
565 /* Verify cgraph nodes of given cgraph node. */
566 void
567 verify_cgraph_node (struct cgraph_node *node)
568 {
569 struct cgraph_edge *e;
570 struct function *this_cfun = DECL_STRUCT_FUNCTION (node->decl);
571 struct function *saved_cfun = cfun;
572 basic_block this_block;
573 gimple_stmt_iterator gsi;
574 bool error_found = false;
575
576 if (errorcount || sorrycount)
577 return;
578
579 timevar_push (TV_CGRAPH_VERIFY);
580 /* debug_generic_stmt needs correct cfun */
581 set_cfun (this_cfun);
582 for (e = node->callees; e; e = e->next_callee)
583 if (e->aux)
584 {
585 error ("aux field set for edge %s->%s",
586 identifier_to_locale (cgraph_node_name (e->caller)),
587 identifier_to_locale (cgraph_node_name (e->callee)));
588 error_found = true;
589 }
590 if (node->count < 0)
591 {
592 error ("Execution count is negative");
593 error_found = true;
594 }
595 if (node->global.inlined_to && node->local.externally_visible)
596 {
597 error ("Externally visible inline clone");
598 error_found = true;
599 }
600 if (node->global.inlined_to && node->address_taken)
601 {
602 error ("Inline clone with address taken");
603 error_found = true;
604 }
605 if (node->global.inlined_to && node->needed)
606 {
607 error ("Inline clone is needed");
608 error_found = true;
609 }
610 for (e = node->callers; e; e = e->next_caller)
611 {
612 if (e->count < 0)
613 {
614 error ("caller edge count is negative");
615 error_found = true;
616 }
617 if (e->frequency < 0)
618 {
619 error ("caller edge frequency is negative");
620 error_found = true;
621 }
622 if (e->frequency > CGRAPH_FREQ_MAX)
623 {
624 error ("caller edge frequency is too large");
625 error_found = true;
626 }
627 if (gimple_has_body_p (e->caller->decl)
628 && !e->caller->global.inlined_to
629 && (e->frequency
630 != compute_call_stmt_bb_frequency (e->caller->decl,
631 gimple_bb (e->call_stmt))))
632 {
633 error ("caller edge frequency %i does not match BB freqency %i",
634 e->frequency,
635 compute_call_stmt_bb_frequency (e->caller->decl,
636 gimple_bb (e->call_stmt)));
637 error_found = true;
638 }
639 if (!e->inline_failed)
640 {
641 if (node->global.inlined_to
642 != (e->caller->global.inlined_to
643 ? e->caller->global.inlined_to : e->caller))
644 {
645 error ("inlined_to pointer is wrong");
646 error_found = true;
647 }
648 if (node->callers->next_caller)
649 {
650 error ("multiple inline callers");
651 error_found = true;
652 }
653 }
654 else
655 if (node->global.inlined_to)
656 {
657 error ("inlined_to pointer set for noninline callers");
658 error_found = true;
659 }
660 }
661 if (!node->callers && node->global.inlined_to)
662 {
663 error ("inlined_to pointer is set but no predecessors found");
664 error_found = true;
665 }
666 if (node->global.inlined_to == node)
667 {
668 error ("inlined_to pointer refers to itself");
669 error_found = true;
670 }
671
672 if (!cgraph_node (node->decl))
673 {
674 error ("node not found in cgraph_hash");
675 error_found = true;
676 }
677
678 if (node->clone_of)
679 {
680 struct cgraph_node *n;
681 for (n = node->clone_of->clones; n; n = n->next_sibling_clone)
682 if (n == node)
683 break;
684 if (!n)
685 {
686 error ("node has wrong clone_of");
687 error_found = true;
688 }
689 }
690 if (node->clones)
691 {
692 struct cgraph_node *n;
693 for (n = node->clones; n; n = n->next_sibling_clone)
694 if (n->clone_of != node)
695 break;
696 if (n)
697 {
698 error ("node has wrong clone list");
699 error_found = true;
700 }
701 }
702 if ((node->prev_sibling_clone || node->next_sibling_clone) && !node->clone_of)
703 {
704 error ("node is in clone list but it is not clone");
705 error_found = true;
706 }
707 if (!node->prev_sibling_clone && node->clone_of && node->clone_of->clones != node)
708 {
709 error ("node has wrong prev_clone pointer");
710 error_found = true;
711 }
712 if (node->prev_sibling_clone && node->prev_sibling_clone->next_sibling_clone != node)
713 {
714 error ("double linked list of clones corrupted");
715 error_found = true;
716 }
717
718 if (node->analyzed && gimple_has_body_p (node->decl)
719 && !TREE_ASM_WRITTEN (node->decl)
720 && (!DECL_EXTERNAL (node->decl) || node->global.inlined_to)
721 && !flag_wpa)
722 {
723 if (this_cfun->cfg)
724 {
725 /* The nodes we're interested in are never shared, so walk
726 the tree ignoring duplicates. */
727 struct pointer_set_t *visited_nodes = pointer_set_create ();
728 /* Reach the trees by walking over the CFG, and note the
729 enclosing basic-blocks in the call edges. */
730 FOR_EACH_BB_FN (this_block, this_cfun)
731 for (gsi = gsi_start_bb (this_block);
732 !gsi_end_p (gsi);
733 gsi_next (&gsi))
734 {
735 gimple stmt = gsi_stmt (gsi);
736 tree decl;
737 if (is_gimple_call (stmt) && (decl = gimple_call_fndecl (stmt)))
738 {
739 struct cgraph_edge *e = cgraph_edge (node, stmt);
740 if (e)
741 {
742 if (e->aux)
743 {
744 error ("shared call_stmt:");
745 debug_gimple_stmt (stmt);
746 error_found = true;
747 }
748 if (e->callee->same_body_alias)
749 {
750 error ("edge points to same body alias:");
751 debug_tree (e->callee->decl);
752 error_found = true;
753 }
754 else if (!clone_of_p (cgraph_node (decl), e->callee)
755 && !e->callee->global.inlined_to)
756 {
757 error ("edge points to wrong declaration:");
758 debug_tree (e->callee->decl);
759 fprintf (stderr," Instead of:");
760 debug_tree (decl);
761 error_found = true;
762 }
763 e->aux = (void *)1;
764 }
765 else
766 {
767 error ("missing callgraph edge for call stmt:");
768 debug_gimple_stmt (stmt);
769 error_found = true;
770 }
771 }
772 }
773 pointer_set_destroy (visited_nodes);
774 }
775 else
776 /* No CFG available?! */
777 gcc_unreachable ();
778
779 for (e = node->callees; e; e = e->next_callee)
780 {
781 if (!e->aux && !e->indirect_call)
782 {
783 error ("edge %s->%s has no corresponding call_stmt",
784 identifier_to_locale (cgraph_node_name (e->caller)),
785 identifier_to_locale (cgraph_node_name (e->callee)));
786 debug_gimple_stmt (e->call_stmt);
787 error_found = true;
788 }
789 e->aux = 0;
790 }
791 }
792 if (error_found)
793 {
794 dump_cgraph_node (stderr, node);
795 internal_error ("verify_cgraph_node failed");
796 }
797 set_cfun (saved_cfun);
798 timevar_pop (TV_CGRAPH_VERIFY);
799 }
800
801 /* Verify whole cgraph structure. */
802 void
803 verify_cgraph (void)
804 {
805 struct cgraph_node *node;
806
807 if (sorrycount || errorcount)
808 return;
809
810 for (node = cgraph_nodes; node; node = node->next)
811 verify_cgraph_node (node);
812 }
813
814 /* Output all asm statements we have stored up to be output. */
815
816 static void
817 cgraph_output_pending_asms (void)
818 {
819 struct cgraph_asm_node *can;
820
821 if (errorcount || sorrycount)
822 return;
823
824 for (can = cgraph_asm_nodes; can; can = can->next)
825 assemble_asm (can->asm_str);
826 cgraph_asm_nodes = NULL;
827 }
828
829 /* Analyze the function scheduled to be output. */
830 static void
831 cgraph_analyze_function (struct cgraph_node *node)
832 {
833 tree save = current_function_decl;
834 tree decl = node->decl;
835
836 current_function_decl = decl;
837 push_cfun (DECL_STRUCT_FUNCTION (decl));
838
839 /* Make sure to gimplify bodies only once. During analyzing a
840 function we lower it, which will require gimplified nested
841 functions, so we can end up here with an already gimplified
842 body. */
843 if (!gimple_body (decl))
844 gimplify_function_tree (decl);
845 dump_function (TDI_generic, decl);
846
847 cgraph_lower_function (node);
848 node->analyzed = true;
849
850 pop_cfun ();
851 current_function_decl = save;
852 }
853
854 /* Look for externally_visible and used attributes and mark cgraph nodes
855 accordingly.
856
857 We cannot mark the nodes at the point the attributes are processed (in
858 handle_*_attribute) because the copy of the declarations available at that
859 point may not be canonical. For example, in:
860
861 void f();
862 void f() __attribute__((used));
863
864 the declaration we see in handle_used_attribute will be the second
865 declaration -- but the front end will subsequently merge that declaration
866 with the original declaration and discard the second declaration.
867
868 Furthermore, we can't mark these nodes in cgraph_finalize_function because:
869
870 void f() {}
871 void f() __attribute__((externally_visible));
872
873 is valid.
874
875 So, we walk the nodes at the end of the translation unit, applying the
876 attributes at that point. */
877
878 static void
879 process_function_and_variable_attributes (struct cgraph_node *first,
880 struct varpool_node *first_var)
881 {
882 struct cgraph_node *node;
883 struct varpool_node *vnode;
884
885 for (node = cgraph_nodes; node != first; node = node->next)
886 {
887 tree decl = node->decl;
888 if (lookup_attribute ("used", DECL_ATTRIBUTES (decl)))
889 {
890 mark_decl_referenced (decl);
891 if (node->local.finalized)
892 cgraph_mark_needed_node (node);
893 }
894 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
895 {
896 if (! TREE_PUBLIC (node->decl))
897 warning_at (DECL_SOURCE_LOCATION (node->decl), OPT_Wattributes,
898 "%<externally_visible%>"
899 " attribute have effect only on public objects");
900 else if (node->local.finalized)
901 cgraph_mark_needed_node (node);
902 }
903 }
904 for (vnode = varpool_nodes; vnode != first_var; vnode = vnode->next)
905 {
906 tree decl = vnode->decl;
907 if (lookup_attribute ("used", DECL_ATTRIBUTES (decl)))
908 {
909 mark_decl_referenced (decl);
910 vnode->force_output = true;
911 if (vnode->finalized)
912 varpool_mark_needed_node (vnode);
913 }
914 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
915 {
916 if (! TREE_PUBLIC (vnode->decl))
917 warning_at (DECL_SOURCE_LOCATION (vnode->decl), OPT_Wattributes,
918 "%<externally_visible%>"
919 " attribute have effect only on public objects");
920 else if (vnode->finalized)
921 varpool_mark_needed_node (vnode);
922 }
923 }
924 }
925
926 /* Process CGRAPH_NODES_NEEDED queue, analyze each function (and transitively
927 each reachable functions) and build cgraph.
928 The function can be called multiple times after inserting new nodes
929 into beginning of queue. Just the new part of queue is re-scanned then. */
930
931 static void
932 cgraph_analyze_functions (void)
933 {
934 /* Keep track of already processed nodes when called multiple times for
935 intermodule optimization. */
936 static struct cgraph_node *first_analyzed;
937 struct cgraph_node *first_processed = first_analyzed;
938 static struct varpool_node *first_analyzed_var;
939 struct cgraph_node *node, *next;
940
941 process_function_and_variable_attributes (first_processed,
942 first_analyzed_var);
943 first_processed = cgraph_nodes;
944 first_analyzed_var = varpool_nodes;
945 varpool_analyze_pending_decls ();
946 if (cgraph_dump_file)
947 {
948 fprintf (cgraph_dump_file, "Initial entry points:");
949 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
950 if (node->needed)
951 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
952 fprintf (cgraph_dump_file, "\n");
953 }
954 cgraph_process_new_functions ();
955
956 /* Propagate reachability flag and lower representation of all reachable
957 functions. In the future, lowering will introduce new functions and
958 new entry points on the way (by template instantiation and virtual
959 method table generation for instance). */
960 while (cgraph_nodes_queue)
961 {
962 struct cgraph_edge *edge;
963 tree decl = cgraph_nodes_queue->decl;
964
965 node = cgraph_nodes_queue;
966 cgraph_nodes_queue = cgraph_nodes_queue->next_needed;
967 node->next_needed = NULL;
968
969 /* ??? It is possible to create extern inline function and later using
970 weak alias attribute to kill its body. See
971 gcc.c-torture/compile/20011119-1.c */
972 if (!DECL_STRUCT_FUNCTION (decl))
973 {
974 cgraph_reset_node (node);
975 continue;
976 }
977
978 if (!node->analyzed)
979 cgraph_analyze_function (node);
980
981 for (edge = node->callees; edge; edge = edge->next_callee)
982 if (!edge->callee->reachable)
983 cgraph_mark_reachable_node (edge->callee);
984
985 if (node->same_comdat_group)
986 {
987 for (next = node->same_comdat_group;
988 next != node;
989 next = next->same_comdat_group)
990 cgraph_mark_reachable_node (next);
991 }
992
993 /* If decl is a clone of an abstract function, mark that abstract
994 function so that we don't release its body. The DECL_INITIAL() of that
995 abstract function declaration will be later needed to output debug info. */
996 if (DECL_ABSTRACT_ORIGIN (decl))
997 {
998 struct cgraph_node *origin_node = cgraph_node (DECL_ABSTRACT_ORIGIN (decl));
999 origin_node->abstract_and_needed = true;
1000 }
1001
1002 /* We finalize local static variables during constructing callgraph
1003 edges. Process their attributes too. */
1004 process_function_and_variable_attributes (first_processed,
1005 first_analyzed_var);
1006 first_processed = cgraph_nodes;
1007 first_analyzed_var = varpool_nodes;
1008 varpool_analyze_pending_decls ();
1009 cgraph_process_new_functions ();
1010 }
1011
1012 /* Collect entry points to the unit. */
1013 if (cgraph_dump_file)
1014 {
1015 fprintf (cgraph_dump_file, "Unit entry points:");
1016 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
1017 if (node->needed)
1018 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1019 fprintf (cgraph_dump_file, "\n\nInitial ");
1020 dump_cgraph (cgraph_dump_file);
1021 }
1022
1023 if (cgraph_dump_file)
1024 fprintf (cgraph_dump_file, "\nReclaiming functions:");
1025
1026 for (node = cgraph_nodes; node != first_analyzed; node = next)
1027 {
1028 tree decl = node->decl;
1029 next = node->next;
1030
1031 if (node->local.finalized && !gimple_has_body_p (decl))
1032 cgraph_reset_node (node);
1033
1034 if (!node->reachable && gimple_has_body_p (decl))
1035 {
1036 if (cgraph_dump_file)
1037 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1038 cgraph_remove_node (node);
1039 continue;
1040 }
1041 else
1042 node->next_needed = NULL;
1043 gcc_assert (!node->local.finalized || gimple_has_body_p (decl));
1044 gcc_assert (node->analyzed == node->local.finalized);
1045 }
1046 if (cgraph_dump_file)
1047 {
1048 fprintf (cgraph_dump_file, "\n\nReclaimed ");
1049 dump_cgraph (cgraph_dump_file);
1050 }
1051 first_analyzed = cgraph_nodes;
1052 ggc_collect ();
1053 }
1054
1055
1056 /* Analyze the whole compilation unit once it is parsed completely. */
1057
1058 void
1059 cgraph_finalize_compilation_unit (void)
1060 {
1061 timevar_push (TV_CGRAPH);
1062
1063 /* Do not skip analyzing the functions if there were errors, we
1064 miss diagnostics for following functions otherwise. */
1065
1066 /* Emit size functions we didn't inline. */
1067 finalize_size_functions ();
1068
1069 /* Call functions declared with the "constructor" or "destructor"
1070 attribute. */
1071 cgraph_build_cdtor_fns ();
1072
1073 /* Mark alias targets necessary and emit diagnostics. */
1074 finish_aliases_1 ();
1075
1076 if (!quiet_flag)
1077 {
1078 fprintf (stderr, "\nAnalyzing compilation unit\n");
1079 fflush (stderr);
1080 }
1081
1082 /* Gimplify and lower all functions, compute reachability and
1083 remove unreachable nodes. */
1084 cgraph_analyze_functions ();
1085
1086 /* Mark alias targets necessary and emit diagnostics. */
1087 finish_aliases_1 ();
1088
1089 /* Gimplify and lower thunks. */
1090 cgraph_analyze_functions ();
1091
1092 /* Finally drive the pass manager. */
1093 cgraph_optimize ();
1094
1095 timevar_pop (TV_CGRAPH);
1096 }
1097
1098
1099 /* Figure out what functions we want to assemble. */
1100
1101 static void
1102 cgraph_mark_functions_to_output (void)
1103 {
1104 struct cgraph_node *node;
1105 #ifdef ENABLE_CHECKING
1106 bool check_same_comdat_groups = false;
1107
1108 for (node = cgraph_nodes; node; node = node->next)
1109 gcc_assert (!node->process);
1110 #endif
1111
1112 for (node = cgraph_nodes; node; node = node->next)
1113 {
1114 tree decl = node->decl;
1115 struct cgraph_edge *e;
1116
1117 gcc_assert (!node->process || node->same_comdat_group);
1118 if (node->process)
1119 continue;
1120
1121 for (e = node->callers; e; e = e->next_caller)
1122 if (e->inline_failed)
1123 break;
1124
1125 /* We need to output all local functions that are used and not
1126 always inlined, as well as those that are reachable from
1127 outside the current compilation unit. */
1128 if (node->analyzed
1129 && !node->global.inlined_to
1130 && (node->needed
1131 || (e && node->reachable))
1132 && !TREE_ASM_WRITTEN (decl)
1133 && !DECL_EXTERNAL (decl))
1134 {
1135 node->process = 1;
1136 if (node->same_comdat_group)
1137 {
1138 struct cgraph_node *next;
1139 for (next = node->same_comdat_group;
1140 next != node;
1141 next = next->same_comdat_group)
1142 next->process = 1;
1143 }
1144 }
1145 else if (node->same_comdat_group)
1146 {
1147 #ifdef ENABLE_CHECKING
1148 check_same_comdat_groups = true;
1149 #endif
1150 }
1151 else
1152 {
1153 /* We should've reclaimed all functions that are not needed. */
1154 #ifdef ENABLE_CHECKING
1155 if (!node->global.inlined_to
1156 && gimple_has_body_p (decl)
1157 && !DECL_EXTERNAL (decl))
1158 {
1159 dump_cgraph_node (stderr, node);
1160 internal_error ("failed to reclaim unneeded function");
1161 }
1162 #endif
1163 gcc_assert (node->global.inlined_to
1164 || !gimple_has_body_p (decl)
1165 || DECL_EXTERNAL (decl));
1166
1167 }
1168
1169 }
1170 #ifdef ENABLE_CHECKING
1171 if (check_same_comdat_groups)
1172 for (node = cgraph_nodes; node; node = node->next)
1173 if (node->same_comdat_group && !node->process)
1174 {
1175 tree decl = node->decl;
1176 if (!node->global.inlined_to
1177 && gimple_has_body_p (decl)
1178 && !DECL_EXTERNAL (decl))
1179 {
1180 dump_cgraph_node (stderr, node);
1181 internal_error ("failed to reclaim unneeded function");
1182 }
1183 }
1184 #endif
1185 }
1186
1187 /* DECL is FUNCTION_DECL. Initialize datastructures so DECL is a function
1188 in lowered gimple form.
1189
1190 Set current_function_decl and cfun to newly constructed empty function body.
1191 return basic block in the function body. */
1192
1193 static basic_block
1194 init_lowered_empty_function (tree decl)
1195 {
1196 basic_block bb;
1197
1198 current_function_decl = decl;
1199 allocate_struct_function (decl, false);
1200 gimple_register_cfg_hooks ();
1201 init_empty_tree_cfg ();
1202 init_tree_ssa (cfun);
1203 init_ssa_operands ();
1204 cfun->gimple_df->in_ssa_p = true;
1205 DECL_INITIAL (decl) = make_node (BLOCK);
1206
1207 DECL_SAVED_TREE (decl) = error_mark_node;
1208 cfun->curr_properties |=
1209 (PROP_gimple_lcf | PROP_gimple_leh | PROP_cfg | PROP_referenced_vars |
1210 PROP_ssa);
1211
1212 /* Create BB for body of the function and connect it properly. */
1213 bb = create_basic_block (NULL, (void *) 0, ENTRY_BLOCK_PTR);
1214 make_edge (ENTRY_BLOCK_PTR, bb, 0);
1215 make_edge (bb, EXIT_BLOCK_PTR, 0);
1216
1217 return bb;
1218 }
1219
1220 /* Adjust PTR by the constant FIXED_OFFSET, and by the vtable
1221 offset indicated by VIRTUAL_OFFSET, if that is
1222 non-null. THIS_ADJUSTING is nonzero for a this adjusting thunk and
1223 zero for a result adjusting thunk. */
1224
1225 static tree
1226 thunk_adjust (gimple_stmt_iterator * bsi,
1227 tree ptr, bool this_adjusting,
1228 HOST_WIDE_INT fixed_offset, tree virtual_offset)
1229 {
1230 gimple stmt;
1231 tree ret;
1232
1233 if (this_adjusting)
1234 {
1235 stmt = gimple_build_assign (ptr,
1236 fold_build2_loc (input_location,
1237 POINTER_PLUS_EXPR,
1238 TREE_TYPE (ptr), ptr,
1239 size_int (fixed_offset)));
1240 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1241 }
1242
1243 /* If there's a virtual offset, look up that value in the vtable and
1244 adjust the pointer again. */
1245 if (virtual_offset)
1246 {
1247 tree vtabletmp;
1248 tree vtabletmp2;
1249 tree vtabletmp3;
1250 tree offsettmp;
1251
1252 if (!vtable_entry_type)
1253 {
1254 tree vfunc_type = make_node (FUNCTION_TYPE);
1255 TREE_TYPE (vfunc_type) = integer_type_node;
1256 TYPE_ARG_TYPES (vfunc_type) = NULL_TREE;
1257 layout_type (vfunc_type);
1258
1259 vtable_entry_type = build_pointer_type (vfunc_type);
1260 }
1261
1262 vtabletmp =
1263 create_tmp_var (build_pointer_type
1264 (build_pointer_type (vtable_entry_type)), "vptr");
1265
1266 /* The vptr is always at offset zero in the object. */
1267 stmt = gimple_build_assign (vtabletmp,
1268 build1 (NOP_EXPR, TREE_TYPE (vtabletmp),
1269 ptr));
1270 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1271 mark_symbols_for_renaming (stmt);
1272 find_referenced_vars_in (stmt);
1273
1274 /* Form the vtable address. */
1275 vtabletmp2 = create_tmp_var (TREE_TYPE (TREE_TYPE (vtabletmp)),
1276 "vtableaddr");
1277 stmt = gimple_build_assign (vtabletmp2,
1278 build1 (INDIRECT_REF,
1279 TREE_TYPE (vtabletmp2), vtabletmp));
1280 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1281 mark_symbols_for_renaming (stmt);
1282 find_referenced_vars_in (stmt);
1283
1284 /* Find the entry with the vcall offset. */
1285 stmt = gimple_build_assign (vtabletmp2,
1286 fold_build2_loc (input_location,
1287 POINTER_PLUS_EXPR,
1288 TREE_TYPE (vtabletmp2),
1289 vtabletmp2,
1290 fold_convert (sizetype,
1291 virtual_offset)));
1292 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1293
1294 /* Get the offset itself. */
1295 vtabletmp3 = create_tmp_var (TREE_TYPE (TREE_TYPE (vtabletmp2)),
1296 "vcalloffset");
1297 stmt = gimple_build_assign (vtabletmp3,
1298 build1 (INDIRECT_REF,
1299 TREE_TYPE (vtabletmp3),
1300 vtabletmp2));
1301 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1302 mark_symbols_for_renaming (stmt);
1303 find_referenced_vars_in (stmt);
1304
1305 /* Cast to sizetype. */
1306 offsettmp = create_tmp_var (sizetype, "offset");
1307 stmt = gimple_build_assign (offsettmp, fold_convert (sizetype, vtabletmp3));
1308 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1309 mark_symbols_for_renaming (stmt);
1310 find_referenced_vars_in (stmt);
1311
1312 /* Adjust the `this' pointer. */
1313 ptr = fold_build2_loc (input_location,
1314 POINTER_PLUS_EXPR, TREE_TYPE (ptr), ptr,
1315 offsettmp);
1316 }
1317
1318 if (!this_adjusting)
1319 /* Adjust the pointer by the constant. */
1320 {
1321 tree ptrtmp;
1322
1323 if (TREE_CODE (ptr) == VAR_DECL)
1324 ptrtmp = ptr;
1325 else
1326 {
1327 ptrtmp = create_tmp_var (TREE_TYPE (ptr), "ptr");
1328 stmt = gimple_build_assign (ptrtmp, ptr);
1329 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1330 mark_symbols_for_renaming (stmt);
1331 find_referenced_vars_in (stmt);
1332 }
1333 ptr = fold_build2_loc (input_location,
1334 POINTER_PLUS_EXPR, TREE_TYPE (ptrtmp), ptrtmp,
1335 size_int (fixed_offset));
1336 }
1337
1338 /* Emit the statement and gimplify the adjustment expression. */
1339 ret = create_tmp_var (TREE_TYPE (ptr), "adjusted_this");
1340 stmt = gimple_build_assign (ret, ptr);
1341 mark_symbols_for_renaming (stmt);
1342 find_referenced_vars_in (stmt);
1343 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1344
1345 return ret;
1346 }
1347
1348 /* Produce assembler for thunk NODE. */
1349
1350 static void
1351 assemble_thunk (struct cgraph_node *node)
1352 {
1353 bool this_adjusting = node->thunk.this_adjusting;
1354 HOST_WIDE_INT fixed_offset = node->thunk.fixed_offset;
1355 HOST_WIDE_INT virtual_value = node->thunk.virtual_value;
1356 tree virtual_offset = NULL;
1357 tree alias = node->thunk.alias;
1358 tree thunk_fndecl = node->decl;
1359 tree a = DECL_ARGUMENTS (thunk_fndecl);
1360
1361 current_function_decl = thunk_fndecl;
1362
1363 if (this_adjusting
1364 && targetm.asm_out.can_output_mi_thunk (thunk_fndecl, fixed_offset,
1365 virtual_value, alias))
1366 {
1367 const char *fnname;
1368 tree fn_block;
1369
1370 DECL_RESULT (thunk_fndecl)
1371 = build_decl (DECL_SOURCE_LOCATION (thunk_fndecl),
1372 RESULT_DECL, 0, integer_type_node);
1373 fnname = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (thunk_fndecl));
1374
1375 /* The back end expects DECL_INITIAL to contain a BLOCK, so we
1376 create one. */
1377 fn_block = make_node (BLOCK);
1378 BLOCK_VARS (fn_block) = a;
1379 DECL_INITIAL (thunk_fndecl) = fn_block;
1380 init_function_start (thunk_fndecl);
1381 cfun->is_thunk = 1;
1382 assemble_start_function (thunk_fndecl, fnname);
1383
1384 targetm.asm_out.output_mi_thunk (asm_out_file, thunk_fndecl,
1385 fixed_offset, virtual_value, alias);
1386
1387 assemble_end_function (thunk_fndecl, fnname);
1388 init_insn_lengths ();
1389 free_after_compilation (cfun);
1390 set_cfun (NULL);
1391 TREE_ASM_WRITTEN (thunk_fndecl) = 1;
1392 }
1393 else
1394 {
1395 tree restype;
1396 basic_block bb, then_bb, else_bb, return_bb;
1397 gimple_stmt_iterator bsi;
1398 int nargs = 0;
1399 tree arg;
1400 int i;
1401 tree resdecl;
1402 tree restmp = NULL;
1403 VEC(tree, heap) *vargs;
1404
1405 gimple call;
1406 gimple ret;
1407
1408 DECL_IGNORED_P (thunk_fndecl) = 1;
1409 bitmap_obstack_initialize (NULL);
1410
1411 if (node->thunk.virtual_offset_p)
1412 virtual_offset = size_int (virtual_value);
1413
1414 /* Build the return declaration for the function. */
1415 restype = TREE_TYPE (TREE_TYPE (thunk_fndecl));
1416 if (DECL_RESULT (thunk_fndecl) == NULL_TREE)
1417 {
1418 resdecl = build_decl (input_location, RESULT_DECL, 0, restype);
1419 DECL_ARTIFICIAL (resdecl) = 1;
1420 DECL_IGNORED_P (resdecl) = 1;
1421 DECL_RESULT (thunk_fndecl) = resdecl;
1422 }
1423 else
1424 resdecl = DECL_RESULT (thunk_fndecl);
1425
1426 bb = then_bb = else_bb = return_bb = init_lowered_empty_function (thunk_fndecl);
1427
1428 bsi = gsi_start_bb (bb);
1429
1430 /* Build call to the function being thunked. */
1431 if (!VOID_TYPE_P (restype))
1432 {
1433 if (!is_gimple_reg_type (restype))
1434 {
1435 restmp = resdecl;
1436 cfun->local_decls = tree_cons (NULL_TREE, restmp, cfun->local_decls);
1437 BLOCK_VARS (DECL_INITIAL (current_function_decl)) = restmp;
1438 }
1439 else
1440 restmp = create_tmp_var_raw (restype, "retval");
1441 }
1442
1443 for (arg = a; arg; arg = TREE_CHAIN (arg))
1444 nargs++;
1445 vargs = VEC_alloc (tree, heap, nargs);
1446 if (this_adjusting)
1447 VEC_quick_push (tree, vargs,
1448 thunk_adjust (&bsi,
1449 a, 1, fixed_offset,
1450 virtual_offset));
1451 else
1452 VEC_quick_push (tree, vargs, a);
1453 for (i = 1, arg = TREE_CHAIN (a); i < nargs; i++, arg = TREE_CHAIN (arg))
1454 VEC_quick_push (tree, vargs, arg);
1455 call = gimple_build_call_vec (build_fold_addr_expr_loc (0, alias), vargs);
1456 VEC_free (tree, heap, vargs);
1457 gimple_call_set_cannot_inline (call, true);
1458 gimple_call_set_from_thunk (call, true);
1459 if (restmp)
1460 gimple_call_set_lhs (call, restmp);
1461 gsi_insert_after (&bsi, call, GSI_NEW_STMT);
1462 mark_symbols_for_renaming (call);
1463 find_referenced_vars_in (call);
1464 update_stmt (call);
1465
1466 if (restmp && !this_adjusting)
1467 {
1468 tree true_label = NULL_TREE, false_label = NULL_TREE;
1469
1470 if (TREE_CODE (TREE_TYPE (restmp)) == POINTER_TYPE)
1471 {
1472 gimple stmt;
1473 /* If the return type is a pointer, we need to
1474 protect against NULL. We know there will be an
1475 adjustment, because that's why we're emitting a
1476 thunk. */
1477 then_bb = create_basic_block (NULL, (void *) 0, bb);
1478 return_bb = create_basic_block (NULL, (void *) 0, then_bb);
1479 else_bb = create_basic_block (NULL, (void *) 0, else_bb);
1480 remove_edge (single_succ_edge (bb));
1481 true_label = gimple_block_label (then_bb);
1482 false_label = gimple_block_label (else_bb);
1483 stmt = gimple_build_cond (NE_EXPR, restmp,
1484 fold_convert (TREE_TYPE (restmp),
1485 integer_zero_node),
1486 NULL_TREE, NULL_TREE);
1487 gsi_insert_after (&bsi, stmt, GSI_NEW_STMT);
1488 make_edge (bb, then_bb, EDGE_TRUE_VALUE);
1489 make_edge (bb, else_bb, EDGE_FALSE_VALUE);
1490 make_edge (return_bb, EXIT_BLOCK_PTR, 0);
1491 make_edge (then_bb, return_bb, EDGE_FALLTHRU);
1492 make_edge (else_bb, return_bb, EDGE_FALLTHRU);
1493 bsi = gsi_last_bb (then_bb);
1494 }
1495
1496 restmp = thunk_adjust (&bsi, restmp, /*this_adjusting=*/0,
1497 fixed_offset, virtual_offset);
1498 if (true_label)
1499 {
1500 gimple stmt;
1501 bsi = gsi_last_bb (else_bb);
1502 stmt = gimple_build_assign (restmp, fold_convert (TREE_TYPE (restmp),
1503 integer_zero_node));
1504 gsi_insert_after (&bsi, stmt, GSI_NEW_STMT);
1505 bsi = gsi_last_bb (return_bb);
1506 }
1507 }
1508 else
1509 gimple_call_set_tail (call, true);
1510
1511 /* Build return value. */
1512 ret = gimple_build_return (restmp);
1513 gsi_insert_after (&bsi, ret, GSI_NEW_STMT);
1514
1515 delete_unreachable_blocks ();
1516 update_ssa (TODO_update_ssa);
1517
1518 cgraph_remove_same_body_alias (node);
1519 /* Since we want to emit the thunk, we explicitly mark its name as
1520 referenced. */
1521 mark_decl_referenced (thunk_fndecl);
1522 cgraph_add_new_function (thunk_fndecl, true);
1523 bitmap_obstack_release (NULL);
1524 }
1525 current_function_decl = NULL;
1526 }
1527
1528 /* Expand function specified by NODE. */
1529
1530 static void
1531 cgraph_expand_function (struct cgraph_node *node)
1532 {
1533 tree decl = node->decl;
1534
1535 /* We ought to not compile any inline clones. */
1536 gcc_assert (!node->global.inlined_to);
1537
1538 announce_function (decl);
1539 node->process = 0;
1540
1541 gcc_assert (node->lowered);
1542
1543 /* Generate RTL for the body of DECL. */
1544 tree_rest_of_compilation (decl);
1545
1546 /* Make sure that BE didn't give up on compiling. */
1547 gcc_assert (TREE_ASM_WRITTEN (decl));
1548 current_function_decl = NULL;
1549 if (node->same_body)
1550 {
1551 struct cgraph_node *alias, *next;
1552 bool saved_alias = node->alias;
1553 for (alias = node->same_body;
1554 alias && alias->next; alias = alias->next)
1555 ;
1556 /* Walk aliases in the order they were created; it is possible that
1557 thunks reffers to the aliases made earlier. */
1558 for (; alias; alias = next)
1559 {
1560 next = alias->previous;
1561 if (!alias->thunk.thunk_p)
1562 assemble_alias (alias->decl,
1563 DECL_ASSEMBLER_NAME (alias->thunk.alias));
1564 else
1565 assemble_thunk (alias);
1566 }
1567 node->alias = saved_alias;
1568 }
1569 gcc_assert (!cgraph_preserve_function_body_p (decl));
1570 cgraph_release_function_body (node);
1571 /* Eliminate all call edges. This is important so the GIMPLE_CALL no longer
1572 points to the dead function body. */
1573 cgraph_node_remove_callees (node);
1574
1575 cgraph_function_flags_ready = true;
1576 }
1577
1578 /* Return true when CALLER_DECL should be inlined into CALLEE_DECL. */
1579
1580 bool
1581 cgraph_inline_p (struct cgraph_edge *e, cgraph_inline_failed_t *reason)
1582 {
1583 *reason = e->inline_failed;
1584 return !e->inline_failed;
1585 }
1586
1587
1588
1589 /* Expand all functions that must be output.
1590
1591 Attempt to topologically sort the nodes so function is output when
1592 all called functions are already assembled to allow data to be
1593 propagated across the callgraph. Use a stack to get smaller distance
1594 between a function and its callees (later we may choose to use a more
1595 sophisticated algorithm for function reordering; we will likely want
1596 to use subsections to make the output functions appear in top-down
1597 order). */
1598
1599 static void
1600 cgraph_expand_all_functions (void)
1601 {
1602 struct cgraph_node *node;
1603 struct cgraph_node **order = XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
1604 int order_pos, new_order_pos = 0;
1605 int i;
1606
1607 order_pos = cgraph_postorder (order);
1608 gcc_assert (order_pos == cgraph_n_nodes);
1609
1610 /* Garbage collector may remove inline clones we eliminate during
1611 optimization. So we must be sure to not reference them. */
1612 for (i = 0; i < order_pos; i++)
1613 if (order[i]->process)
1614 order[new_order_pos++] = order[i];
1615
1616 for (i = new_order_pos - 1; i >= 0; i--)
1617 {
1618 node = order[i];
1619 if (node->process)
1620 {
1621 gcc_assert (node->reachable);
1622 node->process = 0;
1623 cgraph_expand_function (node);
1624 }
1625 }
1626 cgraph_process_new_functions ();
1627
1628 free (order);
1629
1630 }
1631
/* Kind of entity stored in one slot of the table used to sort nodes by
   their cgraph order number.  ORDER_UNDEFINED must stay zero so that a
   zero-filled table consists of empty slots.  */

enum cgraph_order_sort_kind
{
  ORDER_UNDEFINED = 0,  /* Empty slot.  */
  ORDER_FUNCTION = 1,   /* Slot holds a function (cgraph node).  */
  ORDER_VAR = 2,        /* Slot holds a variable (varpool node).  */
  ORDER_ASM = 3         /* Slot holds a toplevel asm statement.  */
};
1641
1642 struct cgraph_order_sort
1643 {
1644 enum cgraph_order_sort_kind kind;
1645 union
1646 {
1647 struct cgraph_node *f;
1648 struct varpool_node *v;
1649 struct cgraph_asm_node *a;
1650 } u;
1651 };
1652
1653 /* Output all functions, variables, and asm statements in the order
1654 according to their order fields, which is the order in which they
1655 appeared in the file. This implements -fno-toplevel-reorder. In
1656 this mode we may output functions and variables which don't really
1657 need to be output. */
1658
1659 static void
1660 cgraph_output_in_order (void)
1661 {
1662 int max;
1663 size_t size;
1664 struct cgraph_order_sort *nodes;
1665 int i;
1666 struct cgraph_node *pf;
1667 struct varpool_node *pv;
1668 struct cgraph_asm_node *pa;
1669
1670 max = cgraph_order;
1671 size = max * sizeof (struct cgraph_order_sort);
1672 nodes = (struct cgraph_order_sort *) alloca (size);
1673 memset (nodes, 0, size);
1674
1675 varpool_analyze_pending_decls ();
1676
1677 for (pf = cgraph_nodes; pf; pf = pf->next)
1678 {
1679 if (pf->process)
1680 {
1681 i = pf->order;
1682 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1683 nodes[i].kind = ORDER_FUNCTION;
1684 nodes[i].u.f = pf;
1685 }
1686 }
1687
1688 for (pv = varpool_nodes_queue; pv; pv = pv->next_needed)
1689 {
1690 i = pv->order;
1691 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1692 nodes[i].kind = ORDER_VAR;
1693 nodes[i].u.v = pv;
1694 }
1695
1696 for (pa = cgraph_asm_nodes; pa; pa = pa->next)
1697 {
1698 i = pa->order;
1699 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1700 nodes[i].kind = ORDER_ASM;
1701 nodes[i].u.a = pa;
1702 }
1703
1704 /* In toplevel reorder mode we output all statics; mark them as needed. */
1705 for (i = 0; i < max; ++i)
1706 {
1707 if (nodes[i].kind == ORDER_VAR)
1708 {
1709 varpool_mark_needed_node (nodes[i].u.v);
1710 }
1711 }
1712 varpool_empty_needed_queue ();
1713
1714 for (i = 0; i < max; ++i)
1715 {
1716 switch (nodes[i].kind)
1717 {
1718 case ORDER_FUNCTION:
1719 nodes[i].u.f->process = 0;
1720 cgraph_expand_function (nodes[i].u.f);
1721 break;
1722
1723 case ORDER_VAR:
1724 varpool_assemble_decl (nodes[i].u.v);
1725 break;
1726
1727 case ORDER_ASM:
1728 assemble_asm (nodes[i].u.a->asm_str);
1729 break;
1730
1731 case ORDER_UNDEFINED:
1732 break;
1733
1734 default:
1735 gcc_unreachable ();
1736 }
1737 }
1738
1739 cgraph_asm_nodes = NULL;
1740 }
1741
1742 /* Return true when function body of DECL still needs to be kept around
1743 for later re-use. */
1744 bool
1745 cgraph_preserve_function_body_p (tree decl)
1746 {
1747 struct cgraph_node *node;
1748
1749 gcc_assert (cgraph_global_info_ready);
1750 /* Look if there is any clone around. */
1751 node = cgraph_node (decl);
1752 if (node->clones)
1753 return true;
1754 return false;
1755 }
1756
1757 static void
1758 ipa_passes (void)
1759 {
1760 set_cfun (NULL);
1761 current_function_decl = NULL;
1762 gimple_register_cfg_hooks ();
1763 bitmap_obstack_initialize (NULL);
1764
1765 invoke_plugin_callbacks (PLUGIN_ALL_IPA_PASSES_START, NULL);
1766
1767 if (!in_lto_p)
1768 execute_ipa_pass_list (all_small_ipa_passes);
1769
1770 /* If pass_all_early_optimizations was not scheduled, the state of
1771 the cgraph will not be properly updated. Update it now. */
1772 if (cgraph_state < CGRAPH_STATE_IPA_SSA)
1773 cgraph_state = CGRAPH_STATE_IPA_SSA;
1774
1775 if (!in_lto_p)
1776 {
1777 /* Generate coverage variables and constructors. */
1778 coverage_finish ();
1779
1780 /* Process new functions added. */
1781 set_cfun (NULL);
1782 current_function_decl = NULL;
1783 cgraph_process_new_functions ();
1784
1785 execute_ipa_summary_passes
1786 ((struct ipa_opt_pass_d *) all_regular_ipa_passes);
1787 }
1788 execute_ipa_summary_passes ((struct ipa_opt_pass_d *) all_lto_gen_passes);
1789
1790 if (!in_lto_p)
1791 ipa_write_summaries ();
1792
1793 if (!flag_ltrans)
1794 execute_ipa_pass_list (all_regular_ipa_passes);
1795 invoke_plugin_callbacks (PLUGIN_ALL_IPA_PASSES_END, NULL);
1796
1797 bitmap_obstack_release (NULL);
1798 }
1799
1800
1801 /* Perform simple optimizations based on callgraph. */
1802
1803 void
1804 cgraph_optimize (void)
1805 {
1806 if (errorcount || sorrycount)
1807 return;
1808
1809 #ifdef ENABLE_CHECKING
1810 verify_cgraph ();
1811 #endif
1812
1813 /* Frontend may output common variables after the unit has been finalized.
1814 It is safe to deal with them here as they are always zero initialized. */
1815 varpool_analyze_pending_decls ();
1816
1817 timevar_push (TV_CGRAPHOPT);
1818 if (pre_ipa_mem_report)
1819 {
1820 fprintf (stderr, "Memory consumption before IPA\n");
1821 dump_memory_report (false);
1822 }
1823 if (!quiet_flag)
1824 fprintf (stderr, "Performing interprocedural optimizations\n");
1825 cgraph_state = CGRAPH_STATE_IPA;
1826
1827 /* Don't run the IPA passes if there was any error or sorry messages. */
1828 if (errorcount == 0 && sorrycount == 0)
1829 ipa_passes ();
1830
1831 /* Do nothing else if any IPA pass found errors. */
1832 if (errorcount || sorrycount)
1833 {
1834 timevar_pop (TV_CGRAPHOPT);
1835 return;
1836 }
1837
1838 /* This pass remove bodies of extern inline functions we never inlined.
1839 Do this later so other IPA passes see what is really going on. */
1840 cgraph_remove_unreachable_nodes (false, dump_file);
1841 cgraph_global_info_ready = true;
1842 if (cgraph_dump_file)
1843 {
1844 fprintf (cgraph_dump_file, "Optimized ");
1845 dump_cgraph (cgraph_dump_file);
1846 dump_varpool (cgraph_dump_file);
1847 }
1848 if (post_ipa_mem_report)
1849 {
1850 fprintf (stderr, "Memory consumption after IPA\n");
1851 dump_memory_report (false);
1852 }
1853 timevar_pop (TV_CGRAPHOPT);
1854
1855 /* Output everything. */
1856 (*debug_hooks->assembly_start) ();
1857 if (!quiet_flag)
1858 fprintf (stderr, "Assembling functions:\n");
1859 #ifdef ENABLE_CHECKING
1860 verify_cgraph ();
1861 #endif
1862
1863 cgraph_materialize_all_clones ();
1864 cgraph_mark_functions_to_output ();
1865
1866 cgraph_state = CGRAPH_STATE_EXPANSION;
1867 if (!flag_toplevel_reorder)
1868 cgraph_output_in_order ();
1869 else
1870 {
1871 cgraph_output_pending_asms ();
1872
1873 cgraph_expand_all_functions ();
1874 varpool_remove_unreferenced_decls ();
1875
1876 varpool_assemble_pending_decls ();
1877 }
1878 cgraph_process_new_functions ();
1879 cgraph_state = CGRAPH_STATE_FINISHED;
1880
1881 if (cgraph_dump_file)
1882 {
1883 fprintf (cgraph_dump_file, "\nFinal ");
1884 dump_cgraph (cgraph_dump_file);
1885 }
1886 #ifdef ENABLE_CHECKING
1887 verify_cgraph ();
1888 /* Double check that all inline clones are gone and that all
1889 function bodies have been released from memory. */
1890 if (!(sorrycount || errorcount))
1891 {
1892 struct cgraph_node *node;
1893 bool error_found = false;
1894
1895 for (node = cgraph_nodes; node; node = node->next)
1896 if (node->analyzed
1897 && (node->global.inlined_to
1898 || gimple_has_body_p (node->decl)))
1899 {
1900 error_found = true;
1901 dump_cgraph_node (stderr, node);
1902 }
1903 if (error_found)
1904 internal_error ("nodes with unreleased memory found");
1905 }
1906 #endif
1907 }
1908
1909
1910 /* Generate and emit a static constructor or destructor. WHICH must
1911 be one of 'I' (for a constructor) or 'D' (for a destructor). BODY
1912 is a STATEMENT_LIST containing GENERIC statements. PRIORITY is the
1913 initialization priority for this constructor or destructor. */
1914
1915 void
1916 cgraph_build_static_cdtor (char which, tree body, int priority)
1917 {
1918 static int counter = 0;
1919 char which_buf[16];
1920 tree decl, name, resdecl;
1921
1922 /* The priority is encoded in the constructor or destructor name.
1923 collect2 will sort the names and arrange that they are called at
1924 program startup. */
1925 sprintf (which_buf, "%c_%.5d_%d", which, priority, counter++);
1926 name = get_file_function_name (which_buf);
1927
1928 decl = build_decl (input_location, FUNCTION_DECL, name,
1929 build_function_type (void_type_node, void_list_node));
1930 current_function_decl = decl;
1931
1932 resdecl = build_decl (input_location,
1933 RESULT_DECL, NULL_TREE, void_type_node);
1934 DECL_ARTIFICIAL (resdecl) = 1;
1935 DECL_RESULT (decl) = resdecl;
1936 DECL_CONTEXT (resdecl) = decl;
1937
1938 allocate_struct_function (decl, false);
1939
1940 TREE_STATIC (decl) = 1;
1941 TREE_USED (decl) = 1;
1942 DECL_ARTIFICIAL (decl) = 1;
1943 DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (decl) = 1;
1944 DECL_SAVED_TREE (decl) = body;
1945 TREE_PUBLIC (decl) = ! targetm.have_ctors_dtors;
1946 DECL_UNINLINABLE (decl) = 1;
1947
1948 DECL_INITIAL (decl) = make_node (BLOCK);
1949 TREE_USED (DECL_INITIAL (decl)) = 1;
1950
1951 DECL_SOURCE_LOCATION (decl) = input_location;
1952 cfun->function_end_locus = input_location;
1953
1954 switch (which)
1955 {
1956 case 'I':
1957 DECL_STATIC_CONSTRUCTOR (decl) = 1;
1958 decl_init_priority_insert (decl, priority);
1959 break;
1960 case 'D':
1961 DECL_STATIC_DESTRUCTOR (decl) = 1;
1962 decl_fini_priority_insert (decl, priority);
1963 break;
1964 default:
1965 gcc_unreachable ();
1966 }
1967
1968 gimplify_function_tree (decl);
1969
1970 cgraph_add_new_function (decl, false);
1971 cgraph_mark_needed_node (cgraph_node (decl));
1972 set_cfun (NULL);
1973 }
1974
1975 void
1976 init_cgraph (void)
1977 {
1978 cgraph_dump_file = dump_begin (TDI_cgraph, NULL);
1979 }
1980
1981 /* The edges representing the callers of the NEW_VERSION node were
1982 fixed by cgraph_function_versioning (), now the call_expr in their
1983 respective tree code should be updated to call the NEW_VERSION. */
1984
1985 static void
1986 update_call_expr (struct cgraph_node *new_version)
1987 {
1988 struct cgraph_edge *e;
1989
1990 gcc_assert (new_version);
1991
1992 /* Update the call expr on the edges to call the new version. */
1993 for (e = new_version->callers; e; e = e->next_caller)
1994 {
1995 struct function *inner_function = DECL_STRUCT_FUNCTION (e->caller->decl);
1996 gimple_call_set_fndecl (e->call_stmt, new_version->decl);
1997 maybe_clean_eh_stmt_fn (inner_function, e->call_stmt);
1998 }
1999 }
2000
2001
2002 /* Create a new cgraph node which is the new version of
2003 OLD_VERSION node. REDIRECT_CALLERS holds the callers
2004 edges which should be redirected to point to
2005 NEW_VERSION. ALL the callees edges of OLD_VERSION
2006 are cloned to the new version node. Return the new
2007 version node. */
2008
2009 static struct cgraph_node *
2010 cgraph_copy_node_for_versioning (struct cgraph_node *old_version,
2011 tree new_decl,
2012 VEC(cgraph_edge_p,heap) *redirect_callers)
2013 {
2014 struct cgraph_node *new_version;
2015 struct cgraph_edge *e, *new_e;
2016 struct cgraph_edge *next_callee;
2017 unsigned i;
2018
2019 gcc_assert (old_version);
2020
2021 new_version = cgraph_node (new_decl);
2022
2023 new_version->analyzed = true;
2024 new_version->local = old_version->local;
2025 new_version->global = old_version->global;
2026 new_version->rtl = new_version->rtl;
2027 new_version->reachable = true;
2028 new_version->count = old_version->count;
2029
2030 /* Clone the old node callees. Recursive calls are
2031 also cloned. */
2032 for (e = old_version->callees;e; e=e->next_callee)
2033 {
2034 new_e = cgraph_clone_edge (e, new_version, e->call_stmt,
2035 e->lto_stmt_uid, 0, e->frequency,
2036 e->loop_nest, true);
2037 new_e->count = e->count;
2038 }
2039 /* Fix recursive calls.
2040 If OLD_VERSION has a recursive call after the
2041 previous edge cloning, the new version will have an edge
2042 pointing to the old version, which is wrong;
2043 Redirect it to point to the new version. */
2044 for (e = new_version->callees ; e; e = next_callee)
2045 {
2046 next_callee = e->next_callee;
2047 if (e->callee == old_version)
2048 cgraph_redirect_edge_callee (e, new_version);
2049
2050 if (!next_callee)
2051 break;
2052 }
2053 for (i = 0; VEC_iterate (cgraph_edge_p, redirect_callers, i, e); i++)
2054 {
2055 /* Redirect calls to the old version node to point to its new
2056 version. */
2057 cgraph_redirect_edge_callee (e, new_version);
2058 }
2059
2060 return new_version;
2061 }
2062
2063 /* Perform function versioning.
2064 Function versioning includes copying of the tree and
2065 a callgraph update (creating a new cgraph node and updating
2066 its callees and callers).
2067
2068 REDIRECT_CALLERS varray includes the edges to be redirected
2069 to the new version.
2070
2071 TREE_MAP is a mapping of tree nodes we want to replace with
2072 new ones (according to results of prior analysis).
2073 OLD_VERSION_NODE is the node that is versioned.
2074 It returns the new version's cgraph node.
2075 ARGS_TO_SKIP lists arguments to be omitted from functions
2076 */
2077
2078 struct cgraph_node *
2079 cgraph_function_versioning (struct cgraph_node *old_version_node,
2080 VEC(cgraph_edge_p,heap) *redirect_callers,
2081 VEC (ipa_replace_map_p,gc)* tree_map,
2082 bitmap args_to_skip)
2083 {
2084 tree old_decl = old_version_node->decl;
2085 struct cgraph_node *new_version_node = NULL;
2086 tree new_decl;
2087
2088 if (!tree_versionable_function_p (old_decl))
2089 return NULL;
2090
2091 /* Make a new FUNCTION_DECL tree node for the
2092 new version. */
2093 if (!args_to_skip)
2094 new_decl = copy_node (old_decl);
2095 else
2096 new_decl = build_function_decl_skip_args (old_decl, args_to_skip);
2097
2098 /* Create the new version's call-graph node.
2099 and update the edges of the new node. */
2100 new_version_node =
2101 cgraph_copy_node_for_versioning (old_version_node, new_decl,
2102 redirect_callers);
2103
2104 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2105 tree_function_versioning (old_decl, new_decl, tree_map, false, args_to_skip);
2106
2107 /* Update the new version's properties.
2108 Make The new version visible only within this translation unit. Make sure
2109 that is not weak also.
2110 ??? We cannot use COMDAT linkage because there is no
2111 ABI support for this. */
2112 DECL_EXTERNAL (new_version_node->decl) = 0;
2113 DECL_COMDAT_GROUP (new_version_node->decl) = NULL_TREE;
2114 TREE_PUBLIC (new_version_node->decl) = 0;
2115 DECL_COMDAT (new_version_node->decl) = 0;
2116 DECL_WEAK (new_version_node->decl) = 0;
2117 DECL_VIRTUAL_P (new_version_node->decl) = 0;
2118 new_version_node->local.externally_visible = 0;
2119 new_version_node->local.local = 1;
2120 new_version_node->lowered = true;
2121
2122 /* Update the call_expr on the edges to call the new version node. */
2123 update_call_expr (new_version_node);
2124
2125 cgraph_call_function_insertion_hooks (new_version_node);
2126 return new_version_node;
2127 }
2128
2129 /* Produce separate function body for inline clones so the offline copy can be
2130 modified without affecting them. */
2131 struct cgraph_node *
2132 save_inline_function_body (struct cgraph_node *node)
2133 {
2134 struct cgraph_node *first_clone, *n;
2135
2136 gcc_assert (node == cgraph_node (node->decl));
2137
2138 cgraph_lower_function (node);
2139
2140 first_clone = node->clones;
2141
2142 first_clone->decl = copy_node (node->decl);
2143 cgraph_insert_node_to_hashtable (first_clone);
2144 gcc_assert (first_clone == cgraph_node (first_clone->decl));
2145 if (first_clone->next_sibling_clone)
2146 {
2147 for (n = first_clone->next_sibling_clone; n->next_sibling_clone; n = n->next_sibling_clone)
2148 n->clone_of = first_clone;
2149 n->clone_of = first_clone;
2150 n->next_sibling_clone = first_clone->clones;
2151 if (first_clone->clones)
2152 first_clone->clones->prev_sibling_clone = n;
2153 first_clone->clones = first_clone->next_sibling_clone;
2154 first_clone->next_sibling_clone->prev_sibling_clone = NULL;
2155 first_clone->next_sibling_clone = NULL;
2156 gcc_assert (!first_clone->prev_sibling_clone);
2157 }
2158 first_clone->clone_of = NULL;
2159 node->clones = NULL;
2160
2161 if (first_clone->clones)
2162 for (n = first_clone->clones; n != first_clone;)
2163 {
2164 gcc_assert (n->decl == node->decl);
2165 n->decl = first_clone->decl;
2166 if (n->clones)
2167 n = n->clones;
2168 else if (n->next_sibling_clone)
2169 n = n->next_sibling_clone;
2170 else
2171 {
2172 while (n != first_clone && !n->next_sibling_clone)
2173 n = n->clone_of;
2174 if (n != first_clone)
2175 n = n->next_sibling_clone;
2176 }
2177 }
2178
2179 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2180 tree_function_versioning (node->decl, first_clone->decl, NULL, true, NULL);
2181
2182 DECL_EXTERNAL (first_clone->decl) = 0;
2183 DECL_COMDAT_GROUP (first_clone->decl) = NULL_TREE;
2184 TREE_PUBLIC (first_clone->decl) = 0;
2185 DECL_COMDAT (first_clone->decl) = 0;
2186 VEC_free (ipa_opt_pass, heap,
2187 first_clone->ipa_transforms_to_apply);
2188 first_clone->ipa_transforms_to_apply = NULL;
2189
2190 #ifdef ENABLE_CHECKING
2191 verify_cgraph_node (first_clone);
2192 #endif
2193 return first_clone;
2194 }
2195
2196 /* Given virtual clone, turn it into actual clone. */
2197 static void
2198 cgraph_materialize_clone (struct cgraph_node *node)
2199 {
2200 bitmap_obstack_initialize (NULL);
2201 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2202 tree_function_versioning (node->clone_of->decl, node->decl,
2203 node->clone.tree_map, true,
2204 node->clone.args_to_skip);
2205 if (cgraph_dump_file)
2206 {
2207 dump_function_to_file (node->clone_of->decl, cgraph_dump_file, dump_flags);
2208 dump_function_to_file (node->decl, cgraph_dump_file, dump_flags);
2209 }
2210
2211 /* Function is no longer clone. */
2212 if (node->next_sibling_clone)
2213 node->next_sibling_clone->prev_sibling_clone = node->prev_sibling_clone;
2214 if (node->prev_sibling_clone)
2215 node->prev_sibling_clone->next_sibling_clone = node->next_sibling_clone;
2216 else
2217 node->clone_of->clones = node->next_sibling_clone;
2218 node->next_sibling_clone = NULL;
2219 node->prev_sibling_clone = NULL;
2220 if (!node->clone_of->analyzed && !node->clone_of->clones)
2221 cgraph_remove_node (node->clone_of);
2222 node->clone_of = NULL;
2223 bitmap_obstack_release (NULL);
2224 }
2225
2226 /* Once all functions from compilation unit are in memory, produce all clones
2227 and update all calls.
2228 We might also do this on demand if we don't want to bring all functions to
2229 memory prior compilation, but current WHOPR implementation does that and it is
2230 is bit easier to keep everything right in this order. */
2231 void
2232 cgraph_materialize_all_clones (void)
2233 {
2234 struct cgraph_node *node;
2235 bool stabilized = false;
2236
2237 if (cgraph_dump_file)
2238 fprintf (cgraph_dump_file, "Materializing clones\n");
2239 #ifdef ENABLE_CHECKING
2240 verify_cgraph ();
2241 #endif
2242
2243 /* We can also do topological order, but number of iterations should be
2244 bounded by number of IPA passes since single IPA pass is probably not
2245 going to create clones of clones it created itself. */
2246 while (!stabilized)
2247 {
2248 stabilized = true;
2249 for (node = cgraph_nodes; node; node = node->next)
2250 {
2251 if (node->clone_of && node->decl != node->clone_of->decl
2252 && !gimple_has_body_p (node->decl))
2253 {
2254 if (gimple_has_body_p (node->clone_of->decl))
2255 {
2256 if (cgraph_dump_file)
2257 {
2258 fprintf (cgraph_dump_file, "clonning %s to %s\n",
2259 cgraph_node_name (node->clone_of),
2260 cgraph_node_name (node));
2261 if (node->clone.tree_map)
2262 {
2263 unsigned int i;
2264 fprintf (cgraph_dump_file, " replace map: ");
2265 for (i = 0; i < VEC_length (ipa_replace_map_p,
2266 node->clone.tree_map);
2267 i++)
2268 {
2269 struct ipa_replace_map *replace_info;
2270 replace_info = VEC_index (ipa_replace_map_p,
2271 node->clone.tree_map,
2272 i);
2273 print_generic_expr (cgraph_dump_file, replace_info->old_tree, 0);
2274 fprintf (cgraph_dump_file, " -> ");
2275 print_generic_expr (cgraph_dump_file, replace_info->new_tree, 0);
2276 fprintf (cgraph_dump_file, "%s%s;",
2277 replace_info->replace_p ? "(replace)":"",
2278 replace_info->ref_p ? "(ref)":"");
2279 }
2280 fprintf (cgraph_dump_file, "\n");
2281 }
2282 if (node->clone.args_to_skip)
2283 {
2284 fprintf (cgraph_dump_file, " args_to_skip: ");
2285 dump_bitmap (cgraph_dump_file, node->clone.args_to_skip);
2286 }
2287 if (node->clone.args_to_skip)
2288 {
2289 fprintf (cgraph_dump_file, " combined_args_to_skip:");
2290 dump_bitmap (cgraph_dump_file, node->clone.combined_args_to_skip);
2291 }
2292 }
2293 cgraph_materialize_clone (node);
2294 }
2295 else
2296 stabilized = false;
2297 }
2298 }
2299 }
2300 for (node = cgraph_nodes; node; node = node->next)
2301 if (!node->analyzed && node->callees)
2302 cgraph_node_remove_callees (node);
2303 if (cgraph_dump_file)
2304 fprintf (cgraph_dump_file, "Updating call sites\n");
2305 for (node = cgraph_nodes; node; node = node->next)
2306 if (node->analyzed && gimple_has_body_p (node->decl)
2307 && (!node->clone_of || node->clone_of->decl != node->decl))
2308 {
2309 struct cgraph_edge *e;
2310
2311 current_function_decl = node->decl;
2312 push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2313 for (e = node->callees; e; e = e->next_callee)
2314 {
2315 tree decl = gimple_call_fndecl (e->call_stmt);
2316 /* When function gets inlined, indirect inlining might've invented
2317 new edge for orginally indirect stmt. Since we are not
2318 preserving clones in the original form, we must not update here
2319 since other inline clones don't need to contain call to the same
2320 call. Inliner will do the substitution for us later. */
2321 if (decl && decl != e->callee->decl)
2322 {
2323 gimple new_stmt;
2324 gimple_stmt_iterator gsi;
2325
2326 if (cgraph_get_node (decl) == cgraph_get_node (e->callee->decl))
2327 /* Don't update call from same body alias to the real function. */
2328 continue;
2329
2330 if (cgraph_dump_file)
2331 {
2332 fprintf (cgraph_dump_file, "updating call of %s in %s:",
2333 cgraph_node_name (node),
2334 cgraph_node_name (e->callee));
2335 print_gimple_stmt (cgraph_dump_file, e->call_stmt, 0, dump_flags);
2336 }
2337
2338 if (e->callee->clone.combined_args_to_skip)
2339 new_stmt = gimple_call_copy_skip_args (e->call_stmt,
2340 e->callee->clone.combined_args_to_skip);
2341 else
2342 new_stmt = e->call_stmt;
2343 if (gimple_vdef (new_stmt)
2344 && TREE_CODE (gimple_vdef (new_stmt)) == SSA_NAME)
2345 SSA_NAME_DEF_STMT (gimple_vdef (new_stmt)) = new_stmt;
2346 gimple_call_set_fndecl (new_stmt, e->callee->decl);
2347
2348 gsi = gsi_for_stmt (e->call_stmt);
2349 gsi_replace (&gsi, new_stmt, true);
2350
2351 /* Update EH information too, just in case. */
2352 maybe_clean_or_replace_eh_stmt (e->call_stmt, new_stmt);
2353
2354 cgraph_set_call_stmt_including_clones (node, e->call_stmt, new_stmt);
2355
2356 if (cgraph_dump_file)
2357 {
2358 fprintf (cgraph_dump_file, " updated to:");
2359 print_gimple_stmt (cgraph_dump_file, e->call_stmt, 0, dump_flags);
2360 }
2361 }
2362 }
2363 pop_cfun ();
2364 current_function_decl = NULL;
2365 #ifdef ENABLE_CHECKING
2366 verify_cgraph_node (node);
2367 #endif
2368 }
2369 #ifdef ENABLE_CHECKING
2370 verify_cgraph ();
2371 #endif
2372 cgraph_remove_unreachable_nodes (false, cgraph_dump_file);
2373 }
2374
2375 #include "gt-cgraphunit.h"