gcc/ipa-inline-analysis.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003, 2004, 2007, 2008, 2009, 2010, 2011
   3    Free Software Foundation, Inc.
   4    Contributed by Jan Hubicka
   5
   6 This file is part of GCC.
   7
   8 GCC is free software; you can redistribute it and/or modify it under
   9 the terms of the GNU General Public License as published by the Free
  10 Software Foundation; either version 3, or (at your option) any later
  11 version.
  12
  13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  16 for more details.
  17
  18 You should have received a copy of the GNU General Public License
  19 along with GCC; see the file COPYING3.  If not see
  20 <http://www.gnu.org/licenses/>.  */
  21
  22 /* Analysis used by the inliner and other passes limiting code size growth.
  23
  24    We estimate for each function
  25      - function body size
  26      - average function execution time
  27      - inlining size benefit (that is how much of function body size
  28        and its call sequence is expected to disappear by inlining)
  29      - inlining time benefit
  30      - function frame size
  31    For each call
  32      - call statement size and time
  33
  34    inlinie_summary datastructures store above information locally (i.e.
  35    parameters of the function itself) and globally (i.e. parameters of
  36    the function created by applying all the inline decisions already
  37    present in the callgraph).
  38
  39    We provide accestor to the inline_summary datastructure and
  40    basic logic updating the parameters when inlining is performed.
  41
  42    The summaries are context sensitive.  Context means
  43      1) partial assignment of known constant values of operands
  44      2) whether function is inlined into the call or not.
  45    It is easy to add more variants.  To represent function size and time
  46    that depends on context (i.e. it is known to be optimized away when
  47    context is known either by inlining or from IP-CP and clonning),
  48    we use predicates. Predicates are logical formulas in
  49    conjunctive-disjunctive form consisting of clauses. Clauses are bitmaps
  50    specifying what conditions must be true. Conditions are simple test
  51    of the form described above.
  52
  53    In order to make predicate (possibly) true, all of its clauses must
  54    be (possibly) true. To make clause (possibly) true, one of conditions
  55    it mentions must be (possibly) true.  There are fixed bounds on
  56    number of clauses and conditions and all the manipulation functions
  57    are conservative in positive direction. I.e. we may lose precision
  58    by thinking that predicate may be true even when it is not.
  59
  60    estimate_edge_size and estimate_edge_growth can be used to query
  61    function size/time in the given context.  inline_merge_summary merges
  62    properties of caller and callee after inlining.
  63
  64    Finally pass_inline_parameters is exported.  This is used to drive
  65    computation of function parameters used by the early inliner. IPA
  66    inlined performs analysis via its analyze_function method. */
  67
  68 #include "config.h"
  69 #include "system.h"
  70 #include "coretypes.h"
  71 #include "tm.h"
  72 #include "tree.h"
  73 #include "tree-inline.h"
  74 #include "langhooks.h"
  75 #include "flags.h"
  76 #include "cgraph.h"
  77 #include "diagnostic.h"
  78 #include "gimple-pretty-print.h"
  79 #include "timevar.h"
  80 #include "params.h"
  81 #include "tree-pass.h"
  82 #include "coverage.h"
  83 #include "ggc.h"
  84 #include "tree-flow.h"
  85 #include "ipa-prop.h"
  86 #include "lto-streamer.h"
  87 #include "ipa-inline.h"
  88 #include "alloc-pool.h"
  89
  90 /* Estimate runtime of function can easilly run into huge numbers with many
  91    nested loops.  Be sure we can compute time * INLINE_SIZE_SCALE in integer.
  92    For anything larger we use gcov_type.  */
  93 #define MAX_TIME 1000000
  94
  95 /* Number of bits in integer, but we really want to be stable across different
  96    hosts.  */
  97 #define NUM_CONDITIONS 32
  98
  99 enum predicate_conditions
 100 {
 101   predicate_false_condition = 0,
 102   predicate_not_inlined_condition = 1,
 103   predicate_first_dynamic_condition = 2
 104 };
 105
 106 /* Special condition code we use to represent test that operand is compile time
 107    constant.  */
 108 #define IS_NOT_CONSTANT ERROR_MARK
 109
 110 /* Holders of ipa cgraph hooks: */
 111 static struct cgraph_node_hook_list *function_insertion_hook_holder;
 112 static struct cgraph_node_hook_list *node_removal_hook_holder;
 113 static struct cgraph_2node_hook_list *node_duplication_hook_holder;
 114 static struct cgraph_2edge_hook_list *edge_duplication_hook_holder;
 115 static struct cgraph_edge_hook_list *edge_removal_hook_holder;
 116 static void inline_node_removal_hook (struct cgraph_node *, void *);
 117 static void inline_node_duplication_hook (struct cgraph_node *,
 118                                           struct cgraph_node *, void *);
 119 static void inline_edge_removal_hook (struct cgraph_edge *, void *);
 120 static void inline_edge_duplication_hook (struct cgraph_edge *,
 121                                           struct cgraph_edge *,
 122                                           void *);
 123
 124 /* VECtor holding inline summaries.
 125    In GGC memory because conditions might point to constant trees.  */
 126 VEC(inline_summary_t,gc) *inline_summary_vec;
 127 VEC(inline_edge_summary_t,heap) *inline_edge_summary_vec;
 128
 129 /* Cached node/edge growths.  */
 130 VEC(int,heap) *node_growth_cache;
 131 VEC(edge_growth_cache_entry,heap) *edge_growth_cache;
 132
 133 /* Edge predicates goes here.  */
 134 static alloc_pool edge_predicate_pool;
 135
 136 /* Return true predicate (tautology).
 137    We represent it by empty list of clauses.  */
 138
 139 static inline struct predicate
 140 true_predicate (void)
 141 {
 142   struct predicate p;
 143   p.clause[0]=0;
 144   return p;
 145 }
 146
 147
 148 /* Return predicate testing single condition number COND.  */
 149
 150 static inline struct predicate
 151 single_cond_predicate (int cond)
 152 {
 153   struct predicate p;
 154   p.clause[0]=1 << cond;
 155   p.clause[1]=0;
 156   return p;
 157 }
 158
 159
 160 /* Return false predicate.  First clause require false condition.  */
 161
 162 static inline struct predicate
 163 false_predicate (void)
 164 {
 165   return single_cond_predicate (predicate_false_condition);
 166 }
 167
 168
 169 /* Return true if P is (false).  */
 170
 171 static inline bool
 172 true_predicate_p (struct predicate *p)
 173 {
 174   return !p->clause[0];
 175 }
 176
 177
 178 /* Return true if P is (false).  */
 179
 180 static inline bool
 181 false_predicate_p (struct predicate *p)
 182 {
 183   if (p->clause[0] == (1 << predicate_false_condition))
 184     {
 185       gcc_checking_assert (!p->clause[1]
 186                            && p->clause[0] == 1 << predicate_false_condition);
 187       return true;
 188     }
 189   return false;
 190 }
 191
 192
 193 /* Return predicate that is set true when function is not inlined.  */
 194 static inline struct predicate
 195 not_inlined_predicate (void)
 196 {
 197   return single_cond_predicate (predicate_not_inlined_condition);
 198 }
 199
 200
 201 /* Add condition to condition list CONDS.  */
 202
 203 static struct predicate
 204 add_condition (struct inline_summary *summary, int operand_num,
 205                enum tree_code code, tree val)
 206 {
 207   int i;
 208   struct condition *c;
 209   struct condition new_cond;
 210
 211   for (i = 0; VEC_iterate (condition, summary->conds, i, c); i++)
 212     {
 213       if (c->operand_num == operand_num
 214           && c->code == code
 215           && c->val == val)
 216         return single_cond_predicate (i + predicate_first_dynamic_condition);
 217     }
 218   /* Too many conditions.  Give up and return constant true.  */
 219   if (i == NUM_CONDITIONS - predicate_first_dynamic_condition)
 220     return true_predicate ();
 221
 222   new_cond.operand_num = operand_num;
 223   new_cond.code = code;
 224   new_cond.val = val;
 225   VEC_safe_push (condition, gc, summary->conds, &new_cond);
 226   return single_cond_predicate (i + predicate_first_dynamic_condition);
 227 }
 228
 229
 230 /* Add clause CLAUSE into the predicate P.  */
 231
 232 static inline void
 233 add_clause (struct predicate *p, clause_t clause)
 234 {
 235   int i;
 236   int i2;
 237   int insert_here = -1;
 238
 239   /* True clause.  */
 240   if (!clause)
 241     return;
 242
 243   /* False clause makes the whole predicate false.  Kill the other variants.  */
 244   if (clause == (1 << predicate_false_condition))
 245     {
 246       p->clause[0] = (1 << predicate_false_condition);
 247       p->clause[1] = 0;
 248       return;
 249     }
 250   if (false_predicate_p (p))
 251     return;
 252
 253   /* No one should be sily enough to add false into nontrivial clauses.  */
 254   gcc_checking_assert (!(clause & (1 << predicate_false_condition)));
 255
 256   /* Look where to insert the clause.  At the same time prune out
 257      clauses of P that are implied by the new clause and thus
 258      redundant.  */
 259   for (i = 0, i2 = 0; i <= MAX_CLAUSES; i++)
 260     {
 261       p->clause[i2] = p->clause[i];
 262
 263       if (!p->clause[i])
 264         break;
 265
 266       /* If p->clause[i] implies clause, there is nothing to add.  */
 267       if ((p->clause[i] & clause) == p->clause[i])
 268         {
 269           /* We had nothing to add, none of clauses should've become redundant.  */
 270           gcc_checking_assert (i == i2);
 271           return;
 272         }
 273
 274       if (p->clause[i] < clause && insert_here < 0)
 275         insert_here = i2;
 276
 277       /* If clause implies p->clause[i], then p->clause[i] becomes redundant.
 278          Otherwise the p->clause[i] has to stay.  */
 279       if ((p->clause[i] & clause) != clause)
 280         i2++;
 281     }
 282   /* We run out of variants.  Be conservative in positive direction.  */
 283   if (i2 == MAX_CLAUSES)
 284     return;
 285   /* Keep clauses in decreasing order. This makes equivalence testing easy.  */
 286   p->clause[i2 + 1] = 0;
 287   if (insert_here >= 0)
 288     for (;i2 > insert_here; i2--)
 289       p->clause[i2] = p->clause[i2 - 1];
 290   else
 291     insert_here = i2;
 292   p->clause[insert_here] = clause;
 293 }
 294
 295
 296 /* Return P & P2.  */
 297
 298 static struct predicate
 299 and_predicates (struct predicate *p, struct predicate *p2)
 300 {
 301   struct predicate out = *p;
 302   int i;
 303
 304   /* Avoid busy work.  */
 305   if (false_predicate_p (p2) || true_predicate_p (p))
 306     return *p2;
 307   if (false_predicate_p (p) || true_predicate_p (p2))
 308     return *p;
 309
 310   /* See how far predicates match.  */
 311   for (i = 0; p->clause[i] && p->clause[i] == p2->clause[i]; i++)
 312     {
 313       gcc_checking_assert (i < MAX_CLAUSES);
 314     }
 315
 316   /* Combine the predicates rest.  */
 317   for (; p2->clause[i]; i++)
 318     {
 319       gcc_checking_assert (i < MAX_CLAUSES);
 320       add_clause (&out, p2->clause[i]);
 321     }
 322   return out;
 323 }
 324
 325
 326 /* Return true if predicates are obviously equal.  */
 327
 328 static inline bool
 329 predicates_equal_p (struct predicate *p, struct predicate *p2)
 330 {
 331   int i;
 332   for (i = 0; p->clause[i]; i++)
 333     {
 334       gcc_checking_assert (i < MAX_CLAUSES);
 335       gcc_checking_assert (p->clause [i] > p->clause[i + 1]);
 336       gcc_checking_assert (!p2->clause[i] || p2->clause [i] > p2->clause[i + 1]);
 337       if (p->clause[i] != p2->clause[i])
 338         return false;
 339     }
 340   return !p2->clause[i];
 341 }
 342
 343
 344 /* Return P | P2.  */
 345
 346 static struct predicate
 347 or_predicates (struct predicate *p, struct predicate *p2)
 348 {
 349   struct predicate out = true_predicate ();
 350   int i,j;
 351
 352   /* Avoid busy work.  */
 353   if (false_predicate_p (p2) || true_predicate_p (p))
 354     return *p;
 355   if (false_predicate_p (p) || true_predicate_p (p2))
 356     return *p2;
 357   if (predicates_equal_p (p, p2))
 358     return *p;
 359
 360   /* OK, combine the predicates.  */
 361   for (i = 0; p->clause[i]; i++)
 362     for (j = 0; p2->clause[j]; j++)
 363       {
 364         gcc_checking_assert (i < MAX_CLAUSES && j < MAX_CLAUSES);
 365         add_clause (&out, p->clause[i] | p2->clause[j]);
 366       }
 367   return out;
 368 }
 369
 370
 371 /* Having partial truth assignment in POSSIBLE_TRUTHS, return false if predicate P
 372    to be false.  */
 373
 374 static bool
 375 evaluate_predicate (struct predicate *p, clause_t possible_truths)
 376 {
 377   int i;
 378
 379   /* True remains true.  */
 380   if (true_predicate_p (p))
 381     return true;
 382
 383   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 384
 385   /* See if we can find clause we can disprove.  */
 386   for (i = 0; p->clause[i]; i++)
 387     {
 388       gcc_checking_assert (i < MAX_CLAUSES);
 389       if (!(p->clause[i] & possible_truths))
 390         return false;
 391     }
 392   return true;
 393 }
 394
 395
 396 /* Dump conditional COND.  */
 397
 398 static void
 399 dump_condition (FILE *f, conditions conditions, int cond)
 400 {
 401   condition *c;
 402   if (cond == predicate_false_condition)
 403     fprintf (f, "false");
 404   else if (cond == predicate_not_inlined_condition)
 405     fprintf (f, "not inlined");
 406   else
 407     {
 408       c = VEC_index (condition, conditions, cond - predicate_first_dynamic_condition);
 409       fprintf (f, "op%i", c->operand_num);
 410       if (c->code == IS_NOT_CONSTANT)
 411         {
 412           fprintf (f, " not constant");
 413           return;
 414         }
 415       fprintf (f, " %s ", op_symbol_code (c->code));
 416       print_generic_expr (f, c->val, 1);
 417     }
 418 }
 419
 420
 421 /* Dump clause CLAUSE.  */
 422
 423 static void
 424 dump_clause (FILE *f, conditions conds, clause_t clause)
 425 {
 426   int i;
 427   bool found = false;
 428   fprintf (f, "(");
 429   if (!clause)
 430     fprintf (f, "true");
 431   for (i = 0; i < NUM_CONDITIONS; i++)
 432     if (clause & (1 << i))
 433       {
 434         if (found)
 435           fprintf (f, " || ");
 436         found = true;
 437         dump_condition (f, conds, i);
 438       }
 439   fprintf (f, ")");
 440 }
 441
 442
 443 /* Dump predicate PREDICATE.  */
 444
 445 static void
 446 dump_predicate (FILE *f, conditions conds, struct predicate *pred)
 447 {
 448   int i;
 449   if (true_predicate_p (pred))
 450     dump_clause (f, conds, 0);
 451   else
 452     for (i = 0; pred->clause[i]; i++)
 453       {
 454         if (i)
 455           fprintf (f, " && ");
 456         dump_clause (f, conds, pred->clause[i]);
 457       }
 458   fprintf (f, "\n");
 459 }
 460
 461
 462 /* Record SIZE and TIME under condition PRED into the inline summary.  */
 463
 464 static void
 465 account_size_time (struct inline_summary *summary, int size, int time, struct predicate *pred)
 466 {
 467   size_time_entry *e;
 468   bool found = false;
 469   int i;
 470
 471   if (false_predicate_p (pred))
 472     return;
 473
 474   /* We need to create initial empty unconitional clause, but otherwie
 475      we don't need to account empty times and sizes.  */
 476   if (!size && !time && summary->conds)
 477     return;
 478
 479   /* Watch overflow that might result from insane profiles.  */
 480   if (time > MAX_TIME * INLINE_TIME_SCALE)
 481     time = MAX_TIME * INLINE_TIME_SCALE;
 482   gcc_assert (time >= 0);
 483
 484   for (i = 0; VEC_iterate (size_time_entry, summary->entry, i, e); i++)
 485     if (predicates_equal_p (&e->predicate, pred))
 486       {
 487         found = true;
 488         break;
 489       }
 490   if (i == 32)
 491     {
 492       i = 0;
 493       found = true;
 494       e = VEC_index (size_time_entry, summary->entry, 0);
 495       gcc_assert (!e->predicate.clause[0]);
 496     }
 497   if (dump_file && (dump_flags & TDF_DETAILS) && (time || size))
 498     {
 499       fprintf (dump_file, "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate:",
 500                ((double)size) / INLINE_SIZE_SCALE, ((double)time) / INLINE_TIME_SCALE,
 501                found ? "" : "new ");
 502       dump_predicate (dump_file, summary->conds, pred);
 503     }
 504   if (!found)
 505     {
 506       struct size_time_entry new_entry;
 507       new_entry.size = size;
 508       new_entry.time = time;
 509       new_entry.predicate = *pred;
 510       VEC_safe_push (size_time_entry, gc, summary->entry, &new_entry);
 511     }
 512   else
 513     {
 514       e->size += size;
 515       e->time += time;
 516       if (e->time > MAX_TIME * INLINE_TIME_SCALE)
 517         e->time = MAX_TIME * INLINE_TIME_SCALE;
 518     }
 519 }
 520
 521 /* Set predicate for edge E.  */
 522
 523 static void
 524 edge_set_predicate (struct cgraph_edge *e, struct predicate *predicate)
 525 {
 526   struct inline_edge_summary *es = inline_edge_summary (e);
 527   if (predicate && !true_predicate_p (predicate))
 528     {
 529       if (!es->predicate)
 530         es->predicate = (struct predicate *)pool_alloc (edge_predicate_pool);
 531       *es->predicate = *predicate;
 532     }
 533   else
 534     {
 535       if (es->predicate)
 536         pool_free (edge_predicate_pool, es->predicate);
 537       es->predicate = NULL;
 538     }
 539 }
 540
 541
 542 /* Work out what conditions might be true at invocation of E.  */
 543
 544 static clause_t
 545 evaluate_conditions_for_edge (struct cgraph_edge *e, bool inline_p)
 546 {
 547   clause_t clause = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 548   struct inline_summary *info = inline_summary (e->callee);
 549   int i;
 550
 551   if (ipa_node_params_vector && info->conds
 552       /* FIXME: it seems that we forget to get argument count in some cases,
 553          probaby for previously indirect edges or so.  */
 554       && ipa_get_cs_argument_count (IPA_EDGE_REF (e)))
 555     {
 556       struct ipa_node_params *parms_info;
 557       struct ipa_edge_args *args = IPA_EDGE_REF (e);
 558       int i, count = ipa_get_cs_argument_count (args);
 559       struct ipcp_lattice lat;
 560       struct condition *c;
 561       VEC (tree, heap) *known_vals = NULL;
 562
 563       if (e->caller->global.inlined_to)
 564         parms_info = IPA_NODE_REF (e->caller->global.inlined_to);
 565       else
 566         parms_info = IPA_NODE_REF (e->caller);
 567
 568       VEC_safe_grow_cleared (tree, heap, known_vals, count);
 569       for (i = 0; i < count; i++)
 570         {
 571           ipa_lattice_from_jfunc (parms_info, &lat, ipa_get_ith_jump_func (args, i));
 572           if (lat.type == IPA_CONST_VALUE)
 573             VEC_replace (tree, known_vals, i, lat.constant);
 574         }
 575       for (i = 0; VEC_iterate (condition, info->conds, i, c); i++)
 576         {
 577           tree val = VEC_index (tree, known_vals, c->operand_num);
 578           tree res;
 579
 580           if (!val)
 581             {
 582               clause |= 1 << (i + predicate_first_dynamic_condition);
 583               continue;
 584             }
 585           if (c->code == IS_NOT_CONSTANT)
 586             continue;
 587           res = fold_binary_to_constant (c->code, boolean_type_node, val, c->val);
 588           if (res
 589               && integer_zerop (res))
 590             continue;
 591           clause |= 1 << (i + predicate_first_dynamic_condition);
 592         }
 593       VEC_free (tree, heap, known_vals);
 594     }
 595   else
 596     for (i = 0; i < (int)VEC_length (condition, info->conds); i++)
 597       clause |= 1 << (i + predicate_first_dynamic_condition);
 598
 599   return clause;
 600 }
 601
 602
 603 /* Allocate the inline summary vector or resize it to cover all cgraph nodes. */
 604
 605 static void
 606 inline_summary_alloc (void)
 607 {
 608   if (!node_removal_hook_holder)
 609     node_removal_hook_holder =
 610       cgraph_add_node_removal_hook (&inline_node_removal_hook, NULL);
 611   if (!edge_removal_hook_holder)
 612     edge_removal_hook_holder =
 613       cgraph_add_edge_removal_hook (&inline_edge_removal_hook, NULL);
 614   if (!node_duplication_hook_holder)
 615     node_duplication_hook_holder =
 616       cgraph_add_node_duplication_hook (&inline_node_duplication_hook, NULL);
 617   if (!edge_duplication_hook_holder)
 618     edge_duplication_hook_holder =
 619       cgraph_add_edge_duplication_hook (&inline_edge_duplication_hook, NULL);
 620
 621   if (VEC_length (inline_summary_t, inline_summary_vec)
 622       <= (unsigned) cgraph_max_uid)
 623     VEC_safe_grow_cleared (inline_summary_t, gc,
 624                            inline_summary_vec, cgraph_max_uid + 1);
 625   if (VEC_length (inline_edge_summary_t, inline_edge_summary_vec)
 626       <= (unsigned) cgraph_edge_max_uid)
 627     VEC_safe_grow_cleared (inline_edge_summary_t, heap,
 628                            inline_edge_summary_vec, cgraph_edge_max_uid + 1);
 629   if (!edge_predicate_pool)
 630     edge_predicate_pool = create_alloc_pool ("edge predicates", sizeof (struct predicate),
 631                                              10);
 632 }
 633
 634 /* Hook that is called by cgraph.c when a node is removed.  */
 635
 636 static void
 637 inline_node_removal_hook (struct cgraph_node *node, void *data ATTRIBUTE_UNUSED)
 638 {
 639   struct inline_summary *info;
 640   if (VEC_length (inline_summary_t, inline_summary_vec)
 641       <= (unsigned)node->uid)
 642     return;
 643   info = inline_summary (node);
 644   reset_node_growth_cache (node);
 645   VEC_free (condition, gc, info->conds);
 646   VEC_free (size_time_entry, gc, info->entry);
 647   info->conds = NULL;
 648   info->entry = NULL;
 649   memset (info, 0, sizeof (inline_summary_t));
 650 }
 651
 652
 653 /* Hook that is called by cgraph.c when a node is duplicated.  */
 654
 655 static void
 656 inline_node_duplication_hook (struct cgraph_node *src, struct cgraph_node *dst,
 657                               ATTRIBUTE_UNUSED void *data)
 658 {
 659   struct inline_summary *info;
 660   inline_summary_alloc ();
 661   info = inline_summary (dst);
 662   memcpy (info, inline_summary (src),
 663           sizeof (struct inline_summary));
 664   info->conds = VEC_copy (condition, gc, info->conds);
 665   info->entry = VEC_copy (size_time_entry, gc, info->entry);
 666 }
 667
 668
 669 /* Hook that is called by cgraph.c when a node is duplicated.  */
 670
 671 static void
 672 inline_edge_duplication_hook (struct cgraph_edge *src, struct cgraph_edge *dst,
 673                               ATTRIBUTE_UNUSED void *data)
 674 {
 675   struct inline_edge_summary *info;
 676   struct inline_edge_summary *srcinfo;
 677   inline_summary_alloc ();
 678   info = inline_edge_summary (dst);
 679   srcinfo = inline_edge_summary (src);
 680   memcpy (info, srcinfo,
 681           sizeof (struct inline_edge_summary));
 682   info->predicate = NULL;
 683   edge_set_predicate (dst, srcinfo->predicate);
 684 }
 685
 686
 687 /* Keep edge cache consistent across edge removal.  */
 688
 689 static void
 690 inline_edge_removal_hook (struct cgraph_edge *edge, void *data ATTRIBUTE_UNUSED)
 691 {
 692   if (edge_growth_cache)
 693     reset_edge_growth_cache (edge);
 694   if (edge->uid < (int)VEC_length (inline_edge_summary_t, inline_edge_summary_vec))
 695     {
 696       edge_set_predicate (edge, NULL);
 697       memset (inline_edge_summary (edge), 0, sizeof (struct inline_edge_summary));
 698     }
 699 }
 700
 701
 702 /* Initialize growth caches.  */
 703
 704 void
 705 initialize_growth_caches (void)
 706 {
 707   if (cgraph_edge_max_uid)
 708     VEC_safe_grow_cleared (edge_growth_cache_entry, heap, edge_growth_cache,
 709                            cgraph_edge_max_uid);
 710   if (cgraph_max_uid)
 711     VEC_safe_grow_cleared (int, heap, node_growth_cache, cgraph_max_uid);
 712 }
 713
 714
 715 /* Free growth caches.  */
 716
 717 void
 718 free_growth_caches (void)
 719 {
 720   VEC_free (edge_growth_cache_entry, heap, edge_growth_cache);
 721   edge_growth_cache = 0;
 722   VEC_free (int, heap, node_growth_cache);
 723   node_growth_cache = 0;
 724 }
 725
 726
 727 /* Dump edge summaries associated to NODE and recursively to all clones.
 728    Indent by INDENT.  */
 729
 730 static void
 731 dump_inline_edge_summary (FILE * f, int indent, struct cgraph_node *node,
 732                           struct inline_summary *info)
 733 {
 734   struct cgraph_edge *edge;
 735   for (edge = node->callees; edge; edge = edge->next_callee)
 736     {
 737       struct inline_edge_summary *es = inline_edge_summary (edge);
 738       fprintf (f, "%*s%s/%i %s\n%*s  loop depth:%2i freq:%4i size:%2i time: %2i callee size:%2i stack:%2i",
 739                indent, "", cgraph_node_name (edge->callee),
 740                edge->callee->uid,
 741                !edge->inline_failed ? "inlined"
 742                : cgraph_inline_failed_string (edge->inline_failed),
 743                indent, "",
 744                es->loop_depth,
 745                edge->frequency,
 746                es->call_stmt_size,
 747                es->call_stmt_time,
 748                (int)inline_summary (edge->callee)->size,
 749                (int)inline_summary (edge->callee)->estimated_stack_size);
 750       if (es->predicate)
 751         {
 752           fprintf (f, " predicate: ");
 753           dump_predicate (f, info->conds, es->predicate);
 754         }
 755       else
 756           fprintf (f, "\n");
 757       if (!edge->inline_failed)
 758         {
 759           fprintf (f, "%*sStack frame offset %i, callee self size %i, callee size %i\n",
 760                    indent+2, "",
 761                    (int)inline_summary (edge->callee)->stack_frame_offset,
 762                    (int)inline_summary (edge->callee)->estimated_self_stack_size,
 763                    (int)inline_summary (edge->callee)->estimated_stack_size);
 764           dump_inline_edge_summary (f, indent+2, edge->callee, info);
 765         }
 766     }
 767   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
 768     {
 769       struct inline_edge_summary *es = inline_edge_summary (edge);
 770       fprintf (f, "%*sindirect call loop depth:%2i freq:%4i size:%2i time: %2i\n",
 771                indent, "",
 772                es->loop_depth,
 773                edge->frequency,
 774                es->call_stmt_size,
 775                es->call_stmt_time);
 776       if (es->predicate)
 777         {
 778           fprintf (f, "predicate: ");
 779           dump_predicate (f, info->conds, es->predicate);
 780         }
 781       else
 782           fprintf (f, "\n");
 783     }
 784 }
 785
 786
 787 void
 788 dump_inline_summary (FILE * f, struct cgraph_node *node)
 789 {
 790   if (node->analyzed)
 791     {
 792       struct inline_summary *s = inline_summary (node);
 793       size_time_entry *e;
 794       int i;
 795       fprintf (f, "Inline summary for %s/%i", cgraph_node_name (node),
 796                node->uid);
 797       if (DECL_DISREGARD_INLINE_LIMITS (node->decl))
 798         fprintf (f, " always_inline");
 799       if (s->inlinable)
 800         fprintf (f, " inlinable");
 801       if (s->versionable)
 802         fprintf (f, " versionable");
 803       fprintf (f, "\n  self time:       %i\n",
 804                s->self_time);
 805       fprintf (f, "  global time:     %i\n", s->time);
 806       fprintf (f, "  self size:       %i\n",
 807                s->self_size);
 808       fprintf (f, "  global size:     %i\n", s->size);
 809       fprintf (f, "  self stack:      %i\n",
 810                (int) s->estimated_self_stack_size);
 811       fprintf (f, "  global stack:    %i\n",
 812                (int) s->estimated_stack_size);
 813       for (i = 0;
 814            VEC_iterate (size_time_entry, s->entry, i, e);
 815            i++)
 816         {
 817           fprintf (f, "    size:%f, time:%f, predicate:",
 818                    (double) e->size / INLINE_SIZE_SCALE,
 819                    (double) e->time / INLINE_TIME_SCALE);
 820           dump_predicate (f, s->conds, &e->predicate);
 821         }
 822       fprintf (f, "  calls:\n");
 823       dump_inline_edge_summary (f, 4, node, s);
 824       fprintf (f, "\n");
 825     }
 826 }
 827
 828 DEBUG_FUNCTION void
 829 debug_inline_summary (struct cgraph_node *node)
 830 {
 831   dump_inline_summary (stderr, node);
 832 }
 833
 834 void
 835 dump_inline_summaries (FILE *f)
 836 {
 837   struct cgraph_node *node;
 838
 839   for (node = cgraph_nodes; node; node = node->next)
 840     if (node->analyzed && !node->global.inlined_to)
 841       dump_inline_summary (f, node);
 842 }
 843
 844 /* Give initial reasons why inlining would fail on EDGE.  This gets either
 845    nullified or usually overwritten by more precise reasons later.  */
 846
 847 void
 848 initialize_inline_failed (struct cgraph_edge *e)
 849 {
 850   struct cgraph_node *callee = e->callee;
 851
 852   if (e->indirect_unknown_callee)
 853     e->inline_failed = CIF_INDIRECT_UNKNOWN_CALL;
 854   else if (!callee->analyzed)
 855     e->inline_failed = CIF_BODY_NOT_AVAILABLE;
 856   else if (callee->local.redefined_extern_inline)
 857     e->inline_failed = CIF_REDEFINED_EXTERN_INLINE;
 858   else if (e->call_stmt && gimple_call_cannot_inline_p (e->call_stmt))
 859     e->inline_failed = CIF_MISMATCHED_ARGUMENTS;
 860   else
 861     e->inline_failed = CIF_FUNCTION_NOT_CONSIDERED;
 862 }
 863
 864 /* See if statement might disappear after inlining.
 865    0 - means not eliminated
 866    1 - half of statements goes away
 867    2 - for sure it is eliminated.
 868    We are not terribly sophisticated, basically looking for simple abstraction
 869    penalty wrappers.  */
 870
 871 static int
 872 eliminated_by_inlining_prob (gimple stmt)
 873 {
 874   enum gimple_code code = gimple_code (stmt);
 875   switch (code)
 876     {
 877       case GIMPLE_RETURN:
 878         return 2;
 879       case GIMPLE_ASSIGN:
 880         if (gimple_num_ops (stmt) != 2)
 881           return 0;
 882
 883         /* Casts of parameters, loads from parameters passed by reference
 884            and stores to return value or parameters are often free after
 885            inlining dua to SRA and further combining.
 886            Assume that half of statements goes away.  */
 887         if (gimple_assign_rhs_code (stmt) == CONVERT_EXPR
 888             || gimple_assign_rhs_code (stmt) == NOP_EXPR
 889             || gimple_assign_rhs_code (stmt) == VIEW_CONVERT_EXPR
 890             || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
 891           {
 892             tree rhs = gimple_assign_rhs1 (stmt);
 893             tree lhs = gimple_assign_lhs (stmt);
 894             tree inner_rhs = rhs;
 895             tree inner_lhs = lhs;
 896             bool rhs_free = false;
 897             bool lhs_free = false;
 898
 899             while (handled_component_p (inner_lhs)
 900                    || TREE_CODE (inner_lhs) == MEM_REF)
 901               inner_lhs = TREE_OPERAND (inner_lhs, 0);
 902             while (handled_component_p (inner_rhs)
 903                    || TREE_CODE (inner_rhs) == ADDR_EXPR
 904                    || TREE_CODE (inner_rhs) == MEM_REF)
 905               inner_rhs = TREE_OPERAND (inner_rhs, 0);
 906
 907
 908             if (TREE_CODE (inner_rhs) == PARM_DECL
 909                 || (TREE_CODE (inner_rhs) == SSA_NAME
 910                     && SSA_NAME_IS_DEFAULT_DEF (inner_rhs)
 911                     && TREE_CODE (SSA_NAME_VAR (inner_rhs)) == PARM_DECL))
 912               rhs_free = true;
 913             if (rhs_free && is_gimple_reg (lhs))
 914               lhs_free = true;
 915             if (((TREE_CODE (inner_lhs) == PARM_DECL
 916                   || (TREE_CODE (inner_lhs) == SSA_NAME
 917                       && SSA_NAME_IS_DEFAULT_DEF (inner_lhs)
 918                       && TREE_CODE (SSA_NAME_VAR (inner_lhs)) == PARM_DECL))
 919                  && inner_lhs != lhs)
 920                 || TREE_CODE (inner_lhs) == RESULT_DECL
 921                 || (TREE_CODE (inner_lhs) == SSA_NAME
 922                     && TREE_CODE (SSA_NAME_VAR (inner_lhs)) == RESULT_DECL))
 923               lhs_free = true;
 924             if (lhs_free
 925                 && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
 926               rhs_free = true;
 927             if (lhs_free && rhs_free)
 928               return 1;
 929           }
 930         return 0;
 931       default:
 932         return 0;
 933     }
 934 }
 935
 936
 937 /* If BB ends by a conditional we can turn into predicates, attach corresponding
 938    predicates to the CFG edges.   */
 939
 940 static void
 941 set_cond_stmt_execution_predicate (struct ipa_node_params *info,
 942                                    struct inline_summary *summary,
 943                                    basic_block bb)
 944 {
 945   gimple last;
 946   tree op;
 947   int index;
 948   enum tree_code code, inverted_code;
 949   edge e;
 950   edge_iterator ei;
 951   gimple set_stmt;
 952   tree op2;
 953
 954   last = last_stmt (bb);
 955   if (!last
 956       || gimple_code (last) != GIMPLE_COND)
 957     return;
 958   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
 959     return;
 960   op = gimple_cond_lhs (last);
 961   /* TODO: handle conditionals like
 962      var = op0 < 4;
 963      if (var != 0).  */
 964   if (TREE_CODE (op) != SSA_NAME)
 965     return;
 966   if (SSA_NAME_IS_DEFAULT_DEF (op))
 967     {
 968       index = ipa_get_param_decl_index (info, SSA_NAME_VAR (op));
 969       if (index == -1)
 970         return;
 971       code = gimple_cond_code (last);
 972       inverted_code = invert_tree_comparison (code,
 973                                               HONOR_NANS (TYPE_MODE (TREE_TYPE (op))));
 974
 975       FOR_EACH_EDGE (e, ei, bb->succs)
 976         {
 977           struct predicate p = add_condition (summary,
 978                                               index,
 979                                               e->flags & EDGE_TRUE_VALUE
 980                                               ? code : inverted_code,
 981                                               gimple_cond_rhs (last));
 982           e->aux = pool_alloc (edge_predicate_pool);
 983           *(struct predicate *)e->aux = p;
 984         }
 985     }
 986
 987   /* Special case
 988      if (builtin_constant_p (op))
 989        constant_code
 990      else
 991        nonconstant_code.
 992      Here we can predicate nonconstant_code.  We can't
 993      really handle constant_code since we have no predicate
 994      for this and also the constant code is not known to be
 995      optimized away when inliner doen't see operand is constant.
 996      Other optimizers might think otherwise.  */
 997   set_stmt = SSA_NAME_DEF_STMT (op);
 998   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
 999       || gimple_call_num_args (set_stmt) != 1)
1000     return;
1001   op2 = gimple_call_arg (set_stmt, 0);
1002   if (!SSA_NAME_IS_DEFAULT_DEF (op2))
1003     return;
1004   index = ipa_get_param_decl_index (info, SSA_NAME_VAR (op2));
1005   if (index == -1)
1006     return;
1007   if (gimple_cond_code (last) != NE_EXPR
1008       || !integer_zerop (gimple_cond_rhs (last)))
1009     return;
1010   FOR_EACH_EDGE (e, ei, bb->succs)
1011     if (e->flags & EDGE_FALSE_VALUE)
1012       {
1013         struct predicate p = add_condition (summary,
1014                                             index,
1015                                             IS_NOT_CONSTANT,
1016                                             NULL);
1017         e->aux = pool_alloc (edge_predicate_pool);
1018         *(struct predicate *)e->aux = p;
1019       }
1020 }
1021
1022
1023 /* If BB ends by a switch we can turn into predicates, attach corresponding
1024    predicates to the CFG edges.   */
1025
1026 static void
1027 set_switch_stmt_execution_predicate (struct ipa_node_params *info,
1028                                    struct inline_summary *summary,
1029                                    basic_block bb)
1030 {
1031   gimple last;
1032   tree op;
1033   int index;
1034   edge e;
1035   edge_iterator ei;
1036   size_t n;
1037   size_t case_idx;
1038
1039   last = last_stmt (bb);
1040   if (!last
1041       || gimple_code (last) != GIMPLE_SWITCH)
1042     return;
1043   op = gimple_switch_index (last);
1044   if (TREE_CODE (op) != SSA_NAME
1045       || !SSA_NAME_IS_DEFAULT_DEF (op))
1046     return;
1047   index = ipa_get_param_decl_index (info, SSA_NAME_VAR (op));
1048   if (index == -1)
1049     return;
1050
1051   FOR_EACH_EDGE (e, ei, bb->succs)
1052     {
1053       e->aux = pool_alloc (edge_predicate_pool);
1054       *(struct predicate *)e->aux = false_predicate ();
1055     }
1056   n = gimple_switch_num_labels(last);
1057   for (case_idx = 0; case_idx < n; ++case_idx)
1058     {
1059       tree cl = gimple_switch_label (last, case_idx);
1060       tree min, max;
1061       struct predicate p;
1062
1063       e = find_edge (bb, label_to_block (CASE_LABEL (cl)));
1064       min = CASE_LOW (cl);
1065       max = CASE_HIGH (cl);
1066
1067       /* For default we might want to construct predicate that none
1068          of cases is met, but it is bit hard to do not having negations
1069          of conditionals handy.  */
1070       if (!min && !max)
1071         p = true_predicate ();
1072       else if (!max)
1073         p = add_condition (summary, index,
1074                            EQ_EXPR,
1075                            min);
1076       else
1077         {
1078           struct predicate p1, p2;
1079           p1 = add_condition (summary, index,
1080                               GE_EXPR,
1081                               min);
1082           p2 = add_condition (summary, index,
1083                               LE_EXPR,
1084                               max);
1085           p = and_predicates (&p1, &p2);
1086         }
1087       *(struct predicate *)e->aux
1088         = or_predicates (&p, (struct predicate *)e->aux);
1089     }
1090 }
1091
1092
1093 /* For each BB in NODE attach to its AUX pointer predicate under
1094    which it is executable.  */
1095
1096 static void
1097 compute_bb_predicates (struct cgraph_node *node,
1098                        struct ipa_node_params *parms_info,
1099                        struct inline_summary *summary)
1100 {
1101   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1102   bool done = false;
1103   basic_block bb;
1104
1105   FOR_EACH_BB_FN (bb, my_function)
1106     {
1107       set_cond_stmt_execution_predicate (parms_info, summary, bb);
1108       set_switch_stmt_execution_predicate (parms_info, summary, bb);
1109     }
1110
1111   /* Entry block is always executable.  */
1112   ENTRY_BLOCK_PTR_FOR_FUNCTION (my_function)->aux = pool_alloc (edge_predicate_pool);
1113   *(struct predicate *)ENTRY_BLOCK_PTR_FOR_FUNCTION (my_function)->aux
1114     = true_predicate ();
1115
1116   /* A simple dataflow propagation of predicates forward in the CFG.
1117      TODO: work in reverse postorder.  */
1118   while (!done)
1119     {
1120       done = true;
1121       FOR_EACH_BB_FN (bb, my_function)
1122         {
1123           struct predicate p = false_predicate ();
1124           edge e;
1125           edge_iterator ei;
1126           FOR_EACH_EDGE (e, ei, bb->preds)
1127             {
1128               if (e->src->aux)
1129                 {
1130                   struct predicate this_bb_predicate = *(struct predicate *)e->src->aux;
1131                   if (e->aux)
1132                     this_bb_predicate = and_predicates (&this_bb_predicate,
1133                                                         (struct predicate *)e->aux);
1134                   p = or_predicates (&p, &this_bb_predicate);
1135                   if (true_predicate_p (&p))
1136                     break;
1137                 }
1138             }
1139           if (false_predicate_p (&p))
1140             gcc_assert (!bb->aux);
1141           else
1142             {
1143               if (!bb->aux)
1144                 {
1145                   done = false;
1146                   bb->aux = pool_alloc (edge_predicate_pool);
1147                   *((struct predicate *)bb->aux) = p;
1148                 }
1149               else if (!predicates_equal_p (&p, (struct predicate *)bb->aux))
1150                 {
1151                   done = false;
1152                   *((struct predicate *)bb->aux) = p;
1153                 }
1154             }
1155         }
1156     }
1157 }
1158
1159
1160 /* We keep info about constantness of SSA names.  */
1161
1162 typedef struct predicate predicate_t;
1163 DEF_VEC_O (predicate_t);
1164 DEF_VEC_ALLOC_O (predicate_t, heap);
1165
1166
1167 /* Return predicate specifying when the STMT might have result that is not a compile
1168    time constant.  */
1169
1170 static struct predicate
1171 will_be_nonconstant_predicate (struct ipa_node_params *info,
1172                                struct inline_summary *summary,
1173                                gimple stmt,
1174                                VEC (predicate_t, heap) *nonconstant_names)
1175
1176 {
1177   struct predicate p = true_predicate ();
1178   ssa_op_iter iter;
1179   tree use;
1180   struct predicate op_non_const;
1181
1182   /* What statments might be optimized away
1183      when their arguments are constant
1184      TODO: also trivial builtins.
1185      builtin_constant_p is already handled later.  */
1186   if (gimple_code (stmt) != GIMPLE_ASSIGN
1187       && gimple_code (stmt) != GIMPLE_COND
1188       && gimple_code (stmt) != GIMPLE_SWITCH)
1189     return p;
1190
1191   /* Stores and loads will stay anyway.
1192      TODO: Constant memory accesses could be handled here, too.  */
1193   if (gimple_vuse (stmt))
1194     return p;
1195
1196   /* See if we understand all operands before we start
1197      adding conditionals.  */
1198   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
1199     {
1200       if (TREE_CODE (use) != SSA_NAME)
1201         return p;
1202       /* For arguments we can build a condition.  */
1203       if (SSA_NAME_IS_DEFAULT_DEF (use)
1204           && ipa_get_param_decl_index (info, SSA_NAME_VAR (use)) >= 0)
1205         continue;
1206       /* If we know when operand is constant,
1207          we still can say something useful.  */
1208       if (!true_predicate_p (VEC_index (predicate_t, nonconstant_names,
1209                                         SSA_NAME_VERSION (use))))
1210         continue;
1211       return p;
1212     }
1213   op_non_const = false_predicate ();
1214   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
1215     {
1216       if (SSA_NAME_IS_DEFAULT_DEF (use)
1217           && ipa_get_param_decl_index (info, SSA_NAME_VAR (use)) >= 0)
1218         p = add_condition (summary,
1219                            ipa_get_param_decl_index (info, SSA_NAME_VAR (use)),
1220                            IS_NOT_CONSTANT, NULL);
1221       else
1222         p = *VEC_index (predicate_t, nonconstant_names,
1223                         SSA_NAME_VERSION (use));
1224       op_non_const = or_predicates (&p, &op_non_const);
1225     }
1226   if (gimple_code (stmt) == GIMPLE_ASSIGN
1227       && TREE_CODE (gimple_assign_lhs (stmt)) == SSA_NAME)
1228     VEC_replace (predicate_t, nonconstant_names,
1229                  SSA_NAME_VERSION (gimple_assign_lhs (stmt)), &op_non_const);
1230   return op_non_const;
1231 }
1232
1233
1234 /* Compute function body size parameters for NODE.
1235    When EARLY is true, we compute only simple summaries without
1236    non-trivial predicates to drive the early inliner.  */
1237
1238 static void
1239 estimate_function_body_sizes (struct cgraph_node *node, bool early)
1240 {
1241   gcov_type time = 0;
1242   /* Estimate static overhead for function prologue/epilogue and alignment. */
1243   int size = 2;
1244   /* Benefits are scaled by probability of elimination that is in range
1245      <0,2>.  */
1246   basic_block bb;
1247   gimple_stmt_iterator bsi;
1248   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1249   int freq;
1250   struct inline_summary *info = inline_summary (node);
1251   struct predicate bb_predicate;
1252   struct ipa_node_params *parms_info = NULL;
1253   VEC (predicate_t, heap) *nonconstant_names = NULL;
1254
1255   if (ipa_node_params_vector && !early && optimize)
1256     {
1257       parms_info = IPA_NODE_REF (node);
1258       VEC_safe_grow_cleared (predicate_t, heap, nonconstant_names,
1259                              VEC_length (tree, SSANAMES (my_function)));
1260     }
1261
1262   info->conds = 0;
1263   info->entry = 0;
1264
1265
1266   if (dump_file)
1267     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
1268              cgraph_node_name (node));
1269
1270   /* When we run into maximal number of entries, we assign everything to the
1271      constant truth case.  Be sure to have it in list. */
1272   bb_predicate = true_predicate ();
1273   account_size_time (info, 0, 0, &bb_predicate);
1274
1275   bb_predicate = not_inlined_predicate ();
1276   account_size_time (info, 2 * INLINE_SIZE_SCALE, 0, &bb_predicate);
1277
1278   gcc_assert (my_function && my_function->cfg);
1279   if (parms_info)
1280     compute_bb_predicates (node, parms_info, info);
1281   FOR_EACH_BB_FN (bb, my_function)
1282     {
1283       freq = compute_call_stmt_bb_frequency (node->decl, bb);
1284
1285       /* TODO: Obviously predicates can be propagated down across CFG.  */
1286       if (parms_info)
1287         {
1288           if (bb->aux)
1289             bb_predicate = *(struct predicate *)bb->aux;
1290           else
1291             bb_predicate = false_predicate ();
1292         }
1293       else
1294         bb_predicate = true_predicate ();
1295
1296       if (dump_file && (dump_flags & TDF_DETAILS))
1297         {
1298           fprintf (dump_file, "\n BB %i predicate:", bb->index);
1299           dump_predicate (dump_file, info->conds, &bb_predicate);
1300         }
1301
1302       for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
1303         {
1304           gimple stmt = gsi_stmt (bsi);
1305           int this_size = estimate_num_insns (stmt, &eni_size_weights);
1306           int this_time = estimate_num_insns (stmt, &eni_time_weights);
1307           int prob;
1308           struct predicate will_be_nonconstant;
1309
1310           if (dump_file && (dump_flags & TDF_DETAILS))
1311             {
1312               fprintf (dump_file, "  ");
1313               print_gimple_stmt (dump_file, stmt, 0, 0);
1314               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
1315                        ((double)freq)/CGRAPH_FREQ_BASE, this_size, this_time);
1316             }
1317
1318           if (is_gimple_call (stmt))
1319             {
1320               struct cgraph_edge *edge = cgraph_edge (node, stmt);
1321               struct inline_edge_summary *es = inline_edge_summary (edge);
1322
1323               /* Special case: results of BUILT_IN_CONSTANT_P will be always
1324                  resolved as constant.  We however don't want to optimize
1325                  out the cgraph edges.  */
1326               if (nonconstant_names
1327                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
1328                   && gimple_call_lhs (stmt)
1329                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
1330                 {
1331                   struct predicate false_p = false_predicate ();
1332                   VEC_replace (predicate_t, nonconstant_names,
1333                                SSA_NAME_VERSION (gimple_call_lhs (stmt)), &false_p);
1334                 }
1335
1336               es->call_stmt_size = this_size;
1337               es->call_stmt_time = this_time;
1338               es->loop_depth = bb->loop_depth;
1339               edge_set_predicate (edge, &bb_predicate);
1340
1341               /* Do not inline calls where we cannot triviall work around
1342                  mismatches in argument or return types.  */
1343               if (edge->callee
1344                   && !gimple_check_call_matching_types (stmt, edge->callee->decl))
1345                 {
1346                   edge->call_stmt_cannot_inline_p = true;
1347                   gimple_call_set_cannot_inline (stmt, true);
1348                 }
1349               else
1350                 gcc_assert (!gimple_call_cannot_inline_p (stmt));
1351             }
1352
1353           /* TODO: When conditional jump or swithc is known to be constant, but
1354              we did not translate it into the predicates, we really can account
1355              just maximum of the possible paths.  */
1356           if (parms_info)
1357             will_be_nonconstant
1358                = will_be_nonconstant_predicate (parms_info, info,
1359                                                 stmt, nonconstant_names);
1360           if (this_time || this_size)
1361             {
1362               struct predicate p;
1363
1364               this_time *= freq;
1365               time += this_time;
1366               size += this_size;
1367
1368               prob = eliminated_by_inlining_prob (stmt);
1369               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
1370                 fprintf (dump_file, "\t\t50%% will be eliminated by inlining\n");
1371               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
1372                 fprintf (dump_file, "\t\twill eliminated by inlining\n");
1373
1374               if (parms_info)
1375                 p = and_predicates (&bb_predicate, &will_be_nonconstant);
1376               else
1377                 p = true_predicate ();
1378
1379               /* We account everything but the calls.  Calls have their own
1380                  size/time info attached to cgraph edges.  This is neccesary
1381                  in order to make the cost disappear after inlining.  */
1382               if (!is_gimple_call (stmt))
1383                 {
1384                   if (prob)
1385                     {
1386                       struct predicate ip = not_inlined_predicate ();
1387                       ip = and_predicates (&ip, &p);
1388                       account_size_time (info, this_size * prob,
1389                                          this_time * prob, &ip);
1390                     }
1391                   if (prob != 2)
1392                     account_size_time (info, this_size * (2 - prob),
1393                                        this_time * (2 - prob), &p);
1394                 }
1395
1396               gcc_assert (time >= 0);
1397               gcc_assert (size >= 0);
1398             }
1399         }
1400     }
1401   FOR_ALL_BB_FN (bb, my_function)
1402     {
1403       edge e;
1404       edge_iterator ei;
1405
1406       if (bb->aux)
1407         pool_free (edge_predicate_pool, bb->aux);
1408       bb->aux = NULL;
1409       FOR_EACH_EDGE (e, ei, bb->succs)
1410         {
1411           if (e->aux)
1412             pool_free (edge_predicate_pool, e->aux);
1413           e->aux = NULL;
1414         }
1415     }
1416   time = (time + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
1417   if (time > MAX_TIME)
1418     time = MAX_TIME;
1419   inline_summary (node)->self_time = time;
1420   inline_summary (node)->self_size = size;
1421   VEC_free (predicate_t, heap, nonconstant_names);
1422   if (dump_file)
1423     {
1424       fprintf (dump_file, "\n");
1425       dump_inline_summary (dump_file, node);
1426     }
1427 }
1428
1429
1430 /* Compute parameters of functions used by inliner.
1431    EARLY is true when we compute parameters for the early inliner  */
1432
1433 void
1434 compute_inline_parameters (struct cgraph_node *node, bool early)
1435 {
1436   HOST_WIDE_INT self_stack_size;
1437   struct cgraph_edge *e;
1438   struct inline_summary *info;
1439
1440   gcc_assert (!node->global.inlined_to);
1441
1442   inline_summary_alloc ();
1443
1444   info = inline_summary (node);
1445
1446   /* Estimate the stack size for the function if we're optimizing.  */
1447   self_stack_size = optimize ? estimated_stack_frame_size (node) : 0;
1448   info->estimated_self_stack_size = self_stack_size;
1449   info->estimated_stack_size = self_stack_size;
1450   info->stack_frame_offset = 0;
1451
1452   /* Can this function be inlined at all?  */
1453   info->inlinable = tree_inlinable_function_p (node->decl);
1454
1455   /* Inlinable functions always can change signature.  */
1456   if (info->inlinable)
1457     node->local.can_change_signature = true;
1458   else
1459     {
1460       /* Functions calling builtin_apply can not change signature.  */
1461       for (e = node->callees; e; e = e->next_callee)
1462         if (DECL_BUILT_IN (e->callee->decl)
1463             && DECL_BUILT_IN_CLASS (e->callee->decl) == BUILT_IN_NORMAL
1464             && DECL_FUNCTION_CODE (e->callee->decl) == BUILT_IN_APPLY_ARGS)
1465           break;
1466       node->local.can_change_signature = !e;
1467     }
1468   estimate_function_body_sizes (node, early);
1469
1470   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
1471   info->time = info->self_time;
1472   info->size = info->self_size;
1473   info->stack_frame_offset = 0;
1474   info->estimated_stack_size = info->estimated_self_stack_size;
1475 }
1476
1477
1478 /* Compute parameters of functions used by inliner using
1479    current_function_decl.  */
1480
1481 static unsigned int
1482 compute_inline_parameters_for_current (void)
1483 {
1484   compute_inline_parameters (cgraph_get_node (current_function_decl), true);
1485   return 0;
1486 }
1487
1488 struct gimple_opt_pass pass_inline_parameters =
1489 {
1490  {
1491   GIMPLE_PASS,
1492   "inline_param",                       /* name */
1493   NULL,                                 /* gate */
1494   compute_inline_parameters_for_current,/* execute */
1495   NULL,                                 /* sub */
1496   NULL,                                 /* next */
1497   0,                                    /* static_pass_number */
1498   TV_INLINE_HEURISTICS,                 /* tv_id */
1499   0,                                    /* properties_required */
1500   0,                                    /* properties_provided */
1501   0,                                    /* properties_destroyed */
1502   0,                                    /* todo_flags_start */
1503   0                                     /* todo_flags_finish */
1504  }
1505 };
1506
1507
1508 /* Increase SIZE and TIME for size and time needed to handle edge E.  */
1509
1510 static void
1511 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *time)
1512 {
1513   struct inline_edge_summary *es = inline_edge_summary (e);
1514   *size += es->call_stmt_size * INLINE_SIZE_SCALE;
1515   *time += (es->call_stmt_time
1516             * e->frequency * (INLINE_TIME_SCALE / CGRAPH_FREQ_BASE));
1517   if (*time > MAX_TIME * INLINE_TIME_SCALE)
1518     *time = MAX_TIME * INLINE_TIME_SCALE;
1519 }
1520
1521
1522 /* Increase SIZE and TIME for size and time needed to handle all calls in NODE.  */
1523
1524 static void
1525 estimate_calls_size_and_time (struct cgraph_node *node, int *size, int *time,
1526                               clause_t possible_truths)
1527 {
1528   struct cgraph_edge *e;
1529   for (e = node->callees; e; e = e->next_callee)
1530     {
1531       struct inline_edge_summary *es = inline_edge_summary (e);
1532       if (!es->predicate || evaluate_predicate (es->predicate, possible_truths))
1533         {
1534           if (e->inline_failed)
1535             estimate_edge_size_and_time (e, size, time);
1536           else
1537             estimate_calls_size_and_time (e->callee, size, time,
1538                                           possible_truths);
1539         }
1540     }
1541   /* TODO: look for devirtualizing oppurtunities.  */
1542   for (e = node->indirect_calls; e; e = e->next_callee)
1543     {
1544       struct inline_edge_summary *es = inline_edge_summary (e);
1545       if (!es->predicate || evaluate_predicate (es->predicate, possible_truths))
1546         estimate_edge_size_and_time (e, size, time);
1547     }
1548 }
1549
1550
1551 /* Estimate size and time needed to execute callee of EDGE assuming
1552    that parameters known to be constant at caller of EDGE are
1553    propagated.  If INLINE_P is true, it is assumed that call will
1554    be inlined.  */
1555
1556 static void
1557 estimate_callee_size_and_time (struct cgraph_edge *edge, bool inline_p,
1558                                int *ret_size, int *ret_time)
1559 {
1560   struct inline_summary *info = inline_summary (edge->callee);
1561   clause_t clause = evaluate_conditions_for_edge (edge, inline_p);
1562   size_time_entry *e;
1563   int size = 0, time = 0;
1564   int i;
1565
1566   if (dump_file
1567       && (dump_flags & TDF_DETAILS))
1568     {
1569       bool found = false;
1570       fprintf (dump_file, "   Estimating callee body: %s/%i\n"
1571                           "   Known to be false: ",
1572                cgraph_node_name (edge->callee),
1573                edge->callee->uid);
1574
1575       for (i = predicate_not_inlined_condition;
1576            i < (predicate_first_dynamic_condition
1577                 + (int)VEC_length (condition, info->conds)); i++)
1578         if (!(clause & (1 << i)))
1579           {
1580             if (found)
1581               fprintf (dump_file, ", ");
1582             found = true;
1583             dump_condition (dump_file, info->conds, i);
1584           }
1585     }
1586
1587   for (i = 0; VEC_iterate (size_time_entry, info->entry, i, e); i++)
1588     if (evaluate_predicate (&e->predicate, clause))
1589       time += e->time, size += e->size;
1590
1591   if (time > MAX_TIME * INLINE_TIME_SCALE)
1592     time = MAX_TIME * INLINE_TIME_SCALE;
1593
1594   estimate_calls_size_and_time (edge->callee, &size, &time, clause);
1595   time = (time + INLINE_TIME_SCALE / 2) / INLINE_TIME_SCALE;
1596   size = (size + INLINE_SIZE_SCALE / 2) / INLINE_SIZE_SCALE;
1597
1598
1599   if (dump_file
1600       && (dump_flags & TDF_DETAILS))
1601     fprintf (dump_file, "\n   size:%i time:%i\n", size, time);
1602   if (ret_time)
1603     *ret_time = time;
1604   if (ret_size)
1605     *ret_size = size;
1606   return;
1607 }
1608
1609
1610 /* Translate all conditions from callee representation into caller representation and
1611    symbolically evaluate predicate P into new predicate.
1612
1613    INFO is inline_summary of function we are adding predicate into, CALLEE_INFO is summary
1614    of function predicate P is from. OPERAND_MAP is array giving callee formal IDs the
1615    caller formal IDs. POSSSIBLE_TRUTHS is clausule of all callee conditions that
1616    may be true in caller context. TOPLEV_PREDICATE is predicate under which callee
1617    is executed.  */
1618
1619 static struct predicate
1620 remap_predicate (struct inline_summary *info, struct inline_summary *callee_info,
1621                  struct predicate *p,
1622                  VEC (int, heap) *operand_map,
1623                  clause_t possible_truths,
1624                  struct predicate *toplev_predicate)
1625 {
1626   int i;
1627   struct predicate out = true_predicate ();
1628
1629   /* True predicate is easy.  */
1630   if (true_predicate_p (p))
1631     return *toplev_predicate;
1632   for (i = 0; p->clause[i]; i++)
1633     {
1634       clause_t clause = p->clause[i];
1635       int cond;
1636       struct predicate clause_predicate = false_predicate ();
1637
1638       gcc_assert (i < MAX_CLAUSES);
1639
1640       for (cond = 0; cond < NUM_CONDITIONS; cond ++)
1641         /* Do we have condition we can't disprove?   */
1642         if (clause & possible_truths & (1 << cond))
1643           {
1644             struct predicate cond_predicate;
1645             /* Work out if the condition can translate to predicate in the
1646                inlined function.  */
1647             if (cond >= predicate_first_dynamic_condition)
1648               {
1649                  struct condition *c;
1650
1651                  c = VEC_index (condition, callee_info->conds,
1652                                 cond - predicate_first_dynamic_condition);
1653                  /* See if we can remap condition operand to caller's operand.
1654                     Otherwise give up.  */
1655                  if (!operand_map
1656                      || VEC_index (int, operand_map, c->operand_num) == -1)
1657                    cond_predicate = true_predicate ();
1658                  else
1659                    cond_predicate = add_condition (info,
1660                                                    VEC_index (int, operand_map,
1661                                                               c->operand_num),
1662                                                    c->code, c->val);
1663               }
1664             /* Fixed conditions remains same, construct single
1665                condition predicate.  */
1666             else
1667               {
1668                 cond_predicate.clause[0] = 1 << cond;
1669                 cond_predicate.clause[1] = 0;
1670               }
1671             clause_predicate = or_predicates (&clause_predicate, &cond_predicate);
1672           }
1673       out = and_predicates (&out, &clause_predicate);
1674     }
1675   return and_predicates (&out, toplev_predicate);
1676 }
1677
1678
1679 /* Update summary information of inline clones after inlining.
1680    Compute peak stack usage.  */
1681
1682 static void
1683 inline_update_callee_summaries (struct cgraph_node *node,
1684                                 int depth)
1685 {
1686   struct cgraph_edge *e;
1687   struct inline_summary *callee_info = inline_summary (node);
1688   struct inline_summary *caller_info = inline_summary (node->callers->caller);
1689   HOST_WIDE_INT peak;
1690
1691   callee_info->stack_frame_offset
1692     = caller_info->stack_frame_offset
1693       + caller_info->estimated_self_stack_size;
1694   peak = callee_info->stack_frame_offset
1695       + callee_info->estimated_self_stack_size;
1696   if (inline_summary (node->global.inlined_to)->estimated_stack_size
1697       < peak)
1698     inline_summary (node->global.inlined_to)->estimated_stack_size = peak;
1699   cgraph_propagate_frequency (node);
1700   for (e = node->callees; e; e = e->next_callee)
1701     {
1702       if (!e->inline_failed)
1703         inline_update_callee_summaries (e->callee, depth);
1704       inline_edge_summary (e)->loop_depth += depth;
1705     }
1706   for (e = node->indirect_calls; e; e = e->next_callee)
1707     inline_edge_summary (e)->loop_depth += depth;
1708 }
1709
1710
1711 /* Remap predicates of callees of NODE.  Rest of arguments match
1712    remap_predicate.  */
1713
1714 static void
1715 remap_edge_predicates (struct cgraph_node *node,
1716                        struct inline_summary *info,
1717                        struct inline_summary *callee_info,
1718                        VEC (int, heap) *operand_map,
1719                        clause_t possible_truths,
1720                        struct predicate *toplev_predicate)
1721 {
1722   struct cgraph_edge *e;
1723   for (e = node->callees; e; e = e->next_callee)
1724     {
1725       struct inline_edge_summary *es = inline_edge_summary (e);
1726       struct predicate p;
1727       if (es->predicate)
1728         {
1729           p = remap_predicate (info, callee_info,
1730                                es->predicate, operand_map, possible_truths,
1731                                toplev_predicate);
1732           edge_set_predicate (e, &p);
1733           /* TODO: We should remove the edge for code that will be optimized out,
1734              but we need to keep verifiers and tree-inline happy.
1735              Make it cold for now.  */
1736           if (false_predicate_p (&p))
1737             {
1738               e->count = 0;
1739               e->frequency = 0;
1740             }
1741         }
1742       if (!e->inline_failed)
1743         remap_edge_predicates (e->callee, info, callee_info, operand_map,
1744                                possible_truths, toplev_predicate);
1745     }
1746   for (e = node->indirect_calls; e; e = e->next_callee)
1747     {
1748       struct inline_edge_summary *es = inline_edge_summary (e);
1749       struct predicate p;
1750       if (es->predicate)
1751         {
1752           p = remap_predicate (info, callee_info,
1753                                es->predicate, operand_map, possible_truths,
1754                                toplev_predicate);
1755           edge_set_predicate (e, &p);
1756           /* TODO: We should remove the edge for code that will be optimized out,
1757              but we need to keep verifiers and tree-inline happy.
1758              Make it cold for now.  */
1759           if (false_predicate_p (&p))
1760             {
1761               e->count = 0;
1762               e->frequency = 0;
1763             }
1764         }
1765     }
1766 }
1767
1768
1769 /* We inlined EDGE.  Update summary of the function we inlined into.  */
1770
1771 void
1772 inline_merge_summary (struct cgraph_edge *edge)
1773 {
1774   struct inline_summary *callee_info = inline_summary (edge->callee);
1775   struct cgraph_node *to = (edge->caller->global.inlined_to
1776                             ? edge->caller->global.inlined_to : edge->caller);
1777   struct inline_summary *info = inline_summary (to);
1778   clause_t clause = 0;          /* not_inline is known to be false.  */
1779   size_time_entry *e;
1780   VEC (int, heap) *operand_map = NULL;
1781   int i;
1782   struct predicate toplev_predicate;
1783   struct inline_edge_summary *es = inline_edge_summary (edge);
1784
1785   if (es->predicate)
1786     toplev_predicate = *es->predicate;
1787   else
1788     toplev_predicate = true_predicate ();
1789
1790   if (ipa_node_params_vector && callee_info->conds
1791       /* FIXME: it seems that we forget to get argument count in some cases,
1792          probaby for previously indirect edges or so.
1793          Removing the test leads to ICE on tramp3d.  */
1794       && ipa_get_cs_argument_count (IPA_EDGE_REF (edge)))
1795     {
1796       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
1797       int count = ipa_get_cs_argument_count (args);
1798       int i;
1799
1800       clause = evaluate_conditions_for_edge (edge, true);
1801       VEC_safe_grow_cleared (int, heap, operand_map, count);
1802       for (i = 0; i < count; i++)
1803         {
1804           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
1805           int map = -1;
1806           /* TODO: handle non-NOPs when merging.  */
1807           if (jfunc->type == IPA_JF_PASS_THROUGH
1808               && jfunc->value.pass_through.operation == NOP_EXPR)
1809             map = jfunc->value.pass_through.formal_id;
1810           VEC_replace (int, operand_map, i, map);
1811           gcc_assert (map < ipa_get_param_count (IPA_NODE_REF (to)));
1812         }
1813     }
1814   for (i = 0; VEC_iterate (size_time_entry, callee_info->entry, i, e); i++)
1815     {
1816       struct predicate p = remap_predicate (info, callee_info,
1817                                             &e->predicate, operand_map, clause,
1818                                             &toplev_predicate);
1819       gcov_type add_time = ((gcov_type)e->time * edge->frequency
1820                             + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
1821       if (add_time > MAX_TIME)
1822         add_time = MAX_TIME;
1823       account_size_time (info, e->size, add_time, &p);
1824     }
1825   remap_edge_predicates (edge->callee, info, callee_info, operand_map,
1826                          clause, &toplev_predicate);
1827   info->size = 0;
1828   info->time = 0;
1829   for (i = 0; VEC_iterate (size_time_entry, info->entry, i, e); i++)
1830     info->size += e->size, info->time += e->time;
1831   estimate_calls_size_and_time (to, &info->size, &info->time,
1832                                 ~(clause_t)(1 << predicate_false_condition));
1833
1834   inline_update_callee_summaries (edge->callee,
1835                                   inline_edge_summary (edge)->loop_depth);
1836
1837   info->time = (info->time + INLINE_TIME_SCALE / 2) / INLINE_TIME_SCALE;
1838   info->size = (info->size + INLINE_SIZE_SCALE / 2) / INLINE_SIZE_SCALE;
1839 }
1840
1841
1842 /* Estimate the time cost for the caller when inlining EDGE.
1843    Only to be called via estimate_edge_time, that handles the
1844    caching mechanism.
1845
1846    When caching, also update the cache entry.  Compute both time and
1847    size, since we always need both metrics eventually.  */
1848
1849 int
1850 do_estimate_edge_time (struct cgraph_edge *edge)
1851 {
1852   int time;
1853   int size;
1854   gcov_type ret;
1855   struct inline_edge_summary *es = inline_edge_summary (edge);
1856
1857   gcc_checking_assert (edge->inline_failed);
1858   estimate_callee_size_and_time (edge, true, &size, &time);
1859
1860   ret = (((gcov_type)time - es->call_stmt_time) * edge->frequency
1861          + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
1862   if (ret > MAX_TIME)
1863     ret = MAX_TIME;
1864
1865   /* When caching, update the cache entry.  */
1866   if (edge_growth_cache)
1867     {
1868       int ret_size;
1869       if ((int)VEC_length (edge_growth_cache_entry, edge_growth_cache)
1870           <= edge->uid)
1871         VEC_safe_grow_cleared (edge_growth_cache_entry, heap, edge_growth_cache,
1872                                cgraph_edge_max_uid);
1873       VEC_index (edge_growth_cache_entry, edge_growth_cache, edge->uid)->time
1874         = ret + (ret >= 0);
1875
1876       ret_size = size - es->call_stmt_size;
1877       gcc_checking_assert (es->call_stmt_size);
1878       VEC_index (edge_growth_cache_entry, edge_growth_cache, edge->uid)->size
1879         = ret_size + (ret_size >= 0);
1880     }
1881   return ret;
1882 }
1883
1884
1885 /* Estimate the growth of the caller when inlining EDGE.
1886    Only to be called via estimate_edge_size.  */
1887
1888 int
1889 do_estimate_edge_growth (struct cgraph_edge *edge)
1890 {
1891   int size;
1892
1893   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
1894
1895   if (edge_growth_cache)
1896     {
1897       do_estimate_edge_time (edge);
1898       size = VEC_index (edge_growth_cache_entry,
1899                         edge_growth_cache,
1900                         edge->uid)->size;
1901       gcc_checking_assert (size);
1902       return size - (size > 0);
1903     }
1904
1905   /* Early inliner runs without caching, go ahead and do the dirty work.  */
1906   gcc_checking_assert (edge->inline_failed);
1907   estimate_callee_size_and_time (edge, true, &size, NULL);
1908   gcc_checking_assert (inline_edge_summary (edge)->call_stmt_size);
1909   return size - inline_edge_summary (edge)->call_stmt_size;
1910 }
1911
1912
1913 /* Estimate self time of the function NODE after inlining EDGE.  */
1914
1915 int
1916 estimate_time_after_inlining (struct cgraph_node *node,
1917                               struct cgraph_edge *edge)
1918 {
1919   struct inline_edge_summary *es = inline_edge_summary (edge);
1920   if (!es->predicate || !false_predicate_p (es->predicate))
1921     {
1922       gcov_type time = inline_summary (node)->time + estimate_edge_time (edge);
1923       if (time < 0)
1924         time = 0;
1925       if (time > MAX_TIME)
1926         time = MAX_TIME;
1927       return time;
1928     }
1929   return inline_summary (node)->time;
1930 }
1931
1932
1933 /* Estimate the size of NODE after inlining EDGE which should be an
1934    edge to either NODE or a call inlined into NODE.  */
1935
1936 int
1937 estimate_size_after_inlining (struct cgraph_node *node,
1938                               struct cgraph_edge *edge)
1939 {
1940   struct inline_edge_summary *es = inline_edge_summary (edge);
1941   if (!es->predicate || !false_predicate_p (es->predicate))
1942     {
1943       int size = inline_summary (node)->size + estimate_edge_growth (edge);
1944       gcc_assert (size >= 0);
1945       return size;
1946     }
1947   return inline_summary (node)->size;
1948 }
1949
1950
1951 /* Estimate the growth caused by inlining NODE into all callees.  */
1952
1953 int
1954 do_estimate_growth (struct cgraph_node *node)
1955 {
1956   int growth = 0;
1957   struct cgraph_edge *e;
1958   bool self_recursive = false;
1959   struct inline_summary *info = inline_summary (node);
1960
1961   for (e = node->callers; e; e = e->next_caller)
1962     {
1963       gcc_checking_assert (e->inline_failed);
1964
1965       if (e->caller == node
1966           || (e->caller->global.inlined_to
1967               && e->caller->global.inlined_to == node))
1968         self_recursive = true;
1969       growth += estimate_edge_growth (e);
1970     }
1971
1972
1973   /* For self recursive functions the growth estimation really should be
1974      infinity.  We don't want to return very large values because the growth
1975      plays various roles in badness computation fractions.  Be sure to not
1976      return zero or negative growths. */
1977   if (self_recursive)
1978     growth = growth < info->size ? info->size : growth;
1979   else
1980     {
1981       if (cgraph_will_be_removed_from_program_if_no_direct_calls (node)
1982           && !DECL_EXTERNAL (node->decl))
1983         growth -= info->size;
1984       /* COMDAT functions are very often not shared across multiple units since they
1985          come from various template instantiations.  Take this into account.  */
1986       else  if (DECL_COMDAT (node->decl)
1987                 && cgraph_can_remove_if_no_direct_calls_p (node))
1988         growth -= (info->size
1989                    * (100 - PARAM_VALUE (PARAM_COMDAT_SHARING_PROBABILITY)) + 50) / 100;
1990     }
1991
1992   if (node_growth_cache)
1993     {
1994       if ((int)VEC_length (int, node_growth_cache) <= node->uid)
1995         VEC_safe_grow_cleared (int, heap, node_growth_cache, cgraph_max_uid);
1996       VEC_replace (int, node_growth_cache, node->uid, growth + (growth >= 0));
1997     }
1998   return growth;
1999 }
2000
2001
2002 /* This function performs intraprocedural analysis in NODE that is required to
2003    inline indirect calls.  */
2004
2005 static void
2006 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
2007 {
2008   ipa_analyze_node (node);
2009   if (dump_file && (dump_flags & TDF_DETAILS))
2010     {
2011       ipa_print_node_params (dump_file, node);
2012       ipa_print_node_jump_functions (dump_file, node);
2013     }
2014 }
2015
2016
2017 /* Note function body size.  */
2018
2019 static void
2020 inline_analyze_function (struct cgraph_node *node)
2021 {
2022   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2023   current_function_decl = node->decl;
2024
2025   if (dump_file)
2026     fprintf (dump_file, "\nAnalyzing function: %s/%u\n",
2027              cgraph_node_name (node), node->uid);
2028   /* FIXME: We should remove the optimize check after we ensure we never run
2029      IPA passes when not optimizing.  */
2030   if (flag_indirect_inlining && optimize)
2031     inline_indirect_intraprocedural_analysis (node);
2032   compute_inline_parameters (node, false);
2033
2034   current_function_decl = NULL;
2035   pop_cfun ();
2036 }
2037
2038
2039 /* Called when new function is inserted to callgraph late.  */
2040
2041 static void
2042 add_new_function (struct cgraph_node *node, void *data ATTRIBUTE_UNUSED)
2043 {
2044   inline_analyze_function (node);
2045 }
2046
2047
2048 /* Note function body size.  */
2049
2050 void
2051 inline_generate_summary (void)
2052 {
2053   struct cgraph_node *node;
2054
2055   function_insertion_hook_holder =
2056       cgraph_add_function_insertion_hook (&add_new_function, NULL);
2057
2058   if (flag_indirect_inlining)
2059     ipa_register_cgraph_hooks ();
2060
2061   for (node = cgraph_nodes; node; node = node->next)
2062     if (node->analyzed)
2063       inline_analyze_function (node);
2064 }
2065
2066
2067 /* Read predicate from IB.  */
2068
2069 static struct predicate
2070 read_predicate (struct lto_input_block *ib)
2071 {
2072   struct predicate out;
2073   clause_t clause;
2074   int k = 0;
2075
2076   do
2077     {
2078       gcc_assert (k <= MAX_CLAUSES);
2079       clause = out.clause[k++] = lto_input_uleb128 (ib);
2080     }
2081   while (clause);
2082   return out;
2083 }
2084
2085
2086 /* Write inline summary for edge E to OB.  */
2087
2088 static void
2089 read_inline_edge_summary (struct lto_input_block *ib, struct cgraph_edge *e)
2090 {
2091   struct inline_edge_summary *es = inline_edge_summary (e);
2092   struct predicate p;
2093
2094   es->call_stmt_size = lto_input_uleb128 (ib);
2095   es->call_stmt_time = lto_input_uleb128 (ib);
2096   es->loop_depth = lto_input_uleb128 (ib);
2097   p = read_predicate (ib);
2098   edge_set_predicate (e, &p);
2099 }
2100
2101
2102 /* Stream in inline summaries from the section.  */
2103
2104 static void
2105 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
2106                      size_t len)
2107 {
2108   const struct lto_function_header *header =
2109     (const struct lto_function_header *) data;
2110   const int32_t cfg_offset = sizeof (struct lto_function_header);
2111   const int32_t main_offset = cfg_offset + header->cfg_size;
2112   const int32_t string_offset = main_offset + header->main_size;
2113   struct data_in *data_in;
2114   struct lto_input_block ib;
2115   unsigned int i, count2, j;
2116   unsigned int f_count;
2117
2118   LTO_INIT_INPUT_BLOCK (ib, (const char *) data + main_offset, 0,
2119                         header->main_size);
2120
2121   data_in =
2122     lto_data_in_create (file_data, (const char *) data + string_offset,
2123                         header->string_size, NULL);
2124   f_count = lto_input_uleb128 (&ib);
2125   for (i = 0; i < f_count; i++)
2126     {
2127       unsigned int index;
2128       struct cgraph_node *node;
2129       struct inline_summary *info;
2130       lto_cgraph_encoder_t encoder;
2131       struct bitpack_d bp;
2132       struct cgraph_edge *e;
2133
2134       index = lto_input_uleb128 (&ib);
2135       encoder = file_data->cgraph_node_encoder;
2136       node = lto_cgraph_encoder_deref (encoder, index);
2137       info = inline_summary (node);
2138
2139       info->estimated_stack_size
2140         = info->estimated_self_stack_size = lto_input_uleb128 (&ib);
2141       info->size = info->self_size = lto_input_uleb128 (&ib);
2142       info->time = info->self_time = lto_input_uleb128 (&ib);
2143
2144       bp = lto_input_bitpack (&ib);
2145       info->inlinable = bp_unpack_value (&bp, 1);
2146       info->versionable = bp_unpack_value (&bp, 1);
2147
2148       count2 = lto_input_uleb128 (&ib);
2149       gcc_assert (!info->conds);
2150       for (j = 0; j < count2; j++)
2151         {
2152           struct condition c;
2153           c.operand_num = lto_input_uleb128 (&ib);
2154           c.code = (enum tree_code) lto_input_uleb128 (&ib);
2155           c.val = lto_input_tree (&ib, data_in);
2156           VEC_safe_push (condition, gc, info->conds, &c);
2157         }
2158       count2 = lto_input_uleb128 (&ib);
2159       gcc_assert (!info->entry);
2160       for (j = 0; j < count2; j++)
2161         {
2162           struct size_time_entry e;
2163
2164           e.size = lto_input_uleb128 (&ib);
2165           e.time = lto_input_uleb128 (&ib);
2166           e.predicate = read_predicate (&ib);
2167
2168           VEC_safe_push (size_time_entry, gc, info->entry, &e);
2169         }
2170       for (e = node->callees; e; e = e->next_callee)
2171         read_inline_edge_summary (&ib, e);
2172       for (e = node->indirect_calls; e; e = e->next_callee)
2173         read_inline_edge_summary (&ib, e);
2174     }
2175
2176   lto_free_section_data (file_data, LTO_section_inline_summary, NULL, data,
2177                          len);
2178   lto_data_in_delete (data_in);
2179 }
2180
2181
2182 /* Read inline summary.  Jump functions are shared among ipa-cp
2183    and inliner, so when ipa-cp is active, we don't need to write them
2184    twice.  */
2185
2186 void
2187 inline_read_summary (void)
2188 {
2189   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
2190   struct lto_file_decl_data *file_data;
2191   unsigned int j = 0;
2192
2193   inline_summary_alloc ();
2194
2195   while ((file_data = file_data_vec[j++]))
2196     {
2197       size_t len;
2198       const char *data = lto_get_section_data (file_data, LTO_section_inline_summary, NULL, &len);
2199       if (data)
2200         inline_read_section (file_data, data, len);
2201       else
2202         /* Fatal error here.  We do not want to support compiling ltrans units with
2203            different version of compiler or different flags than the WPA unit, so
2204            this should never happen.  */
2205         fatal_error ("ipa inline summary is missing in input file");
2206     }
2207   if (flag_indirect_inlining)
2208     {
2209       ipa_register_cgraph_hooks ();
2210       if (!flag_ipa_cp)
2211         ipa_prop_read_jump_functions ();
2212     }
2213   function_insertion_hook_holder =
2214       cgraph_add_function_insertion_hook (&add_new_function, NULL);
2215 }
2216
2217
2218 /* Write predicate P to OB.  */
2219
2220 static void
2221 write_predicate (struct output_block *ob, struct predicate *p)
2222 {
2223   int j;
2224   if (p)
2225     for (j = 0; p->clause[j]; j++)
2226       {
2227          gcc_assert (j < MAX_CLAUSES);
2228          lto_output_uleb128_stream (ob->main_stream,
2229                                     p->clause[j]);
2230       }
2231   lto_output_uleb128_stream (ob->main_stream, 0);
2232 }
2233
2234
2235 /* Write inline summary for edge E to OB.  */
2236
2237 static void
2238 write_inline_edge_summary (struct output_block *ob, struct cgraph_edge *e)
2239 {
2240   struct inline_edge_summary *es = inline_edge_summary (e);
2241   lto_output_uleb128_stream (ob->main_stream, es->call_stmt_size);
2242   lto_output_uleb128_stream (ob->main_stream, es->call_stmt_time);
2243   lto_output_uleb128_stream (ob->main_stream, es->loop_depth);
2244   write_predicate (ob, es->predicate);
2245 }
2246
2247
2248 /* Write inline summary for node in SET.
2249    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
2250    active, we don't need to write them twice.  */
2251
2252 void
2253 inline_write_summary (cgraph_node_set set,
2254                       varpool_node_set vset ATTRIBUTE_UNUSED)
2255 {
2256   struct cgraph_node *node;
2257   struct output_block *ob = create_output_block (LTO_section_inline_summary);
2258   lto_cgraph_encoder_t encoder = ob->decl_state->cgraph_node_encoder;
2259   unsigned int count = 0;
2260   int i;
2261
2262   for (i = 0; i < lto_cgraph_encoder_size (encoder); i++)
2263     if (lto_cgraph_encoder_deref (encoder, i)->analyzed)
2264       count++;
2265   lto_output_uleb128_stream (ob->main_stream, count);
2266
2267   for (i = 0; i < lto_cgraph_encoder_size (encoder); i++)
2268     {
2269       node = lto_cgraph_encoder_deref (encoder, i);
2270       if (node->analyzed)
2271         {
2272           struct inline_summary *info = inline_summary (node);
2273           struct bitpack_d bp;
2274           struct cgraph_edge *edge;
2275           int i;
2276           size_time_entry *e;
2277           struct condition *c;
2278
2279
2280           lto_output_uleb128_stream (ob->main_stream,
2281                                      lto_cgraph_encoder_encode (encoder, node));
2282           lto_output_sleb128_stream (ob->main_stream,
2283                                      info->estimated_self_stack_size);
2284           lto_output_sleb128_stream (ob->main_stream,
2285                                      info->self_size);
2286           lto_output_sleb128_stream (ob->main_stream,
2287                                      info->self_time);
2288           bp = bitpack_create (ob->main_stream);
2289           bp_pack_value (&bp, info->inlinable, 1);
2290           bp_pack_value (&bp, info->versionable, 1);
2291           lto_output_bitpack (&bp);
2292           lto_output_uleb128_stream (ob->main_stream,
2293                                      VEC_length (condition, info->conds));
2294           for (i = 0; VEC_iterate (condition, info->conds, i, c); i++)
2295             {
2296               lto_output_uleb128_stream (ob->main_stream,
2297                                          c->operand_num);
2298               lto_output_uleb128_stream (ob->main_stream,
2299                                          c->code);
2300               lto_output_tree (ob, c->val, true);
2301             }
2302           lto_output_uleb128_stream (ob->main_stream,
2303                                      VEC_length (size_time_entry, info->entry));
2304           for (i = 0;
2305                VEC_iterate (size_time_entry, info->entry, i, e);
2306                i++)
2307             {
2308               lto_output_uleb128_stream (ob->main_stream,
2309                                          e->size);
2310               lto_output_uleb128_stream (ob->main_stream,
2311                                          e->time);
2312               write_predicate (ob, &e->predicate);
2313             }
2314           for (edge = node->callees; edge; edge = edge->next_callee)
2315             write_inline_edge_summary (ob, edge);
2316           for (edge = node->indirect_calls; edge; edge = edge->next_callee)
2317             write_inline_edge_summary (ob, edge);
2318         }
2319     }
2320   lto_output_1_stream (ob->main_stream, 0);
2321   produce_asm (ob, NULL);
2322   destroy_output_block (ob);
2323
2324   if (flag_indirect_inlining && !flag_ipa_cp)
2325     ipa_prop_write_jump_functions (set);
2326 }
2327
2328
2329 /* Release inline summary.  */
2330
2331 void
2332 inline_free_summary (void)
2333 {
2334   if (function_insertion_hook_holder)
2335     cgraph_remove_function_insertion_hook (function_insertion_hook_holder);
2336   function_insertion_hook_holder = NULL;
2337   if (node_removal_hook_holder)
2338     cgraph_remove_node_removal_hook (node_removal_hook_holder);
2339   if (edge_removal_hook_holder)
2340     cgraph_remove_edge_removal_hook (edge_removal_hook_holder);
2341   node_removal_hook_holder = NULL;
2342   if (node_duplication_hook_holder)
2343     cgraph_remove_node_duplication_hook (node_duplication_hook_holder);
2344   if (edge_duplication_hook_holder)
2345     cgraph_remove_edge_duplication_hook (edge_duplication_hook_holder);
2346   node_duplication_hook_holder = NULL;
2347   VEC_free (inline_summary_t, gc, inline_summary_vec);
2348   inline_summary_vec = NULL;
2349   VEC_free (inline_edge_summary_t, heap, inline_edge_summary_vec);
2350   inline_edge_summary_vec = NULL;
2351   if (edge_predicate_pool)
2352     free_alloc_pool (edge_predicate_pool);
2353   edge_predicate_pool = 0;
2354 }