gcc/ipa-inline.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003-2019 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /*  Inlining decision heuristics
  22
  23     The implementation of inliner is organized as follows:
  24
  25     inlining heuristics limits
  26
  27       can_inline_edge_p allow to check that particular inlining is allowed
  28       by the limits specified by user (allowed function growth, growth and so
  29       on).
  30
  31       Functions are inlined when it is obvious the result is profitable (such
  32       as functions called once or when inlining reduce code size).
  33       In addition to that we perform inlining of small functions and recursive
  34       inlining.
  35
  36     inlining heuristics
  37
  38        The inliner itself is split into two passes:
  39
  40        pass_early_inlining
  41
  42          Simple local inlining pass inlining callees into current function.
  43          This pass makes no use of whole unit analysis and thus it can do only
  44          very simple decisions based on local properties.
  45
  46          The strength of the pass is that it is run in topological order
  47          (reverse postorder) on the callgraph. Functions are converted into SSA
  48          form just before this pass and optimized subsequently. As a result, the
  49          callees of the function seen by the early inliner was already optimized
  50          and results of early inlining adds a lot of optimization opportunities
  51          for the local optimization.
  52
  53          The pass handle the obvious inlining decisions within the compilation
  54          unit - inlining auto inline functions, inlining for size and
  55          flattening.
  56
  57          main strength of the pass is the ability to eliminate abstraction
  58          penalty in C++ code (via combination of inlining and early
  59          optimization) and thus improve quality of analysis done by real IPA
  60          optimizers.
  61
  62          Because of lack of whole unit knowledge, the pass cannot really make
  63          good code size/performance tradeoffs.  It however does very simple
  64          speculative inlining allowing code size to grow by
  65          EARLY_INLINING_INSNS when callee is leaf function.  In this case the
  66          optimizations performed later are very likely to eliminate the cost.
  67
  68        pass_ipa_inline
  69
  70          This is the real inliner able to handle inlining with whole program
  71          knowledge. It performs following steps:
  72
  73          1) inlining of small functions.  This is implemented by greedy
  74          algorithm ordering all inlinable cgraph edges by their badness and
  75          inlining them in this order as long as inline limits allows doing so.
  76
  77          This heuristics is not very good on inlining recursive calls. Recursive
  78          calls can be inlined with results similar to loop unrolling. To do so,
  79          special purpose recursive inliner is executed on function when
  80          recursive edge is met as viable candidate.
  81
  82          2) Unreachable functions are removed from callgraph.  Inlining leads
  83          to devirtualization and other modification of callgraph so functions
  84          may become unreachable during the process. Also functions declared as
  85          extern inline or virtual functions are removed, since after inlining
  86          we no longer need the offline bodies.
  87
  88          3) Functions called once and not exported from the unit are inlined.
  89          This should almost always lead to reduction of code size by eliminating
  90          the need for offline copy of the function.  */
  91
  92 #include "config.h"
  93 #include "system.h"
  94 #include "coretypes.h"
  95 #include "backend.h"
  96 #include "target.h"
  97 #include "rtl.h"
  98 #include "tree.h"
  99 #include "gimple.h"
 100 #include "alloc-pool.h"
 101 #include "tree-pass.h"
 102 #include "gimple-ssa.h"
 103 #include "cgraph.h"
 104 #include "lto-streamer.h"
 105 #include "trans-mem.h"
 106 #include "calls.h"
 107 #include "tree-inline.h"
 108 #include "params.h"
 109 #include "profile.h"
 110 #include "symbol-summary.h"
 111 #include "tree-vrp.h"
 112 #include "ipa-prop.h"
 113 #include "ipa-fnsummary.h"
 114 #include "ipa-inline.h"
 115 #include "ipa-utils.h"
 116 #include "sreal.h"
 117 #include "auto-profile.h"
 118 #include "builtins.h"
 119 #include "fibonacci_heap.h"
 120 #include "stringpool.h"
 121 #include "attribs.h"
 122 #include "asan.h"
 123
 124 typedef fibonacci_heap <sreal, cgraph_edge> edge_heap_t;
 125 typedef fibonacci_node <sreal, cgraph_edge> edge_heap_node_t;
 126
 127 /* Statistics we collect about inlining algorithm.  */
 128 static int overall_size;
 129 static profile_count max_count;
 130 static profile_count spec_rem;
 131
 132 /* Return false when inlining edge E would lead to violating
 133    limits on function unit growth or stack usage growth.
 134
 135    The relative function body growth limit is present generally
 136    to avoid problems with non-linear behavior of the compiler.
 137    To allow inlining huge functions into tiny wrapper, the limit
 138    is always based on the bigger of the two functions considered.
 139
 140    For stack growth limits we always base the growth in stack usage
 141    of the callers.  We want to prevent applications from segfaulting
 142    on stack overflow when functions with huge stack frames gets
 143    inlined. */
 144
 145 static bool
 146 caller_growth_limits (struct cgraph_edge *e)
 147 {
 148   struct cgraph_node *to = e->caller;
 149   struct cgraph_node *what = e->callee->ultimate_alias_target ();
 150   int newsize;
 151   int limit = 0;
 152   HOST_WIDE_INT stack_size_limit = 0, inlined_stack;
 153   ipa_size_summary *outer_info = ipa_size_summaries->get (to);
 154
 155   /* Look for function e->caller is inlined to.  While doing
 156      so work out the largest function body on the way.  As
 157      described above, we want to base our function growth
 158      limits based on that.  Not on the self size of the
 159      outer function, not on the self size of inline code
 160      we immediately inline to.  This is the most relaxed
 161      interpretation of the rule "do not grow large functions
 162      too much in order to prevent compiler from exploding".  */
 163   while (true)
 164     {
 165       ipa_size_summary *size_info = ipa_size_summaries->get (to);
 166       if (limit < size_info->self_size)
 167         limit = size_info->self_size;
 168       if (stack_size_limit < size_info->estimated_self_stack_size)
 169         stack_size_limit = size_info->estimated_self_stack_size;
 170       if (to->inlined_to)
 171         to = to->callers->caller;
 172       else
 173         break;
 174     }
 175
 176   ipa_fn_summary *what_info = ipa_fn_summaries->get (what);
 177   ipa_size_summary *what_size_info = ipa_size_summaries->get (what);
 178
 179   if (limit < what_size_info->self_size)
 180     limit = what_size_info->self_size;
 181
 182   limit += limit * PARAM_VALUE (PARAM_LARGE_FUNCTION_GROWTH) / 100;
 183
 184   /* Check the size after inlining against the function limits.  But allow
 185      the function to shrink if it went over the limits by forced inlining.  */
 186   newsize = estimate_size_after_inlining (to, e);
 187   if (newsize >= ipa_size_summaries->get (what)->size
 188       && newsize > PARAM_VALUE (PARAM_LARGE_FUNCTION_INSNS)
 189       && newsize > limit)
 190     {
 191       e->inline_failed = CIF_LARGE_FUNCTION_GROWTH_LIMIT;
 192       return false;
 193     }
 194
 195   if (!what_info->estimated_stack_size)
 196     return true;
 197
 198   /* FIXME: Stack size limit often prevents inlining in Fortran programs
 199      due to large i/o datastructures used by the Fortran front-end.
 200      We ought to ignore this limit when we know that the edge is executed
 201      on every invocation of the caller (i.e. its call statement dominates
 202      exit block).  We do not track this information, yet.  */
 203   stack_size_limit += ((gcov_type)stack_size_limit
 204                        * PARAM_VALUE (PARAM_STACK_FRAME_GROWTH) / 100);
 205
 206   inlined_stack = (ipa_get_stack_frame_offset (to)
 207                    + outer_info->estimated_self_stack_size
 208                    + what_info->estimated_stack_size);
 209   /* Check new stack consumption with stack consumption at the place
 210      stack is used.  */
 211   if (inlined_stack > stack_size_limit
 212       /* If function already has large stack usage from sibling
 213          inline call, we can inline, too.
 214          This bit overoptimistically assume that we are good at stack
 215          packing.  */
 216       && inlined_stack > ipa_fn_summaries->get (to)->estimated_stack_size
 217       && inlined_stack > PARAM_VALUE (PARAM_LARGE_STACK_FRAME))
 218     {
 219       e->inline_failed = CIF_LARGE_STACK_FRAME_GROWTH_LIMIT;
 220       return false;
 221     }
 222   return true;
 223 }
 224
 225 /* Dump info about why inlining has failed.  */
 226
 227 static void
 228 report_inline_failed_reason (struct cgraph_edge *e)
 229 {
 230   if (dump_enabled_p ())
 231     {
 232       dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 233                        "  not inlinable: %C -> %C, %s\n",
 234                        e->caller, e->callee,
 235                        cgraph_inline_failed_string (e->inline_failed));
 236       if ((e->inline_failed == CIF_TARGET_OPTION_MISMATCH
 237            || e->inline_failed == CIF_OPTIMIZATION_MISMATCH)
 238           && e->caller->lto_file_data
 239           && e->callee->ultimate_alias_target ()->lto_file_data)
 240         {
 241           dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 242                            "  LTO objects: %s, %s\n",
 243                            e->caller->lto_file_data->file_name,
 244                            e->callee->ultimate_alias_target ()->lto_file_data->file_name);
 245         }
 246       if (e->inline_failed == CIF_TARGET_OPTION_MISMATCH)
 247         if (dump_file)
 248           cl_target_option_print_diff
 249             (dump_file, 2, target_opts_for_fn (e->caller->decl),
 250              target_opts_for_fn (e->callee->ultimate_alias_target ()->decl));
 251       if (e->inline_failed == CIF_OPTIMIZATION_MISMATCH)
 252         if (dump_file)
 253           cl_optimization_print_diff
 254             (dump_file, 2, opts_for_fn (e->caller->decl),
 255              opts_for_fn (e->callee->ultimate_alias_target ()->decl));
 256     }
 257 }
 258
 259  /* Decide whether sanitizer-related attributes allow inlining. */
 260
 261 static bool
 262 sanitize_attrs_match_for_inline_p (const_tree caller, const_tree callee)
 263 {
 264   if (!caller || !callee)
 265     return true;
 266
 267   /* Allow inlining always_inline functions into no_sanitize_address
 268      functions.  */
 269   if (!sanitize_flags_p (SANITIZE_ADDRESS, caller)
 270       && lookup_attribute ("always_inline", DECL_ATTRIBUTES (callee)))
 271     return true;
 272
 273   return ((sanitize_flags_p (SANITIZE_ADDRESS, caller)
 274            == sanitize_flags_p (SANITIZE_ADDRESS, callee))
 275           && (sanitize_flags_p (SANITIZE_POINTER_COMPARE, caller)
 276               == sanitize_flags_p (SANITIZE_POINTER_COMPARE, callee))
 277           && (sanitize_flags_p (SANITIZE_POINTER_SUBTRACT, caller)
 278               == sanitize_flags_p (SANITIZE_POINTER_SUBTRACT, callee)));
 279 }
 280
 281 /* Used for flags where it is safe to inline when caller's value is
 282    grater than callee's.  */
 283 #define check_maybe_up(flag) \
 284       (opts_for_fn (caller->decl)->x_##flag             \
 285        != opts_for_fn (callee->decl)->x_##flag          \
 286        && (!always_inline                               \
 287            || opts_for_fn (caller->decl)->x_##flag      \
 288               < opts_for_fn (callee->decl)->x_##flag))
 289 /* Used for flags where it is safe to inline when caller's value is
 290    smaller than callee's.  */
 291 #define check_maybe_down(flag) \
 292       (opts_for_fn (caller->decl)->x_##flag             \
 293        != opts_for_fn (callee->decl)->x_##flag          \
 294        && (!always_inline                               \
 295            || opts_for_fn (caller->decl)->x_##flag      \
 296               > opts_for_fn (callee->decl)->x_##flag))
 297 /* Used for flags where exact match is needed for correctness.  */
 298 #define check_match(flag) \
 299       (opts_for_fn (caller->decl)->x_##flag             \
 300        != opts_for_fn (callee->decl)->x_##flag)
 301
 302 /* Decide if we can inline the edge and possibly update
 303    inline_failed reason.
 304    We check whether inlining is possible at all and whether
 305    caller growth limits allow doing so.
 306
 307    if REPORT is true, output reason to the dump file. */
 308
 309 static bool
 310 can_inline_edge_p (struct cgraph_edge *e, bool report,
 311                    bool early = false)
 312 {
 313   gcc_checking_assert (e->inline_failed);
 314
 315   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 316     {
 317       if (report)
 318         report_inline_failed_reason (e);
 319       return false;
 320     }
 321
 322   bool inlinable = true;
 323   enum availability avail;
 324   cgraph_node *caller = (e->caller->inlined_to
 325                          ? e->caller->inlined_to : e->caller);
 326   cgraph_node *callee = e->callee->ultimate_alias_target (&avail, caller);
 327
 328   if (!callee->definition)
 329     {
 330       e->inline_failed = CIF_BODY_NOT_AVAILABLE;
 331       inlinable = false;
 332     }
 333   if (!early && (!opt_for_fn (callee->decl, optimize)
 334                  || !opt_for_fn (caller->decl, optimize)))
 335     {
 336       e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
 337       inlinable = false;
 338     }
 339   else if (callee->calls_comdat_local)
 340     {
 341       e->inline_failed = CIF_USES_COMDAT_LOCAL;
 342       inlinable = false;
 343     }
 344   else if (avail <= AVAIL_INTERPOSABLE)
 345     {
 346       e->inline_failed = CIF_OVERWRITABLE;
 347       inlinable = false;
 348     }
 349   /* All edges with call_stmt_cannot_inline_p should have inline_failed
 350      initialized to one of FINAL_ERROR reasons.  */
 351   else if (e->call_stmt_cannot_inline_p)
 352     gcc_unreachable ();
 353   /* Don't inline if the functions have different EH personalities.  */
 354   else if (DECL_FUNCTION_PERSONALITY (caller->decl)
 355            && DECL_FUNCTION_PERSONALITY (callee->decl)
 356            && (DECL_FUNCTION_PERSONALITY (caller->decl)
 357                != DECL_FUNCTION_PERSONALITY (callee->decl)))
 358     {
 359       e->inline_failed = CIF_EH_PERSONALITY;
 360       inlinable = false;
 361     }
 362   /* TM pure functions should not be inlined into non-TM_pure
 363      functions.  */
 364   else if (is_tm_pure (callee->decl) && !is_tm_pure (caller->decl))
 365     {
 366       e->inline_failed = CIF_UNSPECIFIED;
 367       inlinable = false;
 368     }
 369   /* Check compatibility of target optimization options.  */
 370   else if (!targetm.target_option.can_inline_p (caller->decl,
 371                                                 callee->decl))
 372     {
 373       e->inline_failed = CIF_TARGET_OPTION_MISMATCH;
 374       inlinable = false;
 375     }
 376   else if (ipa_fn_summaries->get (callee) == NULL
 377            || !ipa_fn_summaries->get (callee)->inlinable)
 378     {
 379       e->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
 380       inlinable = false;
 381     }
 382   /* Don't inline a function with mismatched sanitization attributes. */
 383   else if (!sanitize_attrs_match_for_inline_p (caller->decl, callee->decl))
 384     {
 385       e->inline_failed = CIF_ATTRIBUTE_MISMATCH;
 386       inlinable = false;
 387     }
 388   if (!inlinable && report)
 389     report_inline_failed_reason (e);
 390   return inlinable;
 391 }
 392
 393 /* Return inlining_insns_single limit for function N. If HINT is true
 394    scale up the bound.  */
 395
 396 static int
 397 inline_insns_single (cgraph_node *n, bool hint)
 398 {
 399   if (opt_for_fn (n->decl, optimize) >= 3)
 400     {
 401       if (hint)
 402         return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SINGLE)
 403                * PARAM_VALUE (PARAM_INLINE_HEURISTICS_HINT_PERCENT) / 100;
 404       return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SINGLE);
 405     }
 406   else
 407     {
 408       if (hint)
 409         return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SINGLE_O2)
 410                * PARAM_VALUE (PARAM_INLINE_HEURISTICS_HINT_PERCENT_O2) / 100;
 411       return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SINGLE_O2);
 412     }
 413 }
 414
 415 /* Return inlining_insns_auto limit for function N. If HINT is true
 416    scale up the bound.   */
 417
 418 static int
 419 inline_insns_auto (cgraph_node *n, bool hint)
 420 {
 421   if (opt_for_fn (n->decl, optimize) >= 3)
 422     {
 423       if (hint)
 424         return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_AUTO)
 425                * PARAM_VALUE (PARAM_INLINE_HEURISTICS_HINT_PERCENT) / 100;
 426       return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_AUTO);
 427     }
 428   else
 429     {
 430       if (hint)
 431         return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_AUTO_O2)
 432                * PARAM_VALUE (PARAM_INLINE_HEURISTICS_HINT_PERCENT_O2) / 100;
 433       return PARAM_VALUE (PARAM_MAX_INLINE_INSNS_AUTO_O2);
 434     }
 435 }
 436
 437 /* Decide if we can inline the edge and possibly update
 438    inline_failed reason.
 439    We check whether inlining is possible at all and whether
 440    caller growth limits allow doing so.
 441
 442    if REPORT is true, output reason to the dump file.
 443
 444    if DISREGARD_LIMITS is true, ignore size limits.  */
 445
 446 static bool
 447 can_inline_edge_by_limits_p (struct cgraph_edge *e, bool report,
 448                              bool disregard_limits = false, bool early = false)
 449 {
 450   gcc_checking_assert (e->inline_failed);
 451
 452   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 453     {
 454       if (report)
 455         report_inline_failed_reason (e);
 456       return false;
 457     }
 458
 459   bool inlinable = true;
 460   enum availability avail;
 461   cgraph_node *caller = (e->caller->inlined_to
 462                          ? e->caller->inlined_to : e->caller);
 463   cgraph_node *callee = e->callee->ultimate_alias_target (&avail, caller);
 464   tree caller_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (caller->decl);
 465   tree callee_tree
 466     = callee ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee->decl) : NULL;
 467   /* Check if caller growth allows the inlining.  */
 468   if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl)
 469       && !disregard_limits
 470       && !lookup_attribute ("flatten",
 471                  DECL_ATTRIBUTES (caller->decl))
 472       && !caller_growth_limits (e))
 473     inlinable = false;
 474   else if (callee->externally_visible
 475            && !DECL_DISREGARD_INLINE_LIMITS (callee->decl)
 476            && flag_live_patching == LIVE_PATCHING_INLINE_ONLY_STATIC)
 477     {
 478       e->inline_failed = CIF_EXTERN_LIVE_ONLY_STATIC;
 479       inlinable = false;
 480     }
 481   /* Don't inline a function with a higher optimization level than the
 482      caller.  FIXME: this is really just tip of iceberg of handling
 483      optimization attribute.  */
 484   else if (caller_tree != callee_tree)
 485     {
 486       bool always_inline =
 487              (DECL_DISREGARD_INLINE_LIMITS (callee->decl)
 488               && lookup_attribute ("always_inline",
 489                                    DECL_ATTRIBUTES (callee->decl)));
 490       ipa_fn_summary *caller_info = ipa_fn_summaries->get (caller);
 491       ipa_fn_summary *callee_info = ipa_fn_summaries->get (callee);
 492
 493      /* Until GCC 4.9 we did not check the semantics-altering flags
 494         below and inlined across optimization boundaries.
 495         Enabling checks below breaks several packages by refusing
 496         to inline library always_inline functions. See PR65873.
 497         Disable the check for early inlining for now until better solution
 498         is found.  */
 499      if (always_inline && early)
 500         ;
 501       /* There are some options that change IL semantics which means
 502          we cannot inline in these cases for correctness reason.
 503          Not even for always_inline declared functions.  */
 504      else if (check_match (flag_wrapv)
 505               || check_match (flag_trapv)
 506               || check_match (flag_pcc_struct_return)
 507               /* When caller or callee does FP math, be sure FP codegen flags
 508                  compatible.  */
 509               || ((caller_info->fp_expressions && callee_info->fp_expressions)
 510                   && (check_maybe_up (flag_rounding_math)
 511                       || check_maybe_up (flag_trapping_math)
 512                       || check_maybe_down (flag_unsafe_math_optimizations)
 513                       || check_maybe_down (flag_finite_math_only)
 514                       || check_maybe_up (flag_signaling_nans)
 515                       || check_maybe_down (flag_cx_limited_range)
 516                       || check_maybe_up (flag_signed_zeros)
 517                       || check_maybe_down (flag_associative_math)
 518                       || check_maybe_down (flag_reciprocal_math)
 519                       || check_maybe_down (flag_fp_int_builtin_inexact)
 520                       /* Strictly speaking only when the callee contains function
 521                          calls that may end up setting errno.  */
 522                       || check_maybe_up (flag_errno_math)))
 523               /* We do not want to make code compiled with exceptions to be
 524                  brought into a non-EH function unless we know that the callee
 525                  does not throw.
 526                  This is tracked by DECL_FUNCTION_PERSONALITY.  */
 527               || (check_maybe_up (flag_non_call_exceptions)
 528                   && DECL_FUNCTION_PERSONALITY (callee->decl))
 529               || (check_maybe_up (flag_exceptions)
 530                   && DECL_FUNCTION_PERSONALITY (callee->decl))
 531               /* When devirtualization is diabled for callee, it is not safe
 532                  to inline it as we possibly mangled the type info.
 533                  Allow early inlining of always inlines.  */
 534               || (!early && check_maybe_down (flag_devirtualize)))
 535         {
 536           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 537           inlinable = false;
 538         }
 539       /* gcc.dg/pr43564.c.  Apply user-forced inline even at -O0.  */
 540       else if (always_inline)
 541         ;
 542       /* When user added an attribute to the callee honor it.  */
 543       else if (lookup_attribute ("optimize", DECL_ATTRIBUTES (callee->decl))
 544                && opts_for_fn (caller->decl) != opts_for_fn (callee->decl))
 545         {
 546           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 547           inlinable = false;
 548         }
 549       /* If explicit optimize attribute are not used, the mismatch is caused
 550          by different command line options used to build different units.
 551          Do not care about COMDAT functions - those are intended to be
 552          optimized with the optimization flags of module they are used in.
 553          Also do not care about mixing up size/speed optimization when
 554          DECL_DISREGARD_INLINE_LIMITS is set.  */
 555       else if ((callee->merged_comdat
 556                 && !lookup_attribute ("optimize",
 557                                       DECL_ATTRIBUTES (caller->decl)))
 558                || DECL_DISREGARD_INLINE_LIMITS (callee->decl))
 559         ;
 560       /* If mismatch is caused by merging two LTO units with different
 561          optimizationflags we want to be bit nicer.  However never inline
 562          if one of functions is not optimized at all.  */
 563       else if (!opt_for_fn (callee->decl, optimize)
 564                || !opt_for_fn (caller->decl, optimize))
 565         {
 566           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 567           inlinable = false;
 568         }
 569       /* If callee is optimized for size and caller is not, allow inlining if
 570          code shrinks or we are in MAX_INLINE_INSNS_SINGLE limit and callee
 571          is inline (and thus likely an unified comdat).  This will allow caller
 572          to run faster.  */
 573       else if (opt_for_fn (callee->decl, optimize_size)
 574                > opt_for_fn (caller->decl, optimize_size))
 575         {
 576           int growth = estimate_edge_growth (e);
 577           if (growth > PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SIZE)
 578               && (!DECL_DECLARED_INLINE_P (callee->decl)
 579                   && growth >= MAX (inline_insns_single (caller, false),
 580                                     inline_insns_auto (caller, false))))
 581             {
 582               e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 583               inlinable = false;
 584             }
 585         }
 586       /* If callee is more aggressively optimized for performance than caller,
 587          we generally want to inline only cheap (runtime wise) functions.  */
 588       else if (opt_for_fn (callee->decl, optimize_size)
 589                < opt_for_fn (caller->decl, optimize_size)
 590                || (opt_for_fn (callee->decl, optimize)
 591                    > opt_for_fn (caller->decl, optimize)))
 592         {
 593           if (estimate_edge_time (e)
 594               >= 20 + ipa_call_summaries->get (e)->call_stmt_time)
 595             {
 596               e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 597               inlinable = false;
 598             }
 599         }
 600
 601     }
 602
 603   if (!inlinable && report)
 604     report_inline_failed_reason (e);
 605   return inlinable;
 606 }
 607
 608
 609 /* Return true if the edge E is inlinable during early inlining.  */
 610
 611 static bool
 612 can_early_inline_edge_p (struct cgraph_edge *e)
 613 {
 614   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 615   /* Early inliner might get called at WPA stage when IPA pass adds new
 616      function.  In this case we cannot really do any of early inlining
 617      because function bodies are missing.  */
 618   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 619     return false;
 620   if (!gimple_has_body_p (callee->decl))
 621     {
 622       e->inline_failed = CIF_BODY_NOT_AVAILABLE;
 623       return false;
 624     }
 625   /* In early inliner some of callees may not be in SSA form yet
 626      (i.e. the callgraph is cyclic and we did not process
 627      the callee by early inliner, yet).  We don't have CIF code for this
 628      case; later we will re-do the decision in the real inliner.  */
 629   if (!gimple_in_ssa_p (DECL_STRUCT_FUNCTION (e->caller->decl))
 630       || !gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->decl)))
 631     {
 632       if (dump_enabled_p ())
 633         dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 634                          "  edge not inlinable: not in SSA form\n");
 635       return false;
 636     }
 637   if (!can_inline_edge_p (e, true, true)
 638       || !can_inline_edge_by_limits_p (e, true, false, true))
 639     return false;
 640   return true;
 641 }
 642
 643
 644 /* Return number of calls in N.  Ignore cheap builtins.  */
 645
 646 static int
 647 num_calls (struct cgraph_node *n)
 648 {
 649   struct cgraph_edge *e;
 650   int num = 0;
 651
 652   for (e = n->callees; e; e = e->next_callee)
 653     if (!is_inexpensive_builtin (e->callee->decl))
 654       num++;
 655   return num;
 656 }
 657
 658
 659 /* Return true if we are interested in inlining small function.  */
 660
 661 static bool
 662 want_early_inline_function_p (struct cgraph_edge *e)
 663 {
 664   bool want_inline = true;
 665   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 666
 667   if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
 668     ;
 669   /* For AutoFDO, we need to make sure that before profile summary, all
 670      hot paths' IR look exactly the same as profiled binary. As a result,
 671      in einliner, we will disregard size limit and inline those callsites
 672      that are:
 673        * inlined in the profiled binary, and
 674        * the cloned callee has enough samples to be considered "hot".  */
 675   else if (flag_auto_profile && afdo_callsite_hot_enough_for_early_inline (e))
 676     ;
 677   else if (!DECL_DECLARED_INLINE_P (callee->decl)
 678            && !opt_for_fn (e->caller->decl, flag_inline_small_functions))
 679     {
 680       e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
 681       report_inline_failed_reason (e);
 682       want_inline = false;
 683     }
 684   else
 685     {
 686       int growth = estimate_edge_growth (e);
 687       int n;
 688       int early_inlining_insns = opt_for_fn (e->caller->decl, optimize) >= 3
 689                                  ? PARAM_VALUE (PARAM_EARLY_INLINING_INSNS)
 690                                  : PARAM_VALUE (PARAM_EARLY_INLINING_INSNS_O2);
 691
 692
 693       if (growth <= PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SIZE))
 694         ;
 695       else if (!e->maybe_hot_p ())
 696         {
 697           if (dump_enabled_p ())
 698             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 699                              "  will not early inline: %C->%C, "
 700                              "call is cold and code would grow by %i\n",
 701                              e->caller, callee,
 702                              growth);
 703           want_inline = false;
 704         }
 705       else if (growth > early_inlining_insns)
 706         {
 707           if (dump_enabled_p ())
 708             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 709                              "  will not early inline: %C->%C, "
 710                              "growth %i exceeds --param early-inlining-insns%s\n",
 711                              e->caller, callee, growth,
 712                              opt_for_fn (e->caller->decl, optimize) >= 3
 713                              ? "" : "-O2");
 714           want_inline = false;
 715         }
 716       else if ((n = num_calls (callee)) != 0
 717                && growth * (n + 1) > early_inlining_insns)
 718         {
 719           if (dump_enabled_p ())
 720             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
 721                              "  will not early inline: %C->%C, "
 722                              "growth %i exceeds --param early-inlining-insns%s "
 723                              "divided by number of calls\n",
 724                              e->caller, callee, growth,
 725                              opt_for_fn (e->caller->decl, optimize) >= 3
 726                              ? "" : "-O2");
 727           want_inline = false;
 728         }
 729     }
 730   return want_inline;
 731 }
 732
 733 /* Compute time of the edge->caller + edge->callee execution when inlining
 734    does not happen.  */
 735
 736 inline sreal
 737 compute_uninlined_call_time (struct cgraph_edge *edge,
 738                              sreal uninlined_call_time)
 739 {
 740   cgraph_node *caller = (edge->caller->inlined_to
 741                          ? edge->caller->inlined_to
 742                          : edge->caller);
 743
 744   sreal freq = edge->sreal_frequency ();
 745   if (freq > 0)
 746     uninlined_call_time *= freq;
 747   else
 748     uninlined_call_time = uninlined_call_time >> 11;
 749
 750   sreal caller_time = ipa_fn_summaries->get (caller)->time;
 751   return uninlined_call_time + caller_time;
 752 }
 753
 754 /* Same as compute_uinlined_call_time but compute time when inlining
 755    does happen.  */
 756
 757 inline sreal
 758 compute_inlined_call_time (struct cgraph_edge *edge,
 759                            sreal time)
 760 {
 761   cgraph_node *caller = (edge->caller->inlined_to
 762                          ? edge->caller->inlined_to
 763                          : edge->caller);
 764   sreal caller_time = ipa_fn_summaries->get (caller)->time;
 765
 766   sreal freq = edge->sreal_frequency ();
 767   if (freq > 0)
 768     time *= freq;
 769   else
 770     time = time >> 11;
 771
 772   /* This calculation should match one in ipa-inline-analysis.c
 773      (estimate_edge_size_and_time).  */
 774   time -= (sreal)ipa_call_summaries->get (edge)->call_stmt_time * freq;
 775   time += caller_time;
 776   if (time <= 0)
 777     time = ((sreal) 1) >> 8;
 778   gcc_checking_assert (time >= 0);
 779   return time;
 780 }
 781
 782 /* Return true if the speedup for inlining E is bigger than
 783    PARAM_MAX_INLINE_MIN_SPEEDUP.  */
 784
 785 static bool
 786 big_speedup_p (struct cgraph_edge *e)
 787 {
 788   sreal unspec_time;
 789   sreal spec_time = estimate_edge_time (e, &unspec_time);
 790   sreal time = compute_uninlined_call_time (e, unspec_time);
 791   sreal inlined_time = compute_inlined_call_time (e, spec_time);
 792   cgraph_node *caller = (e->caller->inlined_to
 793                          ? e->caller->inlined_to
 794                          : e->caller);
 795   int limit = opt_for_fn (caller->decl, optimize) >= 3
 796               ? PARAM_VALUE (PARAM_INLINE_MIN_SPEEDUP)
 797               : PARAM_VALUE (PARAM_INLINE_MIN_SPEEDUP_O2);
 798
 799   if ((time - inlined_time) * 100 > time * limit)
 800     return true;
 801   return false;
 802 }
 803
 804 /* Return true if we are interested in inlining small function.
 805    When REPORT is true, report reason to dump file.  */
 806
 807 static bool
 808 want_inline_small_function_p (struct cgraph_edge *e, bool report)
 809 {
 810   bool want_inline = true;
 811   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 812
 813   /* Allow this function to be called before can_inline_edge_p,
 814      since it's usually cheaper.  */
 815   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 816     want_inline = false;
 817   else if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
 818     ;
 819   else if (!DECL_DECLARED_INLINE_P (callee->decl)
 820            && !opt_for_fn (e->caller->decl, flag_inline_small_functions))
 821     {
 822       e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
 823       want_inline = false;
 824     }
 825   /* Do fast and conservative check if the function can be good
 826      inline candidate.  */
 827   else if ((!DECL_DECLARED_INLINE_P (callee->decl)
 828            && (!e->count.ipa ().initialized_p () || !e->maybe_hot_p ()))
 829            && ipa_fn_summaries->get (callee)->min_size
 830                 - ipa_call_summaries->get (e)->call_stmt_size
 831               > inline_insns_auto (e->caller, true))
 832     {
 833       if (opt_for_fn (e->caller->decl, optimize) >= 3)
 834         e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
 835       else
 836         e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_O2_LIMIT;
 837       want_inline = false;
 838     }
 839   else if ((DECL_DECLARED_INLINE_P (callee->decl)
 840             || e->count.ipa ().nonzero_p ())
 841            && ipa_fn_summaries->get (callee)->min_size
 842                 - ipa_call_summaries->get (e)->call_stmt_size
 843               > inline_insns_single (e->caller, true))
 844     {
 845       if (opt_for_fn (e->caller->decl, optimize) >= 3)
 846         e->inline_failed = (DECL_DECLARED_INLINE_P (callee->decl)
 847                             ? CIF_MAX_INLINE_INSNS_SINGLE_LIMIT
 848                             : CIF_MAX_INLINE_INSNS_AUTO_LIMIT);
 849       else
 850         e->inline_failed = (DECL_DECLARED_INLINE_P (callee->decl)
 851                             ? CIF_MAX_INLINE_INSNS_SINGLE_O2_LIMIT
 852                             : CIF_MAX_INLINE_INSNS_AUTO_O2_LIMIT);
 853       want_inline = false;
 854     }
 855   else
 856     {
 857       int growth = estimate_edge_growth (e);
 858       ipa_hints hints = estimate_edge_hints (e);
 859       bool apply_hints = (hints & (INLINE_HINT_indirect_call
 860                                    | INLINE_HINT_known_hot
 861                                    | INLINE_HINT_loop_iterations
 862                                    | INLINE_HINT_loop_stride));
 863
 864       if (growth <= PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SIZE))
 865         ;
 866       /* Apply MAX_INLINE_INSNS_SINGLE limit.  Do not do so when
 867          hints suggests that inlining given function is very profitable.
 868          Avoid computation of big_speedup_p when not necessary to change
 869          outcome of decision.  */
 870       else if (DECL_DECLARED_INLINE_P (callee->decl)
 871                && growth >= inline_insns_single (e->caller, apply_hints)
 872                && (apply_hints
 873                    || growth >= inline_insns_single (e->caller, true)
 874                    || !big_speedup_p (e)))
 875         {
 876           if (opt_for_fn (e->caller->decl, optimize) >= 3)
 877             e->inline_failed = CIF_MAX_INLINE_INSNS_SINGLE_LIMIT;
 878           else
 879             e->inline_failed = CIF_MAX_INLINE_INSNS_SINGLE_O2_LIMIT;
 880           want_inline = false;
 881         }
 882       else if (!DECL_DECLARED_INLINE_P (callee->decl)
 883                && !opt_for_fn (e->caller->decl, flag_inline_functions)
 884                && growth >= PARAM_VALUE (PARAM_MAX_INLINE_INSNS_SMALL))
 885         {
 886           /* growth_likely_positive is expensive, always test it last.  */
 887           if (growth >= inline_insns_single (e->caller, false)
 888               || growth_likely_positive (callee, growth))
 889             {
 890               e->inline_failed = CIF_NOT_DECLARED_INLINED;
 891               want_inline = false;
 892             }
 893         }
 894       /* Apply MAX_INLINE_INSNS_AUTO limit for functions not declared inline.
 895          Bypass the limit when speedup seems big.  */
 896       else if (!DECL_DECLARED_INLINE_P (callee->decl)
 897                && growth >= inline_insns_auto (e->caller, apply_hints)
 898                && (apply_hints
 899                    || growth >= inline_insns_auto (e->caller, true)
 900                    || !big_speedup_p (e)))
 901         {
 902           /* growth_likely_positive is expensive, always test it last.  */
 903           if (growth >= inline_insns_single (e->caller, false)
 904               || growth_likely_positive (callee, growth))
 905             {
 906               if (opt_for_fn (e->caller->decl, optimize) >= 3)
 907                 e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
 908               else
 909                 e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_O2_LIMIT;
 910               want_inline = false;
 911             }
 912         }
 913       /* If call is cold, do not inline when function body would grow. */
 914       else if (!e->maybe_hot_p ()
 915                && (growth >= inline_insns_single (e->caller, false)
 916                    || growth_likely_positive (callee, growth)))
 917         {
 918           e->inline_failed = CIF_UNLIKELY_CALL;
 919           want_inline = false;
 920         }
 921     }
 922   if (!want_inline && report)
 923     report_inline_failed_reason (e);
 924   return want_inline;
 925 }
 926
 927 /* EDGE is self recursive edge.
 928    We hand two cases - when function A is inlining into itself
 929    or when function A is being inlined into another inliner copy of function
 930    A within function B.
 931
 932    In first case OUTER_NODE points to the toplevel copy of A, while
 933    in the second case OUTER_NODE points to the outermost copy of A in B.
 934
 935    In both cases we want to be extra selective since
 936    inlining the call will just introduce new recursive calls to appear.  */
 937
 938 static bool
 939 want_inline_self_recursive_call_p (struct cgraph_edge *edge,
 940                                    struct cgraph_node *outer_node,
 941                                    bool peeling,
 942                                    int depth)
 943 {
 944   char const *reason = NULL;
 945   bool want_inline = true;
 946   sreal caller_freq = 1;
 947   int max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH_AUTO);
 948
 949   if (DECL_DECLARED_INLINE_P (edge->caller->decl))
 950     max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH);
 951
 952   if (!edge->maybe_hot_p ())
 953     {
 954       reason = "recursive call is cold";
 955       want_inline = false;
 956     }
 957   else if (depth > max_depth)
 958     {
 959       reason = "--param max-inline-recursive-depth exceeded.";
 960       want_inline = false;
 961     }
 962   else if (outer_node->inlined_to
 963            && (caller_freq = outer_node->callers->sreal_frequency ()) == 0)
 964     {
 965       reason = "caller frequency is 0";
 966       want_inline = false;
 967     }
 968
 969   if (!want_inline)
 970     ;
 971   /* Inlining of self recursive function into copy of itself within other
 972      function is transformation similar to loop peeling.
 973
 974      Peeling is profitable if we can inline enough copies to make probability
 975      of actual call to the self recursive function very small.  Be sure that
 976      the probability of recursion is small.
 977
 978      We ensure that the frequency of recursing is at most 1 - (1/max_depth).
 979      This way the expected number of recursion is at most max_depth.  */
 980   else if (peeling)
 981     {
 982       sreal max_prob = (sreal)1 - ((sreal)1 / (sreal)max_depth);
 983       int i;
 984       for (i = 1; i < depth; i++)
 985         max_prob = max_prob * max_prob;
 986       if (edge->sreal_frequency () >= max_prob * caller_freq)
 987         {
 988           reason = "frequency of recursive call is too large";
 989           want_inline = false;
 990         }
 991     }
 992   /* Recursive inlining, i.e. equivalent of unrolling, is profitable if
 993      recursion depth is large.  We reduce function call overhead and increase
 994      chances that things fit in hardware return predictor.
 995
 996      Recursive inlining might however increase cost of stack frame setup
 997      actually slowing down functions whose recursion tree is wide rather than
 998      deep.
 999
1000      Deciding reliably on when to do recursive inlining without profile feedback
1001      is tricky.  For now we disable recursive inlining when probability of self
1002      recursion is low.
1003
1004      Recursive inlining of self recursive call within loop also results in
1005      large loop depths that generally optimize badly.  We may want to throttle
1006      down inlining in those cases.  In particular this seems to happen in one
1007      of libstdc++ rb tree methods.  */
1008   else
1009     {
1010       if (edge->sreal_frequency () * 100
1011           <= caller_freq
1012              * PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY))
1013         {
1014           reason = "frequency of recursive call is too small";
1015           want_inline = false;
1016         }
1017     }
1018   if (!want_inline && dump_enabled_p ())
1019     dump_printf_loc (MSG_MISSED_OPTIMIZATION, edge->call_stmt,
1020                      "   not inlining recursively: %s\n", reason);
1021   return want_inline;
1022 }
1023
1024 /* Return true when NODE has uninlinable caller;
1025    set HAS_HOT_CALL if it has hot call.
1026    Worker for cgraph_for_node_and_aliases.  */
1027
1028 static bool
1029 check_callers (struct cgraph_node *node, void *has_hot_call)
1030 {
1031   struct cgraph_edge *e;
1032    for (e = node->callers; e; e = e->next_caller)
1033      {
1034        if (!opt_for_fn (e->caller->decl, flag_inline_functions_called_once)
1035            || !opt_for_fn (e->caller->decl, optimize))
1036          return true;
1037        if (!can_inline_edge_p (e, true))
1038          return true;
1039        if (e->recursive_p ())
1040          return true;
1041        if (!can_inline_edge_by_limits_p (e, true))
1042          return true;
1043        if (!(*(bool *)has_hot_call) && e->maybe_hot_p ())
1044          *(bool *)has_hot_call = true;
1045      }
1046   return false;
1047 }
1048
1049 /* If NODE has a caller, return true.  */
1050
1051 static bool
1052 has_caller_p (struct cgraph_node *node, void *data ATTRIBUTE_UNUSED)
1053 {
1054   if (node->callers)
1055     return true;
1056   return false;
1057 }
1058
1059 /* Decide if inlining NODE would reduce unit size by eliminating
1060    the offline copy of function.
1061    When COLD is true the cold calls are considered, too.  */
1062
1063 static bool
1064 want_inline_function_to_all_callers_p (struct cgraph_node *node, bool cold)
1065 {
1066   bool has_hot_call = false;
1067
1068   /* Aliases gets inlined along with the function they alias.  */
1069   if (node->alias)
1070     return false;
1071   /* Already inlined?  */
1072   if (node->inlined_to)
1073     return false;
1074   /* Does it have callers?  */
1075   if (!node->call_for_symbol_and_aliases (has_caller_p, NULL, true))
1076     return false;
1077   /* Inlining into all callers would increase size?  */
1078   if (estimate_growth (node) > 0)
1079     return false;
1080   /* All inlines must be possible.  */
1081   if (node->call_for_symbol_and_aliases (check_callers, &has_hot_call,
1082                                          true))
1083     return false;
1084   if (!cold && !has_hot_call)
1085     return false;
1086   return true;
1087 }
1088
1089 /* A cost model driving the inlining heuristics in a way so the edges with
1090    smallest badness are inlined first.  After each inlining is performed
1091    the costs of all caller edges of nodes affected are recomputed so the
1092    metrics may accurately depend on values such as number of inlinable callers
1093    of the function or function body size.  */
1094
1095 static sreal
1096 edge_badness (struct cgraph_edge *edge, bool dump)
1097 {
1098   sreal badness;
1099   int growth;
1100   sreal edge_time, unspec_edge_time;
1101   struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
1102   class ipa_fn_summary *callee_info = ipa_fn_summaries->get (callee);
1103   ipa_hints hints;
1104   cgraph_node *caller = (edge->caller->inlined_to
1105                          ? edge->caller->inlined_to
1106                          : edge->caller);
1107
1108   growth = estimate_edge_growth (edge);
1109   edge_time = estimate_edge_time (edge, &unspec_edge_time);
1110   hints = estimate_edge_hints (edge);
1111   gcc_checking_assert (edge_time >= 0);
1112   /* Check that inlined time is better, but tolerate some roundoff issues.
1113      FIXME: When callee profile drops to 0 we account calls more.  This
1114      should be fixed by never doing that.  */
1115   gcc_checking_assert ((edge_time * 100
1116                         - callee_info->time * 101).to_int () <= 0
1117                         || callee->count.ipa ().initialized_p ());
1118   gcc_checking_assert (growth <= ipa_size_summaries->get (callee)->size);
1119
1120   if (dump)
1121     {
1122       fprintf (dump_file, "    Badness calculation for %s -> %s\n",
1123                edge->caller->dump_name (),
1124                edge->callee->dump_name ());
1125       fprintf (dump_file, "      size growth %i, time %f unspec %f ",
1126                growth,
1127                edge_time.to_double (),
1128                unspec_edge_time.to_double ());
1129       ipa_dump_hints (dump_file, hints);
1130       if (big_speedup_p (edge))
1131         fprintf (dump_file, " big_speedup");
1132       fprintf (dump_file, "\n");
1133     }
1134
1135   /* Always prefer inlining saving code size.  */
1136   if (growth <= 0)
1137     {
1138       badness = (sreal) (-SREAL_MIN_SIG + growth) << (SREAL_MAX_EXP / 256);
1139       if (dump)
1140         fprintf (dump_file, "      %f: Growth %d <= 0\n", badness.to_double (),
1141                  growth);
1142     }
1143    /* Inlining into EXTERNAL functions is not going to change anything unless
1144       they are themselves inlined.  */
1145    else if (DECL_EXTERNAL (caller->decl))
1146     {
1147       if (dump)
1148         fprintf (dump_file, "      max: function is external\n");
1149       return sreal::max ();
1150     }
1151   /* When profile is available. Compute badness as:
1152
1153                  time_saved * caller_count
1154      goodness =  -------------------------------------------------
1155                  growth_of_caller * overall_growth * combined_size
1156
1157      badness = - goodness
1158
1159      Again use negative value to make calls with profile appear hotter
1160      then calls without.
1161   */
1162   else if (opt_for_fn (caller->decl, flag_guess_branch_prob)
1163            || caller->count.ipa ().nonzero_p ())
1164     {
1165       sreal numerator, denominator;
1166       int overall_growth;
1167       sreal inlined_time = compute_inlined_call_time (edge, edge_time);
1168
1169       numerator = (compute_uninlined_call_time (edge, unspec_edge_time)
1170                    - inlined_time);
1171       if (numerator <= 0)
1172         numerator = ((sreal) 1 >> 8);
1173       if (caller->count.ipa ().nonzero_p ())
1174         numerator *= caller->count.ipa ().to_gcov_type ();
1175       else if (caller->count.ipa ().initialized_p ())
1176         numerator = numerator >> 11;
1177       denominator = growth;
1178
1179       overall_growth = callee_info->growth;
1180
1181       /* Look for inliner wrappers of the form:
1182
1183          inline_caller ()
1184            {
1185              do_fast_job...
1186              if (need_more_work)
1187                noninline_callee ();
1188            }
1189          Withhout penalizing this case, we usually inline noninline_callee
1190          into the inline_caller because overall_growth is small preventing
1191          further inlining of inline_caller.
1192
1193          Penalize only callgraph edges to functions with small overall
1194          growth ...
1195         */
1196       if (growth > overall_growth
1197           /* ... and having only one caller which is not inlined ... */
1198           && callee_info->single_caller
1199           && !edge->caller->inlined_to
1200           /* ... and edges executed only conditionally ... */
1201           && edge->sreal_frequency () < 1
1202           /* ... consider case where callee is not inline but caller is ... */
1203           && ((!DECL_DECLARED_INLINE_P (edge->callee->decl)
1204                && DECL_DECLARED_INLINE_P (caller->decl))
1205               /* ... or when early optimizers decided to split and edge
1206                  frequency still indicates splitting is a win ... */
1207               || (callee->split_part && !caller->split_part
1208                   && edge->sreal_frequency () * 100
1209                      < PARAM_VALUE
1210                           (PARAM_PARTIAL_INLINING_ENTRY_PROBABILITY)
1211                   /* ... and do not overwrite user specified hints.   */
1212                   && (!DECL_DECLARED_INLINE_P (edge->callee->decl)
1213                       || DECL_DECLARED_INLINE_P (caller->decl)))))
1214         {
1215           ipa_fn_summary *caller_info = ipa_fn_summaries->get (caller);
1216           int caller_growth = caller_info->growth;
1217
1218           /* Only apply the penalty when caller looks like inline candidate,
1219              and it is not called once.  */
1220           if (!caller_info->single_caller && overall_growth < caller_growth
1221               && caller_info->inlinable
1222               && ipa_size_summaries->get (caller)->size
1223                  < (DECL_DECLARED_INLINE_P (caller->decl)
1224                     ? inline_insns_single (caller, false)
1225                     : inline_insns_auto (caller, false)))
1226             {
1227               if (dump)
1228                 fprintf (dump_file,
1229                          "     Wrapper penalty. Increasing growth %i to %i\n",
1230                          overall_growth, caller_growth);
1231               overall_growth = caller_growth;
1232             }
1233         }
1234       if (overall_growth > 0)
1235         {
1236           /* Strongly preffer functions with few callers that can be inlined
1237              fully.  The square root here leads to smaller binaries at average.
1238              Watch however for extreme cases and return to linear function
1239              when growth is large.  */
1240           if (overall_growth < 256)
1241             overall_growth *= overall_growth;
1242           else
1243             overall_growth += 256 * 256 - 256;
1244           denominator *= overall_growth;
1245         }
1246       denominator *= ipa_size_summaries->get (caller)->size + growth;
1247
1248       badness = - numerator / denominator;
1249
1250       if (dump)
1251         {
1252           fprintf (dump_file,
1253                    "      %f: guessed profile. frequency %f, count %" PRId64
1254                    " caller count %" PRId64
1255                    " time w/o inlining %f, time with inlining %f"
1256                    " overall growth %i (current) %i (original)"
1257                    " %i (compensated)\n",
1258                    badness.to_double (),
1259                    edge->sreal_frequency ().to_double (),
1260                    edge->count.ipa ().initialized_p () ? edge->count.ipa ().to_gcov_type () : -1,
1261                    caller->count.ipa ().initialized_p () ? caller->count.ipa ().to_gcov_type () : -1,
1262                    compute_uninlined_call_time (edge,
1263                                                 unspec_edge_time).to_double (),
1264                    inlined_time.to_double (),
1265                    estimate_growth (callee),
1266                    callee_info->growth, overall_growth);
1267         }
1268     }
1269   /* When function local profile is not available or it does not give
1270      useful information (ie frequency is zero), base the cost on
1271      loop nest and overall size growth, so we optimize for overall number
1272      of functions fully inlined in program.  */
1273   else
1274     {
1275       int nest = MIN (ipa_call_summaries->get (edge)->loop_depth, 8);
1276       badness = growth;
1277
1278       /* Decrease badness if call is nested.  */
1279       if (badness > 0)
1280         badness = badness >> nest;
1281       else
1282         badness = badness << nest;
1283       if (dump)
1284         fprintf (dump_file, "      %f: no profile. nest %i\n",
1285                  badness.to_double (), nest);
1286     }
1287   gcc_checking_assert (badness != 0);
1288
1289   if (edge->recursive_p ())
1290     badness = badness.shift (badness > 0 ? 4 : -4);
1291   if ((hints & (INLINE_HINT_indirect_call
1292                 | INLINE_HINT_loop_iterations
1293                 | INLINE_HINT_loop_stride))
1294       || callee_info->growth <= 0)
1295     badness = badness.shift (badness > 0 ? -2 : 2);
1296   if (hints & (INLINE_HINT_same_scc))
1297     badness = badness.shift (badness > 0 ? 3 : -3);
1298   else if (hints & (INLINE_HINT_in_scc))
1299     badness = badness.shift (badness > 0 ? 2 : -2);
1300   else if (hints & (INLINE_HINT_cross_module))
1301     badness = badness.shift (badness > 0 ? 1 : -1);
1302   if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
1303     badness = badness.shift (badness > 0 ? -4 : 4);
1304   else if ((hints & INLINE_HINT_declared_inline))
1305     badness = badness.shift (badness > 0 ? -3 : 3);
1306   if (dump)
1307     fprintf (dump_file, "      Adjusted by hints %f\n", badness.to_double ());
1308   return badness;
1309 }
1310
1311 /* Recompute badness of EDGE and update its key in HEAP if needed.  */
1312 static inline void
1313 update_edge_key (edge_heap_t *heap, struct cgraph_edge *edge)
1314 {
1315   sreal badness = edge_badness (edge, false);
1316   if (edge->aux)
1317     {
1318       edge_heap_node_t *n = (edge_heap_node_t *) edge->aux;
1319       gcc_checking_assert (n->get_data () == edge);
1320
1321       /* fibonacci_heap::replace_key does busy updating of the
1322          heap that is unnecesarily expensive.
1323          We do lazy increases: after extracting minimum if the key
1324          turns out to be out of date, it is re-inserted into heap
1325          with correct value.  */
1326       if (badness < n->get_key ())
1327         {
1328           if (dump_file && (dump_flags & TDF_DETAILS))
1329             {
1330               fprintf (dump_file,
1331                        "  decreasing badness %s -> %s, %f to %f\n",
1332                        edge->caller->dump_name (),
1333                        edge->callee->dump_name (),
1334                        n->get_key ().to_double (),
1335                        badness.to_double ());
1336             }
1337           heap->decrease_key (n, badness);
1338         }
1339     }
1340   else
1341     {
1342        if (dump_file && (dump_flags & TDF_DETAILS))
1343          {
1344            fprintf (dump_file,
1345                     "  enqueuing call %s -> %s, badness %f\n",
1346                     edge->caller->dump_name (),
1347                     edge->callee->dump_name (),
1348                     badness.to_double ());
1349          }
1350       edge->aux = heap->insert (badness, edge);
1351     }
1352 }
1353
1354
1355 /* NODE was inlined.
1356    All caller edges needs to be resetted because
1357    size estimates change. Similarly callees needs reset
1358    because better context may be known.  */
1359
1360 static void
1361 reset_edge_caches (struct cgraph_node *node)
1362 {
1363   struct cgraph_edge *edge;
1364   struct cgraph_edge *e = node->callees;
1365   struct cgraph_node *where = node;
1366   struct ipa_ref *ref;
1367
1368   if (where->inlined_to)
1369     where = where->inlined_to;
1370
1371   reset_node_cache (where);
1372
1373   if (edge_growth_cache != NULL)
1374     for (edge = where->callers; edge; edge = edge->next_caller)
1375       if (edge->inline_failed)
1376         edge_growth_cache->remove (edge);
1377
1378   FOR_EACH_ALIAS (where, ref)
1379     reset_edge_caches (dyn_cast <cgraph_node *> (ref->referring));
1380
1381   if (!e)
1382     return;
1383
1384   while (true)
1385     if (!e->inline_failed && e->callee->callees)
1386       e = e->callee->callees;
1387     else
1388       {
1389         if (edge_growth_cache != NULL && e->inline_failed)
1390           edge_growth_cache->remove (e);
1391         if (e->next_callee)
1392           e = e->next_callee;
1393         else
1394           {
1395             do
1396               {
1397                 if (e->caller == node)
1398                   return;
1399                 e = e->caller->callers;
1400               }
1401             while (!e->next_callee);
1402             e = e->next_callee;
1403           }
1404       }
1405 }
1406
1407 /* Recompute HEAP nodes for each of caller of NODE.
1408    UPDATED_NODES track nodes we already visited, to avoid redundant work.
1409    When CHECK_INLINABLITY_FOR is set, re-check for specified edge that
1410    it is inlinable. Otherwise check all edges.  */
1411
1412 static void
1413 update_caller_keys (edge_heap_t *heap, struct cgraph_node *node,
1414                     bitmap updated_nodes,
1415                     struct cgraph_edge *check_inlinablity_for)
1416 {
1417   struct cgraph_edge *edge;
1418   struct ipa_ref *ref;
1419
1420   if ((!node->alias && !ipa_fn_summaries->get (node)->inlinable)
1421       || node->inlined_to)
1422     return;
1423   if (!bitmap_set_bit (updated_nodes, node->get_uid ()))
1424     return;
1425
1426   FOR_EACH_ALIAS (node, ref)
1427     {
1428       struct cgraph_node *alias = dyn_cast <cgraph_node *> (ref->referring);
1429       update_caller_keys (heap, alias, updated_nodes, check_inlinablity_for);
1430     }
1431
1432   for (edge = node->callers; edge; edge = edge->next_caller)
1433     if (edge->inline_failed)
1434       {
1435         if (!check_inlinablity_for
1436             || check_inlinablity_for == edge)
1437           {
1438             if (can_inline_edge_p (edge, false)
1439                 && want_inline_small_function_p (edge, false)
1440                 && can_inline_edge_by_limits_p (edge, false))
1441               update_edge_key (heap, edge);
1442             else if (edge->aux)
1443               {
1444                 report_inline_failed_reason (edge);
1445                 heap->delete_node ((edge_heap_node_t *) edge->aux);
1446                 edge->aux = NULL;
1447               }
1448           }
1449         else if (edge->aux)
1450           update_edge_key (heap, edge);
1451       }
1452 }
1453
1454 /* Recompute HEAP nodes for each uninlined call in NODE.
1455    This is used when we know that edge badnesses are going only to increase
1456    (we introduced new call site) and thus all we need is to insert newly
1457    created edges into heap.  */
1458
1459 static void
1460 update_callee_keys (edge_heap_t *heap, struct cgraph_node *node,
1461                     bitmap updated_nodes)
1462 {
1463   struct cgraph_edge *e = node->callees;
1464
1465   if (!e)
1466     return;
1467   while (true)
1468     if (!e->inline_failed && e->callee->callees)
1469       e = e->callee->callees;
1470     else
1471       {
1472         enum availability avail;
1473         struct cgraph_node *callee;
1474         /* We do not reset callee growth cache here.  Since we added a new call,
1475            growth chould have just increased and consequentely badness metric
1476            don't need updating.  */
1477         if (e->inline_failed
1478             && (callee = e->callee->ultimate_alias_target (&avail, e->caller))
1479             && ipa_fn_summaries->get (callee) != NULL
1480             && ipa_fn_summaries->get (callee)->inlinable
1481             && avail >= AVAIL_AVAILABLE
1482             && !bitmap_bit_p (updated_nodes, callee->get_uid ()))
1483           {
1484             if (can_inline_edge_p (e, false)
1485                 && want_inline_small_function_p (e, false)
1486                 && can_inline_edge_by_limits_p (e, false))
1487               update_edge_key (heap, e);
1488             else if (e->aux)
1489               {
1490                 report_inline_failed_reason (e);
1491                 heap->delete_node ((edge_heap_node_t *) e->aux);
1492                 e->aux = NULL;
1493               }
1494           }
1495         if (e->next_callee)
1496           e = e->next_callee;
1497         else
1498           {
1499             do
1500               {
1501                 if (e->caller == node)
1502                   return;
1503                 e = e->caller->callers;
1504               }
1505             while (!e->next_callee);
1506             e = e->next_callee;
1507           }
1508       }
1509 }
1510
1511 /* Enqueue all recursive calls from NODE into priority queue depending on
1512    how likely we want to recursively inline the call.  */
1513
1514 static void
1515 lookup_recursive_calls (struct cgraph_node *node, struct cgraph_node *where,
1516                         edge_heap_t *heap)
1517 {
1518   struct cgraph_edge *e;
1519   enum availability avail;
1520
1521   for (e = where->callees; e; e = e->next_callee)
1522     if (e->callee == node
1523         || (e->callee->ultimate_alias_target (&avail, e->caller) == node
1524             && avail > AVAIL_INTERPOSABLE))
1525       heap->insert (-e->sreal_frequency (), e);
1526   for (e = where->callees; e; e = e->next_callee)
1527     if (!e->inline_failed)
1528       lookup_recursive_calls (node, e->callee, heap);
1529 }
1530
1531 /* Decide on recursive inlining: in the case function has recursive calls,
1532    inline until body size reaches given argument.  If any new indirect edges
1533    are discovered in the process, add them to *NEW_EDGES, unless NEW_EDGES
1534    is NULL.  */
1535
1536 static bool
1537 recursive_inlining (struct cgraph_edge *edge,
1538                     vec<cgraph_edge *> *new_edges)
1539 {
1540   int limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE_AUTO);
1541   edge_heap_t heap (sreal::min ());
1542   struct cgraph_node *node;
1543   struct cgraph_edge *e;
1544   struct cgraph_node *master_clone = NULL, *next;
1545   int depth = 0;
1546   int n = 0;
1547
1548   node = edge->caller;
1549   if (node->inlined_to)
1550     node = node->inlined_to;
1551
1552   if (DECL_DECLARED_INLINE_P (node->decl))
1553     limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE);
1554
1555   /* Make sure that function is small enough to be considered for inlining.  */
1556   if (estimate_size_after_inlining (node, edge)  >= limit)
1557     return false;
1558   lookup_recursive_calls (node, node, &heap);
1559   if (heap.empty ())
1560     return false;
1561
1562   if (dump_file)
1563     fprintf (dump_file,
1564              "  Performing recursive inlining on %s\n",
1565              node->name ());
1566
1567   /* Do the inlining and update list of recursive call during process.  */
1568   while (!heap.empty ())
1569     {
1570       struct cgraph_edge *curr = heap.extract_min ();
1571       struct cgraph_node *cnode, *dest = curr->callee;
1572
1573       if (!can_inline_edge_p (curr, true)
1574           || !can_inline_edge_by_limits_p (curr, true))
1575         continue;
1576
1577       /* MASTER_CLONE is produced in the case we already started modified
1578          the function. Be sure to redirect edge to the original body before
1579          estimating growths otherwise we will be seeing growths after inlining
1580          the already modified body.  */
1581       if (master_clone)
1582         {
1583           curr->redirect_callee (master_clone);
1584           if (edge_growth_cache != NULL)
1585             edge_growth_cache->remove (curr);
1586         }
1587
1588       if (estimate_size_after_inlining (node, curr) > limit)
1589         {
1590           curr->redirect_callee (dest);
1591           if (edge_growth_cache != NULL)
1592             edge_growth_cache->remove (curr);
1593           break;
1594         }
1595
1596       depth = 1;
1597       for (cnode = curr->caller;
1598            cnode->inlined_to; cnode = cnode->callers->caller)
1599         if (node->decl
1600             == curr->callee->ultimate_alias_target ()->decl)
1601           depth++;
1602
1603       if (!want_inline_self_recursive_call_p (curr, node, false, depth))
1604         {
1605           curr->redirect_callee (dest);
1606           if (edge_growth_cache != NULL)
1607             edge_growth_cache->remove (curr);
1608           continue;
1609         }
1610
1611       if (dump_file)
1612         {
1613           fprintf (dump_file,
1614                    "   Inlining call of depth %i", depth);
1615           if (node->count.nonzero_p () && curr->count.initialized_p ())
1616             {
1617               fprintf (dump_file, " called approx. %.2f times per call",
1618                        (double)curr->count.to_gcov_type ()
1619                        / node->count.to_gcov_type ());
1620             }
1621           fprintf (dump_file, "\n");
1622         }
1623       if (!master_clone)
1624         {
1625           /* We need original clone to copy around.  */
1626           master_clone = node->create_clone (node->decl, node->count,
1627             false, vNULL, true, NULL, NULL);
1628           for (e = master_clone->callees; e; e = e->next_callee)
1629             if (!e->inline_failed)
1630               clone_inlined_nodes (e, true, false, NULL);
1631           curr->redirect_callee (master_clone);
1632           if (edge_growth_cache != NULL)
1633             edge_growth_cache->remove (curr);
1634         }
1635
1636       inline_call (curr, false, new_edges, &overall_size, true);
1637       lookup_recursive_calls (node, curr->callee, &heap);
1638       n++;
1639     }
1640
1641   if (!heap.empty () && dump_file)
1642     fprintf (dump_file, "    Recursive inlining growth limit met.\n");
1643
1644   if (!master_clone)
1645     return false;
1646
1647   if (dump_enabled_p ())
1648     dump_printf_loc (MSG_NOTE, edge->call_stmt,
1649                      "\n   Inlined %i times, "
1650                      "body grown from size %i to %i, time %f to %f\n", n,
1651                      ipa_size_summaries->get (master_clone)->size,
1652                      ipa_size_summaries->get (node)->size,
1653                      ipa_fn_summaries->get (master_clone)->time.to_double (),
1654                      ipa_fn_summaries->get (node)->time.to_double ());
1655
1656   /* Remove master clone we used for inlining.  We rely that clones inlined
1657      into master clone gets queued just before master clone so we don't
1658      need recursion.  */
1659   for (node = symtab->first_function (); node != master_clone;
1660        node = next)
1661     {
1662       next = symtab->next_function (node);
1663       if (node->inlined_to == master_clone)
1664         node->remove ();
1665     }
1666   master_clone->remove ();
1667   return true;
1668 }
1669
1670
1671 /* Given whole compilation unit estimate of INSNS, compute how large we can
1672    allow the unit to grow.  */
1673
1674 static int
1675 compute_max_insns (int insns)
1676 {
1677   int max_insns = insns;
1678   if (max_insns < PARAM_VALUE (PARAM_LARGE_UNIT_INSNS))
1679     max_insns = PARAM_VALUE (PARAM_LARGE_UNIT_INSNS);
1680
1681   return ((int64_t) max_insns
1682           * (100 + PARAM_VALUE (PARAM_INLINE_UNIT_GROWTH)) / 100);
1683 }
1684
1685
1686 /* Compute badness of all edges in NEW_EDGES and add them to the HEAP.  */
1687
1688 static void
1689 add_new_edges_to_heap (edge_heap_t *heap, vec<cgraph_edge *> new_edges)
1690 {
1691   while (new_edges.length () > 0)
1692     {
1693       struct cgraph_edge *edge = new_edges.pop ();
1694
1695       gcc_assert (!edge->aux);
1696       gcc_assert (edge->callee);
1697       if (edge->inline_failed
1698           && can_inline_edge_p (edge, true)
1699           && want_inline_small_function_p (edge, true)
1700           && can_inline_edge_by_limits_p (edge, true))
1701         edge->aux = heap->insert (edge_badness (edge, false), edge);
1702     }
1703 }
1704
1705 /* Remove EDGE from the fibheap.  */
1706
1707 static void
1708 heap_edge_removal_hook (struct cgraph_edge *e, void *data)
1709 {
1710   if (e->aux)
1711     {
1712       ((edge_heap_t *)data)->delete_node ((edge_heap_node_t *)e->aux);
1713       e->aux = NULL;
1714     }
1715 }
1716
1717 /* Return true if speculation of edge E seems useful.
1718    If ANTICIPATE_INLINING is true, be conservative and hope that E
1719    may get inlined.  */
1720
1721 bool
1722 speculation_useful_p (struct cgraph_edge *e, bool anticipate_inlining)
1723 {
1724   /* If we have already decided to inline the edge, it seems useful.  */
1725   if (!e->inline_failed)
1726     return true;
1727
1728   enum availability avail;
1729   struct cgraph_node *target = e->callee->ultimate_alias_target (&avail,
1730                                                                  e->caller);
1731   struct cgraph_edge *direct, *indirect;
1732   struct ipa_ref *ref;
1733
1734   gcc_assert (e->speculative && !e->indirect_unknown_callee);
1735
1736   if (!e->maybe_hot_p ())
1737     return false;
1738
1739   /* See if IP optimizations found something potentially useful about the
1740      function.  For now we look only for CONST/PURE flags.  Almost everything
1741      else we propagate is useless.  */
1742   if (avail >= AVAIL_AVAILABLE)
1743     {
1744       int ecf_flags = flags_from_decl_or_type (target->decl);
1745       if (ecf_flags & ECF_CONST)
1746         {
1747           e->speculative_call_info (direct, indirect, ref);
1748           if (!(indirect->indirect_info->ecf_flags & ECF_CONST))
1749             return true;
1750         }
1751       else if (ecf_flags & ECF_PURE)
1752         {
1753           e->speculative_call_info (direct, indirect, ref);
1754           if (!(indirect->indirect_info->ecf_flags & ECF_PURE))
1755             return true;
1756         }
1757     }
1758   /* If we did not managed to inline the function nor redirect
1759      to an ipa-cp clone (that are seen by having local flag set),
1760      it is probably pointless to inline it unless hardware is missing
1761      indirect call predictor.  */
1762   if (!anticipate_inlining && !target->local)
1763     return false;
1764   /* For overwritable targets there is not much to do.  */
1765   if (!can_inline_edge_p (e, false)
1766       || !can_inline_edge_by_limits_p (e, false, true))
1767     return false;
1768   /* OK, speculation seems interesting.  */
1769   return true;
1770 }
1771
1772 /* We know that EDGE is not going to be inlined.
1773    See if we can remove speculation.  */
1774
1775 static void
1776 resolve_noninline_speculation (edge_heap_t *edge_heap, struct cgraph_edge *edge)
1777 {
1778   if (edge->speculative && !speculation_useful_p (edge, false))
1779     {
1780       struct cgraph_node *node = edge->caller;
1781       struct cgraph_node *where = node->inlined_to
1782                                   ? node->inlined_to : node;
1783       auto_bitmap updated_nodes;
1784
1785       if (edge->count.ipa ().initialized_p ())
1786         spec_rem += edge->count.ipa ();
1787       edge->resolve_speculation ();
1788       reset_edge_caches (where);
1789       ipa_update_overall_fn_summary (where);
1790       update_caller_keys (edge_heap, where,
1791                           updated_nodes, NULL);
1792       update_callee_keys (edge_heap, where,
1793                           updated_nodes);
1794     }
1795 }
1796
1797 /* Return true if NODE should be accounted for overall size estimate.
1798    Skip all nodes optimized for size so we can measure the growth of hot
1799    part of program no matter of the padding.  */
1800
1801 bool
1802 inline_account_function_p (struct cgraph_node *node)
1803 {
1804    return (!DECL_EXTERNAL (node->decl)
1805            && !opt_for_fn (node->decl, optimize_size)
1806            && node->frequency != NODE_FREQUENCY_UNLIKELY_EXECUTED);
1807 }
1808
1809 /* Count number of callers of NODE and store it into DATA (that
1810    points to int.  Worker for cgraph_for_node_and_aliases.  */
1811
1812 static bool
1813 sum_callers (struct cgraph_node *node, void *data)
1814 {
1815   struct cgraph_edge *e;
1816   int *num_calls = (int *)data;
1817
1818   for (e = node->callers; e; e = e->next_caller)
1819     (*num_calls)++;
1820   return false;
1821 }
1822
1823 /* We only propagate across edges with non-interposable callee.  */
1824
1825 inline bool
1826 ignore_edge_p (struct cgraph_edge *e)
1827 {
1828   enum availability avail;
1829   e->callee->function_or_virtual_thunk_symbol (&avail, e->caller);
1830   return (avail <= AVAIL_INTERPOSABLE);
1831 }
1832
1833 /* We use greedy algorithm for inlining of small functions:
1834    All inline candidates are put into prioritized heap ordered in
1835    increasing badness.
1836
1837    The inlining of small functions is bounded by unit growth parameters.  */
1838
1839 static void
1840 inline_small_functions (void)
1841 {
1842   struct cgraph_node *node;
1843   struct cgraph_edge *edge;
1844   edge_heap_t edge_heap (sreal::min ());
1845   auto_bitmap updated_nodes;
1846   int min_size, max_size;
1847   auto_vec<cgraph_edge *> new_indirect_edges;
1848   int initial_size = 0;
1849   struct cgraph_node **order = XCNEWVEC (cgraph_node *, symtab->cgraph_count);
1850   struct cgraph_edge_hook_list *edge_removal_hook_holder;
1851   new_indirect_edges.create (8);
1852
1853   edge_removal_hook_holder
1854     = symtab->add_edge_removal_hook (&heap_edge_removal_hook, &edge_heap);
1855
1856   /* Compute overall unit size and other global parameters used by badness
1857      metrics.  */
1858
1859   max_count = profile_count::uninitialized ();
1860   ipa_reduced_postorder (order, true, ignore_edge_p);
1861   free (order);
1862
1863   FOR_EACH_DEFINED_FUNCTION (node)
1864     if (!node->inlined_to)
1865       {
1866         if (!node->alias && node->analyzed
1867             && (node->has_gimple_body_p () || node->thunk.thunk_p)
1868             && opt_for_fn (node->decl, optimize))
1869           {
1870             class ipa_fn_summary *info = ipa_fn_summaries->get (node);
1871             struct ipa_dfs_info *dfs = (struct ipa_dfs_info *) node->aux;
1872
1873             /* Do not account external functions, they will be optimized out
1874                if not inlined.  Also only count the non-cold portion of program.  */
1875             if (inline_account_function_p (node))
1876               initial_size += ipa_size_summaries->get (node)->size;
1877             info->growth = estimate_growth (node);
1878
1879             int num_calls = 0;
1880             node->call_for_symbol_and_aliases (sum_callers, &num_calls,
1881                                                true);
1882             if (num_calls == 1)
1883               info->single_caller = true;
1884             if (dfs && dfs->next_cycle)
1885               {
1886                 struct cgraph_node *n2;
1887                 int id = dfs->scc_no + 1;
1888                 for (n2 = node; n2;
1889                      n2 = ((struct ipa_dfs_info *) n2->aux)->next_cycle)
1890                   if (opt_for_fn (n2->decl, optimize))
1891                     {
1892                       ipa_fn_summary *info2 = ipa_fn_summaries->get
1893                          (n2->inlined_to ? n2->inlined_to : n2);
1894                       if (info2->scc_no)
1895                         break;
1896                       info2->scc_no = id;
1897                     }
1898               }
1899           }
1900
1901         for (edge = node->callers; edge; edge = edge->next_caller)
1902           max_count = max_count.max (edge->count.ipa ());
1903       }
1904   ipa_free_postorder_info ();
1905   initialize_growth_caches ();
1906
1907   if (dump_file)
1908     fprintf (dump_file,
1909              "\nDeciding on inlining of small functions.  Starting with size %i.\n",
1910              initial_size);
1911
1912   overall_size = initial_size;
1913   max_size = compute_max_insns (overall_size);
1914   min_size = overall_size;
1915
1916   /* Populate the heap with all edges we might inline.  */
1917
1918   FOR_EACH_DEFINED_FUNCTION (node)
1919     {
1920       bool update = false;
1921       struct cgraph_edge *next = NULL;
1922       bool has_speculative = false;
1923
1924       if (!opt_for_fn (node->decl, optimize))
1925         continue;
1926
1927       if (dump_file)
1928         fprintf (dump_file, "Enqueueing calls in %s.\n", node->dump_name ());
1929
1930       for (edge = node->callees; edge; edge = next)
1931         {
1932           next = edge->next_callee;
1933           if (edge->inline_failed
1934               && !edge->aux
1935               && can_inline_edge_p (edge, true)
1936               && want_inline_small_function_p (edge, true)
1937               && can_inline_edge_by_limits_p (edge, true)
1938               && edge->inline_failed)
1939             {
1940               gcc_assert (!edge->aux);
1941               update_edge_key (&edge_heap, edge);
1942             }
1943           if (edge->speculative)
1944             has_speculative = true;
1945         }
1946       if (has_speculative)
1947         for (edge = node->callees; edge; edge = next)
1948           if (edge->speculative && !speculation_useful_p (edge,
1949                                                           edge->aux != NULL))
1950             {
1951               edge->resolve_speculation ();
1952               update = true;
1953             }
1954       if (update)
1955         {
1956           struct cgraph_node *where = node->inlined_to
1957                                       ? node->inlined_to : node;
1958           ipa_update_overall_fn_summary (where);
1959           reset_edge_caches (where);
1960           update_caller_keys (&edge_heap, where,
1961                               updated_nodes, NULL);
1962           update_callee_keys (&edge_heap, where,
1963                               updated_nodes);
1964           bitmap_clear (updated_nodes);
1965         }
1966     }
1967
1968   gcc_assert (in_lto_p
1969               || !(max_count > 0)
1970               || (profile_info && flag_branch_probabilities));
1971
1972   while (!edge_heap.empty ())
1973     {
1974       int old_size = overall_size;
1975       struct cgraph_node *where, *callee;
1976       sreal badness = edge_heap.min_key ();
1977       sreal current_badness;
1978       int growth;
1979
1980       edge = edge_heap.extract_min ();
1981       gcc_assert (edge->aux);
1982       edge->aux = NULL;
1983       if (!edge->inline_failed || !edge->callee->analyzed)
1984         continue;
1985
1986 #if CHECKING_P
1987       /* Be sure that caches are maintained consistent.
1988          This check is affected by scaling roundoff errors when compiling for
1989          IPA this we skip it in that case.  */
1990       if (!edge->callee->count.ipa_p ()
1991           && (!max_count.initialized_p () || !max_count.nonzero_p ()))
1992         {
1993           sreal cached_badness = edge_badness (edge, false);
1994
1995           int old_size_est = estimate_edge_size (edge);
1996           sreal old_time_est = estimate_edge_time (edge);
1997           int old_hints_est = estimate_edge_hints (edge);
1998
1999           if (edge_growth_cache != NULL)
2000             edge_growth_cache->remove (edge);
2001           gcc_assert (old_size_est == estimate_edge_size (edge));
2002           gcc_assert (old_time_est == estimate_edge_time (edge));
2003           /* FIXME:
2004
2005              gcc_assert (old_hints_est == estimate_edge_hints (edge));
2006
2007              fails with profile feedback because some hints depends on
2008              maybe_hot_edge_p predicate and because callee gets inlined to other
2009              calls, the edge may become cold.
2010              This ought to be fixed by computing relative probabilities
2011              for given invocation but that will be better done once whole
2012              code is converted to sreals.  Disable for now and revert to "wrong"
2013              value so enable/disable checking paths agree.  */
2014           edge_growth_cache->get (edge)->hints = old_hints_est + 1;
2015
2016           /* When updating the edge costs, we only decrease badness in the keys.
2017              Increases of badness are handled lazilly; when we see key with out
2018              of date value on it, we re-insert it now.  */
2019           current_badness = edge_badness (edge, false);
2020           gcc_assert (cached_badness == current_badness);
2021           gcc_assert (current_badness >= badness);
2022         }
2023       else
2024         current_badness = edge_badness (edge, false);
2025 #else
2026       current_badness = edge_badness (edge, false);
2027 #endif
2028       if (current_badness != badness)
2029         {
2030           if (edge_heap.min () && current_badness > edge_heap.min_key ())
2031             {
2032               edge->aux = edge_heap.insert (current_badness, edge);
2033               continue;
2034             }
2035           else
2036             badness = current_badness;
2037         }
2038
2039       if (!can_inline_edge_p (edge, true)
2040           || !can_inline_edge_by_limits_p (edge, true))
2041         {
2042           resolve_noninline_speculation (&edge_heap, edge);
2043           continue;
2044         }
2045
2046       callee = edge->callee->ultimate_alias_target ();
2047       growth = estimate_edge_growth (edge);
2048       if (dump_file)
2049         {
2050           fprintf (dump_file,
2051                    "\nConsidering %s with %i size\n",
2052                    callee->dump_name (),
2053                    ipa_size_summaries->get (callee)->size);
2054           fprintf (dump_file,
2055                    " to be inlined into %s in %s:%i\n"
2056                    " Estimated badness is %f, frequency %.2f.\n",
2057                    edge->caller->dump_name (),
2058                    edge->call_stmt
2059                    && (LOCATION_LOCUS (gimple_location ((const gimple *)
2060                                                         edge->call_stmt))
2061                        > BUILTINS_LOCATION)
2062                    ? gimple_filename ((const gimple *) edge->call_stmt)
2063                    : "unknown",
2064                    edge->call_stmt
2065                    ? gimple_lineno ((const gimple *) edge->call_stmt)
2066                    : -1,
2067                    badness.to_double (),
2068                    edge->sreal_frequency ().to_double ());
2069           if (edge->count.ipa ().initialized_p ())
2070             {
2071               fprintf (dump_file, " Called ");
2072               edge->count.ipa ().dump (dump_file);
2073               fprintf (dump_file, " times\n");
2074             }
2075           if (dump_flags & TDF_DETAILS)
2076             edge_badness (edge, true);
2077         }
2078
2079       if (overall_size + growth > max_size
2080           && !DECL_DISREGARD_INLINE_LIMITS (callee->decl))
2081         {
2082           edge->inline_failed = CIF_INLINE_UNIT_GROWTH_LIMIT;
2083           report_inline_failed_reason (edge);
2084           resolve_noninline_speculation (&edge_heap, edge);
2085           continue;
2086         }
2087
2088       if (!want_inline_small_function_p (edge, true))
2089         {
2090           resolve_noninline_speculation (&edge_heap, edge);
2091           continue;
2092         }
2093
2094       /* Heuristics for inlining small functions work poorly for
2095          recursive calls where we do effects similar to loop unrolling.
2096          When inlining such edge seems profitable, leave decision on
2097          specific inliner.  */
2098       if (edge->recursive_p ())
2099         {
2100           where = edge->caller;
2101           if (where->inlined_to)
2102             where = where->inlined_to;
2103           if (!recursive_inlining (edge,
2104                                    opt_for_fn (edge->caller->decl,
2105                                                flag_indirect_inlining)
2106                                    ? &new_indirect_edges : NULL))
2107             {
2108               edge->inline_failed = CIF_RECURSIVE_INLINING;
2109               resolve_noninline_speculation (&edge_heap, edge);
2110               continue;
2111             }
2112           reset_edge_caches (where);
2113           /* Recursive inliner inlines all recursive calls of the function
2114              at once. Consequently we need to update all callee keys.  */
2115           if (opt_for_fn (edge->caller->decl, flag_indirect_inlining))
2116             add_new_edges_to_heap (&edge_heap, new_indirect_edges);
2117           update_callee_keys (&edge_heap, where, updated_nodes);
2118           bitmap_clear (updated_nodes);
2119         }
2120       else
2121         {
2122           struct cgraph_node *outer_node = NULL;
2123           int depth = 0;
2124
2125           /* Consider the case where self recursive function A is inlined
2126              into B.  This is desired optimization in some cases, since it
2127              leads to effect similar of loop peeling and we might completely
2128              optimize out the recursive call.  However we must be extra
2129              selective.  */
2130
2131           where = edge->caller;
2132           while (where->inlined_to)
2133             {
2134               if (where->decl == callee->decl)
2135                 outer_node = where, depth++;
2136               where = where->callers->caller;
2137             }
2138           if (outer_node
2139               && !want_inline_self_recursive_call_p (edge, outer_node,
2140                                                      true, depth))
2141             {
2142               edge->inline_failed
2143                 = (DECL_DISREGARD_INLINE_LIMITS (edge->callee->decl)
2144                    ? CIF_RECURSIVE_INLINING : CIF_UNSPECIFIED);
2145               resolve_noninline_speculation (&edge_heap, edge);
2146               continue;
2147             }
2148           else if (depth && dump_file)
2149             fprintf (dump_file, " Peeling recursion with depth %i\n", depth);
2150
2151           gcc_checking_assert (!callee->inlined_to);
2152           inline_call (edge, true, &new_indirect_edges, &overall_size, true);
2153           add_new_edges_to_heap (&edge_heap, new_indirect_edges);
2154
2155           reset_edge_caches (edge->callee);
2156
2157           update_callee_keys (&edge_heap, where, updated_nodes);
2158         }
2159       where = edge->caller;
2160       if (where->inlined_to)
2161         where = where->inlined_to;
2162
2163       /* Our profitability metric can depend on local properties
2164          such as number of inlinable calls and size of the function body.
2165          After inlining these properties might change for the function we
2166          inlined into (since it's body size changed) and for the functions
2167          called by function we inlined (since number of it inlinable callers
2168          might change).  */
2169       update_caller_keys (&edge_heap, where, updated_nodes, NULL);
2170       /* Offline copy count has possibly changed, recompute if profile is
2171          available.  */
2172       struct cgraph_node *n = cgraph_node::get (edge->callee->decl);
2173       if (n != edge->callee && n->analyzed && n->count.ipa ().initialized_p ())
2174         update_callee_keys (&edge_heap, n, updated_nodes);
2175       bitmap_clear (updated_nodes);
2176
2177       if (dump_enabled_p ())
2178         {
2179           ipa_fn_summary *s = ipa_fn_summaries->get (where);
2180
2181           /* dump_printf can't handle %+i.  */
2182           char buf_net_change[100];
2183           snprintf (buf_net_change, sizeof buf_net_change, "%+i",
2184                     overall_size - old_size);
2185
2186           dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, edge->call_stmt,
2187                            " Inlined %C into %C which now has time %f and "
2188                            "size %i, net change of %s.\n",
2189                            edge->callee, edge->caller,
2190                            s->time.to_double (),
2191                            ipa_size_summaries->get (edge->caller)->size,
2192                            buf_net_change);
2193         }
2194       if (min_size > overall_size)
2195         {
2196           min_size = overall_size;
2197           max_size = compute_max_insns (min_size);
2198
2199           if (dump_file)
2200             fprintf (dump_file, "New minimal size reached: %i\n", min_size);
2201         }
2202     }
2203
2204   free_growth_caches ();
2205   if (dump_enabled_p ())
2206     dump_printf (MSG_NOTE,
2207                  "Unit growth for small function inlining: %i->%i (%i%%)\n",
2208                  initial_size, overall_size,
2209                  initial_size ? overall_size * 100 / (initial_size) - 100: 0);
2210   symtab->remove_edge_removal_hook (edge_removal_hook_holder);
2211 }
2212
2213 /* Flatten NODE.  Performed both during early inlining and
2214    at IPA inlining time.  */
2215
2216 static void
2217 flatten_function (struct cgraph_node *node, bool early, bool update)
2218 {
2219   struct cgraph_edge *e;
2220
2221   /* We shouldn't be called recursively when we are being processed.  */
2222   gcc_assert (node->aux == NULL);
2223
2224   node->aux = (void *) node;
2225
2226   for (e = node->callees; e; e = e->next_callee)
2227     {
2228       struct cgraph_node *orig_callee;
2229       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2230
2231       /* We've hit cycle?  It is time to give up.  */
2232       if (callee->aux)
2233         {
2234           if (dump_enabled_p ())
2235             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2236                              "Not inlining %C into %C to avoid cycle.\n",
2237                              callee, e->caller);
2238           if (cgraph_inline_failed_type (e->inline_failed) != CIF_FINAL_ERROR)
2239             e->inline_failed = CIF_RECURSIVE_INLINING;
2240           continue;
2241         }
2242
2243       /* When the edge is already inlined, we just need to recurse into
2244          it in order to fully flatten the leaves.  */
2245       if (!e->inline_failed)
2246         {
2247           flatten_function (callee, early, false);
2248           continue;
2249         }
2250
2251       /* Flatten attribute needs to be processed during late inlining. For
2252          extra code quality we however do flattening during early optimization,
2253          too.  */
2254       if (!early
2255           ? !can_inline_edge_p (e, true)
2256             && !can_inline_edge_by_limits_p (e, true)
2257           : !can_early_inline_edge_p (e))
2258         continue;
2259
2260       if (e->recursive_p ())
2261         {
2262           if (dump_enabled_p ())
2263             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2264                              "Not inlining: recursive call.\n");
2265           continue;
2266         }
2267
2268       if (gimple_in_ssa_p (DECL_STRUCT_FUNCTION (node->decl))
2269           != gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->decl)))
2270         {
2271           if (dump_enabled_p ())
2272             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2273                              "Not inlining: SSA form does not match.\n");
2274           continue;
2275         }
2276
2277       /* Inline the edge and flatten the inline clone.  Avoid
2278          recursing through the original node if the node was cloned.  */
2279       if (dump_enabled_p ())
2280         dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
2281                          " Inlining %C into %C.\n",
2282                          callee, e->caller);
2283       orig_callee = callee;
2284       inline_call (e, true, NULL, NULL, false);
2285       if (e->callee != orig_callee)
2286         orig_callee->aux = (void *) node;
2287       flatten_function (e->callee, early, false);
2288       if (e->callee != orig_callee)
2289         orig_callee->aux = NULL;
2290     }
2291
2292   node->aux = NULL;
2293   cgraph_node *where = node->inlined_to ? node->inlined_to : node;
2294   if (update && opt_for_fn (where->decl, optimize))
2295     ipa_update_overall_fn_summary (where);
2296 }
2297
2298 /* Inline NODE to all callers.  Worker for cgraph_for_node_and_aliases.
2299    DATA points to number of calls originally found so we avoid infinite
2300    recursion.  */
2301
2302 static bool
2303 inline_to_all_callers_1 (struct cgraph_node *node, void *data,
2304                          hash_set<cgraph_node *> *callers)
2305 {
2306   int *num_calls = (int *)data;
2307   bool callee_removed = false;
2308
2309   while (node->callers && !node->inlined_to)
2310     {
2311       struct cgraph_node *caller = node->callers->caller;
2312
2313       if (!can_inline_edge_p (node->callers, true)
2314           || !can_inline_edge_by_limits_p (node->callers, true)
2315           || node->callers->recursive_p ())
2316         {
2317           if (dump_file)
2318             fprintf (dump_file, "Uninlinable call found; giving up.\n");
2319           *num_calls = 0;
2320           return false;
2321         }
2322
2323       if (dump_file)
2324         {
2325           cgraph_node *ultimate = node->ultimate_alias_target ();
2326           fprintf (dump_file,
2327                    "\nInlining %s size %i.\n",
2328                    ultimate->name (),
2329                    ipa_size_summaries->get (ultimate)->size);
2330           fprintf (dump_file,
2331                    " Called once from %s %i insns.\n",
2332                    node->callers->caller->name (),
2333                    ipa_size_summaries->get (node->callers->caller)->size);
2334         }
2335
2336       /* Remember which callers we inlined to, delaying updating the
2337          overall summary.  */
2338       callers->add (node->callers->caller);
2339       inline_call (node->callers, true, NULL, NULL, false, &callee_removed);
2340       if (dump_file)
2341         fprintf (dump_file,
2342                  " Inlined into %s which now has %i size\n",
2343                  caller->name (),
2344                  ipa_size_summaries->get (caller)->size);
2345       if (!(*num_calls)--)
2346         {
2347           if (dump_file)
2348             fprintf (dump_file, "New calls found; giving up.\n");
2349           return callee_removed;
2350         }
2351       if (callee_removed)
2352         return true;
2353     }
2354   return false;
2355 }
2356
2357 /* Wrapper around inline_to_all_callers_1 doing delayed overall summary
2358    update.  */
2359
2360 static bool
2361 inline_to_all_callers (struct cgraph_node *node, void *data)
2362 {
2363   hash_set<cgraph_node *> callers;
2364   bool res = inline_to_all_callers_1 (node, data, &callers);
2365   /* Perform the delayed update of the overall summary of all callers
2366      processed.  This avoids quadratic behavior in the cases where
2367      we have a lot of calls to the same function.  */
2368   for (hash_set<cgraph_node *>::iterator i = callers.begin ();
2369        i != callers.end (); ++i)
2370     ipa_update_overall_fn_summary ((*i)->inlined_to ? (*i)->inlined_to : *i);
2371   return res;
2372 }
2373
2374 /* Output overall time estimate.  */
2375 static void
2376 dump_overall_stats (void)
2377 {
2378   sreal sum_weighted = 0, sum = 0;
2379   struct cgraph_node *node;
2380
2381   FOR_EACH_DEFINED_FUNCTION (node)
2382     if (!node->inlined_to
2383         && !node->alias)
2384       {
2385         ipa_fn_summary *s = ipa_fn_summaries->get (node);
2386         if (s != NULL)
2387           {
2388           sum += s->time;
2389           if (node->count.ipa ().initialized_p ())
2390             sum_weighted += s->time * node->count.ipa ().to_gcov_type ();
2391           }
2392       }
2393   fprintf (dump_file, "Overall time estimate: "
2394            "%f weighted by profile: "
2395            "%f\n", sum.to_double (), sum_weighted.to_double ());
2396 }
2397
2398 /* Output some useful stats about inlining.  */
2399
2400 static void
2401 dump_inline_stats (void)
2402 {
2403   int64_t inlined_cnt = 0, inlined_indir_cnt = 0;
2404   int64_t inlined_virt_cnt = 0, inlined_virt_indir_cnt = 0;
2405   int64_t noninlined_cnt = 0, noninlined_indir_cnt = 0;
2406   int64_t noninlined_virt_cnt = 0, noninlined_virt_indir_cnt = 0;
2407   int64_t  inlined_speculative = 0, inlined_speculative_ply = 0;
2408   int64_t indirect_poly_cnt = 0, indirect_cnt = 0;
2409   int64_t reason[CIF_N_REASONS][2];
2410   sreal reason_freq[CIF_N_REASONS];
2411   int i;
2412   struct cgraph_node *node;
2413
2414   memset (reason, 0, sizeof (reason));
2415   for (i=0; i < CIF_N_REASONS; i++)
2416     reason_freq[i] = 0;
2417   FOR_EACH_DEFINED_FUNCTION (node)
2418   {
2419     struct cgraph_edge *e;
2420     for (e = node->callees; e; e = e->next_callee)
2421       {
2422         if (e->inline_failed)
2423           {
2424             if (e->count.ipa ().initialized_p ())
2425               reason[(int) e->inline_failed][0] += e->count.ipa ().to_gcov_type ();
2426             reason_freq[(int) e->inline_failed] += e->sreal_frequency ();
2427             reason[(int) e->inline_failed][1] ++;
2428             if (DECL_VIRTUAL_P (e->callee->decl)
2429                 && e->count.ipa ().initialized_p ())
2430               {
2431                 if (e->indirect_inlining_edge)
2432                   noninlined_virt_indir_cnt += e->count.ipa ().to_gcov_type ();
2433                 else
2434                   noninlined_virt_cnt += e->count.ipa ().to_gcov_type ();
2435               }
2436             else if (e->count.ipa ().initialized_p ())
2437               {
2438                 if (e->indirect_inlining_edge)
2439                   noninlined_indir_cnt += e->count.ipa ().to_gcov_type ();
2440                 else
2441                   noninlined_cnt += e->count.ipa ().to_gcov_type ();
2442               }
2443           }
2444         else if (e->count.ipa ().initialized_p ())
2445           {
2446             if (e->speculative)
2447               {
2448                 if (DECL_VIRTUAL_P (e->callee->decl))
2449                   inlined_speculative_ply += e->count.ipa ().to_gcov_type ();
2450                 else
2451                   inlined_speculative += e->count.ipa ().to_gcov_type ();
2452               }
2453             else if (DECL_VIRTUAL_P (e->callee->decl))
2454               {
2455                 if (e->indirect_inlining_edge)
2456                   inlined_virt_indir_cnt += e->count.ipa ().to_gcov_type ();
2457                 else
2458                   inlined_virt_cnt += e->count.ipa ().to_gcov_type ();
2459               }
2460             else
2461               {
2462                 if (e->indirect_inlining_edge)
2463                   inlined_indir_cnt += e->count.ipa ().to_gcov_type ();
2464                 else
2465                   inlined_cnt += e->count.ipa ().to_gcov_type ();
2466               }
2467           }
2468       }
2469     for (e = node->indirect_calls; e; e = e->next_callee)
2470       if (e->indirect_info->polymorphic
2471           & e->count.ipa ().initialized_p ())
2472         indirect_poly_cnt += e->count.ipa ().to_gcov_type ();
2473       else if (e->count.ipa ().initialized_p ())
2474         indirect_cnt += e->count.ipa ().to_gcov_type ();
2475   }
2476   if (max_count.initialized_p ())
2477     {
2478       fprintf (dump_file,
2479                "Inlined %" PRId64 " + speculative "
2480                "%" PRId64 " + speculative polymorphic "
2481                "%" PRId64 " + previously indirect "
2482                "%" PRId64 " + virtual "
2483                "%" PRId64 " + virtual and previously indirect "
2484                "%" PRId64 "\n" "Not inlined "
2485                "%" PRId64 " + previously indirect "
2486                "%" PRId64 " + virtual "
2487                "%" PRId64 " + virtual and previously indirect "
2488                "%" PRId64 " + stil indirect "
2489                "%" PRId64 " + still indirect polymorphic "
2490                "%" PRId64 "\n", inlined_cnt,
2491                inlined_speculative, inlined_speculative_ply,
2492                inlined_indir_cnt, inlined_virt_cnt, inlined_virt_indir_cnt,
2493                noninlined_cnt, noninlined_indir_cnt, noninlined_virt_cnt,
2494                noninlined_virt_indir_cnt, indirect_cnt, indirect_poly_cnt);
2495       fprintf (dump_file, "Removed speculations ");
2496       spec_rem.dump (dump_file);
2497       fprintf (dump_file, "\n");
2498     }
2499   dump_overall_stats ();
2500   fprintf (dump_file, "\nWhy inlining failed?\n");
2501   for (i = 0; i < CIF_N_REASONS; i++)
2502     if (reason[i][1])
2503       fprintf (dump_file, "%-50s: %8i calls, %8f freq, %" PRId64" count\n",
2504                cgraph_inline_failed_string ((cgraph_inline_failed_t) i),
2505                (int) reason[i][1], reason_freq[i].to_double (), reason[i][0]);
2506 }
2507
2508 /* Called when node is removed.  */
2509
2510 static void
2511 flatten_remove_node_hook (struct cgraph_node *node, void *data)
2512 {
2513   if (lookup_attribute ("flatten", DECL_ATTRIBUTES (node->decl)) == NULL)
2514     return;
2515
2516   hash_set<struct cgraph_node *> *removed
2517     = (hash_set<struct cgraph_node *> *) data;
2518   removed->add (node);
2519 }
2520
2521 /* Decide on the inlining.  We do so in the topological order to avoid
2522    expenses on updating data structures.  */
2523
2524 static unsigned int
2525 ipa_inline (void)
2526 {
2527   struct cgraph_node *node;
2528   int nnodes;
2529   struct cgraph_node **order;
2530   int i, j;
2531   int cold;
2532   bool remove_functions = false;
2533
2534   order = XCNEWVEC (struct cgraph_node *, symtab->cgraph_count);
2535
2536   if (dump_file)
2537     ipa_dump_fn_summaries (dump_file);
2538
2539   nnodes = ipa_reverse_postorder (order);
2540   spec_rem = profile_count::zero ();
2541
2542   FOR_EACH_FUNCTION (node)
2543     {
2544       node->aux = 0;
2545
2546       /* Recompute the default reasons for inlining because they may have
2547          changed during merging.  */
2548       if (in_lto_p)
2549         {
2550           for (cgraph_edge *e = node->callees; e; e = e->next_callee)
2551             {
2552               gcc_assert (e->inline_failed);
2553               initialize_inline_failed (e);
2554             }
2555           for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
2556             initialize_inline_failed (e);
2557         }
2558     }
2559
2560   if (dump_file)
2561     fprintf (dump_file, "\nFlattening functions:\n");
2562
2563   /* First shrink order array, so that it only contains nodes with
2564      flatten attribute.  */
2565   for (i = nnodes - 1, j = i; i >= 0; i--)
2566     {
2567       node = order[i];
2568       if (lookup_attribute ("flatten",
2569                             DECL_ATTRIBUTES (node->decl)) != NULL)
2570         order[j--] = order[i];
2571     }
2572
2573   /* After the above loop, order[j + 1] ... order[nnodes - 1] contain
2574      nodes with flatten attribute.  If there is more than one such
2575      node, we need to register a node removal hook, as flatten_function
2576      could remove other nodes with flatten attribute.  See PR82801.  */
2577   struct cgraph_node_hook_list *node_removal_hook_holder = NULL;
2578   hash_set<struct cgraph_node *> *flatten_removed_nodes = NULL;
2579   if (j < nnodes - 2)
2580     {
2581       flatten_removed_nodes = new hash_set<struct cgraph_node *>;
2582       node_removal_hook_holder
2583         = symtab->add_cgraph_removal_hook (&flatten_remove_node_hook,
2584                                            flatten_removed_nodes);
2585     }
2586
2587   /* In the first pass handle functions to be flattened.  Do this with
2588      a priority so none of our later choices will make this impossible.  */
2589   for (i = nnodes - 1; i > j; i--)
2590     {
2591       node = order[i];
2592       if (flatten_removed_nodes
2593           && flatten_removed_nodes->contains (node))
2594         continue;
2595
2596       /* Handle nodes to be flattened.
2597          Ideally when processing callees we stop inlining at the
2598          entry of cycles, possibly cloning that entry point and
2599          try to flatten itself turning it into a self-recursive
2600          function.  */
2601       if (dump_file)
2602         fprintf (dump_file, "Flattening %s\n", node->name ());
2603       flatten_function (node, false, true);
2604     }
2605
2606   if (j < nnodes - 2)
2607     {
2608       symtab->remove_cgraph_removal_hook (node_removal_hook_holder);
2609       delete flatten_removed_nodes;
2610     }
2611   free (order);
2612
2613   if (dump_file)
2614     dump_overall_stats ();
2615
2616   inline_small_functions ();
2617
2618   gcc_assert (symtab->state == IPA_SSA);
2619   symtab->state = IPA_SSA_AFTER_INLINING;
2620   /* Do first after-inlining removal.  We want to remove all "stale" extern
2621      inline functions and virtual functions so we really know what is called
2622      once.  */
2623   symtab->remove_unreachable_nodes (dump_file);
2624
2625   /* Inline functions with a property that after inlining into all callers the
2626      code size will shrink because the out-of-line copy is eliminated.
2627      We do this regardless on the callee size as long as function growth limits
2628      are met.  */
2629   if (dump_file)
2630     fprintf (dump_file,
2631              "\nDeciding on functions to be inlined into all callers and "
2632              "removing useless speculations:\n");
2633
2634   /* Inlining one function called once has good chance of preventing
2635      inlining other function into the same callee.  Ideally we should
2636      work in priority order, but probably inlining hot functions first
2637      is good cut without the extra pain of maintaining the queue.
2638
2639      ??? this is not really fitting the bill perfectly: inlining function
2640      into callee often leads to better optimization of callee due to
2641      increased context for optimization.
2642      For example if main() function calls a function that outputs help
2643      and then function that does the main optmization, we should inline
2644      the second with priority even if both calls are cold by themselves.
2645
2646      We probably want to implement new predicate replacing our use of
2647      maybe_hot_edge interpreted as maybe_hot_edge || callee is known
2648      to be hot.  */
2649   for (cold = 0; cold <= 1; cold ++)
2650     {
2651       FOR_EACH_DEFINED_FUNCTION (node)
2652         {
2653           struct cgraph_edge *edge, *next;
2654           bool update=false;
2655
2656           if (!opt_for_fn (node->decl, optimize)
2657               || !opt_for_fn (node->decl, flag_inline_functions_called_once))
2658             continue;
2659
2660           for (edge = node->callees; edge; edge = next)
2661             {
2662               next = edge->next_callee;
2663               if (edge->speculative && !speculation_useful_p (edge, false))
2664                 {
2665                   if (edge->count.ipa ().initialized_p ())
2666                     spec_rem += edge->count.ipa ();
2667                   edge->resolve_speculation ();
2668                   update = true;
2669                   remove_functions = true;
2670                 }
2671             }
2672           if (update)
2673             {
2674               struct cgraph_node *where = node->inlined_to
2675                                           ? node->inlined_to : node;
2676               reset_edge_caches (where);
2677               ipa_update_overall_fn_summary (where);
2678             }
2679           if (want_inline_function_to_all_callers_p (node, cold))
2680             {
2681               int num_calls = 0;
2682               node->call_for_symbol_and_aliases (sum_callers, &num_calls,
2683                                                  true);
2684               while (node->call_for_symbol_and_aliases
2685                        (inline_to_all_callers, &num_calls, true))
2686                 ;
2687               remove_functions = true;
2688             }
2689         }
2690     }
2691
2692   /* Free ipa-prop structures if they are no longer needed.  */
2693   ipa_free_all_structures_after_iinln ();
2694
2695   if (dump_enabled_p ())
2696     dump_printf (MSG_NOTE,
2697                  "\nInlined %i calls, eliminated %i functions\n\n",
2698                  ncalls_inlined, nfunctions_inlined);
2699   if (dump_file)
2700     dump_inline_stats ();
2701
2702   if (dump_file)
2703     ipa_dump_fn_summaries (dump_file);
2704   return remove_functions ? TODO_remove_functions : 0;
2705 }
2706
2707 /* Inline always-inline function calls in NODE.  */
2708
2709 static bool
2710 inline_always_inline_functions (struct cgraph_node *node)
2711 {
2712   struct cgraph_edge *e;
2713   bool inlined = false;
2714
2715   for (e = node->callees; e; e = e->next_callee)
2716     {
2717       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2718       if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl))
2719         continue;
2720
2721       if (e->recursive_p ())
2722         {
2723           if (dump_enabled_p ())
2724             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2725                              "  Not inlining recursive call to %C.\n",
2726                              e->callee);
2727           e->inline_failed = CIF_RECURSIVE_INLINING;
2728           continue;
2729         }
2730
2731       if (!can_early_inline_edge_p (e))
2732         {
2733           /* Set inlined to true if the callee is marked "always_inline" but
2734              is not inlinable.  This will allow flagging an error later in
2735              expand_call_inline in tree-inline.c.  */
2736           if (lookup_attribute ("always_inline",
2737                                  DECL_ATTRIBUTES (callee->decl)) != NULL)
2738             inlined = true;
2739           continue;
2740         }
2741
2742       if (dump_enabled_p ())
2743         dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
2744                          "  Inlining %C into %C (always_inline).\n",
2745                          e->callee, e->caller);
2746       inline_call (e, true, NULL, NULL, false);
2747       inlined = true;
2748     }
2749   if (inlined)
2750     ipa_update_overall_fn_summary (node);
2751
2752   return inlined;
2753 }
2754
2755 /* Decide on the inlining.  We do so in the topological order to avoid
2756    expenses on updating data structures.  */
2757
2758 static bool
2759 early_inline_small_functions (struct cgraph_node *node)
2760 {
2761   struct cgraph_edge *e;
2762   bool inlined = false;
2763
2764   for (e = node->callees; e; e = e->next_callee)
2765     {
2766       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2767
2768       /* We can enounter not-yet-analyzed function during
2769          early inlining on callgraphs with strongly
2770          connected components.  */
2771       ipa_fn_summary *s = ipa_fn_summaries->get (callee);
2772       if (s == NULL || !s->inlinable || !e->inline_failed)
2773         continue;
2774
2775       /* Do not consider functions not declared inline.  */
2776       if (!DECL_DECLARED_INLINE_P (callee->decl)
2777           && !opt_for_fn (node->decl, flag_inline_small_functions)
2778           && !opt_for_fn (node->decl, flag_inline_functions))
2779         continue;
2780
2781       if (dump_enabled_p ())
2782         dump_printf_loc (MSG_NOTE, e->call_stmt,
2783                          "Considering inline candidate %C.\n",
2784                          callee);
2785
2786       if (!can_early_inline_edge_p (e))
2787         continue;
2788
2789       if (e->recursive_p ())
2790         {
2791           if (dump_enabled_p ())
2792             dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2793                              "  Not inlining: recursive call.\n");
2794           continue;
2795         }
2796
2797       if (!want_early_inline_function_p (e))
2798         continue;
2799
2800       if (dump_enabled_p ())
2801         dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
2802                          " Inlining %C into %C.\n",
2803                          callee, e->caller);
2804       inline_call (e, true, NULL, NULL, false);
2805       inlined = true;
2806     }
2807
2808   if (inlined)
2809     ipa_update_overall_fn_summary (node);
2810
2811   return inlined;
2812 }
2813
2814 unsigned int
2815 early_inliner (function *fun)
2816 {
2817   struct cgraph_node *node = cgraph_node::get (current_function_decl);
2818   struct cgraph_edge *edge;
2819   unsigned int todo = 0;
2820   int iterations = 0;
2821   bool inlined = false;
2822
2823   if (seen_error ())
2824     return 0;
2825
2826   /* Do nothing if datastructures for ipa-inliner are already computed.  This
2827      happens when some pass decides to construct new function and
2828      cgraph_add_new_function calls lowering passes and early optimization on
2829      it.  This may confuse ourself when early inliner decide to inline call to
2830      function clone, because function clones don't have parameter list in
2831      ipa-prop matching their signature.  */
2832   if (ipa_node_params_sum)
2833     return 0;
2834
2835   if (flag_checking)
2836     node->verify ();
2837   node->remove_all_references ();
2838
2839   /* Even when not optimizing or not inlining inline always-inline
2840      functions.  */
2841   inlined = inline_always_inline_functions (node);
2842
2843   if (!optimize
2844       || flag_no_inline
2845       || !flag_early_inlining
2846       /* Never inline regular functions into always-inline functions
2847          during incremental inlining.  This sucks as functions calling
2848          always inline functions will get less optimized, but at the
2849          same time inlining of functions calling always inline
2850          function into an always inline function might introduce
2851          cycles of edges to be always inlined in the callgraph.
2852
2853          We might want to be smarter and just avoid this type of inlining.  */
2854       || (DECL_DISREGARD_INLINE_LIMITS (node->decl)
2855           && lookup_attribute ("always_inline",
2856                                DECL_ATTRIBUTES (node->decl))))
2857     ;
2858   else if (lookup_attribute ("flatten",
2859                              DECL_ATTRIBUTES (node->decl)) != NULL)
2860     {
2861       /* When the function is marked to be flattened, recursively inline
2862          all calls in it.  */
2863       if (dump_enabled_p ())
2864         dump_printf (MSG_OPTIMIZED_LOCATIONS,
2865                      "Flattening %C\n", node);
2866       flatten_function (node, true, true);
2867       inlined = true;
2868     }
2869   else
2870     {
2871       /* If some always_inline functions was inlined, apply the changes.
2872          This way we will not account always inline into growth limits and
2873          moreover we will inline calls from always inlines that we skipped
2874          previously because of conditional above.  */
2875       if (inlined)
2876         {
2877           timevar_push (TV_INTEGRATION);
2878           todo |= optimize_inline_calls (current_function_decl);
2879           /* optimize_inline_calls call above might have introduced new
2880              statements that don't have inline parameters computed.  */
2881           for (edge = node->callees; edge; edge = edge->next_callee)
2882             {
2883               /* We can enounter not-yet-analyzed function during
2884                  early inlining on callgraphs with strongly
2885                  connected components.  */
2886               ipa_call_summary *es = ipa_call_summaries->get_create (edge);
2887               es->call_stmt_size
2888                 = estimate_num_insns (edge->call_stmt, &eni_size_weights);
2889               es->call_stmt_time
2890                 = estimate_num_insns (edge->call_stmt, &eni_time_weights);
2891             }
2892           ipa_update_overall_fn_summary (node);
2893           inlined = false;
2894           timevar_pop (TV_INTEGRATION);
2895         }
2896       /* We iterate incremental inlining to get trivial cases of indirect
2897          inlining.  */
2898       while (iterations < PARAM_VALUE (PARAM_EARLY_INLINER_MAX_ITERATIONS)
2899              && early_inline_small_functions (node))
2900         {
2901           timevar_push (TV_INTEGRATION);
2902           todo |= optimize_inline_calls (current_function_decl);
2903
2904           /* Technically we ought to recompute inline parameters so the new
2905              iteration of early inliner works as expected.  We however have
2906              values approximately right and thus we only need to update edge
2907              info that might be cleared out for newly discovered edges.  */
2908           for (edge = node->callees; edge; edge = edge->next_callee)
2909             {
2910               /* We have no summary for new bound store calls yet.  */
2911               ipa_call_summary *es = ipa_call_summaries->get_create (edge);
2912               es->call_stmt_size
2913                 = estimate_num_insns (edge->call_stmt, &eni_size_weights);
2914               es->call_stmt_time
2915                 = estimate_num_insns (edge->call_stmt, &eni_time_weights);
2916             }
2917           if (iterations < PARAM_VALUE (PARAM_EARLY_INLINER_MAX_ITERATIONS) - 1)
2918             ipa_update_overall_fn_summary (node);
2919           timevar_pop (TV_INTEGRATION);
2920           iterations++;
2921           inlined = false;
2922         }
2923       if (dump_file)
2924         fprintf (dump_file, "Iterations: %i\n", iterations);
2925     }
2926
2927   if (inlined)
2928     {
2929       timevar_push (TV_INTEGRATION);
2930       todo |= optimize_inline_calls (current_function_decl);
2931       timevar_pop (TV_INTEGRATION);
2932     }
2933
2934   fun->always_inline_functions_inlined = true;
2935
2936   return todo;
2937 }
2938
2939 /* Do inlining of small functions.  Doing so early helps profiling and other
2940    passes to be somewhat more effective and avoids some code duplication in
2941    later real inlining pass for testcases with very many function calls.  */
2942
2943 namespace {
2944
2945 const pass_data pass_data_early_inline =
2946 {
2947   GIMPLE_PASS, /* type */
2948   "einline", /* name */
2949   OPTGROUP_INLINE, /* optinfo_flags */
2950   TV_EARLY_INLINING, /* tv_id */
2951   PROP_ssa, /* properties_required */
2952   0, /* properties_provided */
2953   0, /* properties_destroyed */
2954   0, /* todo_flags_start */
2955   0, /* todo_flags_finish */
2956 };
2957
2958 class pass_early_inline : public gimple_opt_pass
2959 {
2960 public:
2961   pass_early_inline (gcc::context *ctxt)
2962     : gimple_opt_pass (pass_data_early_inline, ctxt)
2963   {}
2964
2965   /* opt_pass methods: */
2966   virtual unsigned int execute (function *);
2967
2968 }; // class pass_early_inline
2969
2970 unsigned int
2971 pass_early_inline::execute (function *fun)
2972 {
2973   return early_inliner (fun);
2974 }
2975
2976 } // anon namespace
2977
2978 gimple_opt_pass *
2979 make_pass_early_inline (gcc::context *ctxt)
2980 {
2981   return new pass_early_inline (ctxt);
2982 }
2983
2984 namespace {
2985
2986 const pass_data pass_data_ipa_inline =
2987 {
2988   IPA_PASS, /* type */
2989   "inline", /* name */
2990   OPTGROUP_INLINE, /* optinfo_flags */
2991   TV_IPA_INLINING, /* tv_id */
2992   0, /* properties_required */
2993   0, /* properties_provided */
2994   0, /* properties_destroyed */
2995   0, /* todo_flags_start */
2996   ( TODO_dump_symtab ), /* todo_flags_finish */
2997 };
2998
2999 class pass_ipa_inline : public ipa_opt_pass_d
3000 {
3001 public:
3002   pass_ipa_inline (gcc::context *ctxt)
3003     : ipa_opt_pass_d (pass_data_ipa_inline, ctxt,
3004                       NULL, /* generate_summary */
3005                       NULL, /* write_summary */
3006                       NULL, /* read_summary */
3007                       NULL, /* write_optimization_summary */
3008                       NULL, /* read_optimization_summary */
3009                       NULL, /* stmt_fixup */
3010                       0, /* function_transform_todo_flags_start */
3011                       inline_transform, /* function_transform */
3012                       NULL) /* variable_transform */
3013   {}
3014
3015   /* opt_pass methods: */
3016   virtual unsigned int execute (function *) { return ipa_inline (); }
3017
3018 }; // class pass_ipa_inline
3019
3020 } // anon namespace
3021
3022 ipa_opt_pass_d *
3023 make_pass_ipa_inline (gcc::context *ctxt)
3024 {
3025   return new pass_ipa_inline (ctxt);
3026 }