gcc/ipa-inline-transform.c

   1 /* Callgraph transformations to handle inlining
   2    Copyright (C) 2003-2019 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* The inline decisions are stored in callgraph in "inline plan" and
  22    applied later.
  23
  24    To mark given call inline, use inline_call function.
  25    The function marks the edge inlinable and, if necessary, produces
  26    virtual clone in the callgraph representing the new copy of callee's
  27    function body.
  28
  29    The inline plan is applied on given function body by inline_transform.  */
  30
  31 #include "config.h"
  32 #include "system.h"
  33 #include "coretypes.h"
  34 #include "tm.h"
  35 #include "function.h"
  36 #include "tree.h"
  37 #include "alloc-pool.h"
  38 #include "tree-pass.h"
  39 #include "cgraph.h"
  40 #include "tree-cfg.h"
  41 #include "symbol-summary.h"
  42 #include "tree-vrp.h"
  43 #include "ipa-prop.h"
  44 #include "ipa-fnsummary.h"
  45 #include "ipa-inline.h"
  46 #include "tree-inline.h"
  47 #include "function.h"
  48 #include "cfg.h"
  49 #include "basic-block.h"
  50 #include "ipa-utils.h"
  51
  52 int ncalls_inlined;
  53 int nfunctions_inlined;
  54
  55 /* Scale counts of NODE edges by NUM/DEN.  */
  56
  57 static void
  58 update_noncloned_counts (struct cgraph_node *node,
  59                          profile_count num, profile_count den)
  60 {
  61   struct cgraph_edge *e;
  62
  63   profile_count::adjust_for_ipa_scaling (&num, &den);
  64
  65   for (e = node->callees; e; e = e->next_callee)
  66     {
  67       if (!e->inline_failed)
  68         update_noncloned_counts (e->callee, num, den);
  69       e->count = e->count.apply_scale (num, den);
  70     }
  71   for (e = node->indirect_calls; e; e = e->next_callee)
  72     e->count = e->count.apply_scale (num, den);
  73   node->count = node->count.apply_scale (num, den);
  74 }
  75
  76 /* We removed or are going to remove the last call to NODE.
  77    Return true if we can and want proactively remove the NODE now.
  78    This is important to do, since we want inliner to know when offline
  79    copy of function was removed.  */
  80
  81 static bool
  82 can_remove_node_now_p_1 (struct cgraph_node *node, struct cgraph_edge *e)
  83 {
  84   ipa_ref *ref;
  85
  86   FOR_EACH_ALIAS (node, ref)
  87     {
  88       cgraph_node *alias = dyn_cast <cgraph_node *> (ref->referring);
  89       if ((alias->callers && alias->callers != e)
  90           || !can_remove_node_now_p_1 (alias, e))
  91         return false;
  92     }
  93   /* FIXME: When address is taken of DECL_EXTERNAL function we still
  94      can remove its offline copy, but we would need to keep unanalyzed node in
  95      the callgraph so references can point to it.
  96
  97      Also for comdat group we can ignore references inside a group as we
  98      want to prove the group as a whole to be dead.  */
  99   return (!node->address_taken
 100           && node->can_remove_if_no_direct_calls_and_refs_p ()
 101           /* Inlining might enable more devirtualizing, so we want to remove
 102              those only after all devirtualizable virtual calls are processed.
 103              Lacking may edges in callgraph we just preserve them post
 104              inlining.  */
 105           && (!DECL_VIRTUAL_P (node->decl)
 106               || !opt_for_fn (node->decl, flag_devirtualize))
 107           /* During early inlining some unanalyzed cgraph nodes might be in the
 108              callgraph and they might refer the function in question.  */
 109           && !cgraph_new_nodes.exists ());
 110 }
 111
 112 /* We are going to eliminate last direct call to NODE (or alias of it) via edge E.
 113    Verify that the NODE can be removed from unit and if it is contained in comdat
 114    group that the whole comdat group is removable.  */
 115
 116 static bool
 117 can_remove_node_now_p (struct cgraph_node *node, struct cgraph_edge *e)
 118 {
 119   struct cgraph_node *next;
 120   if (!can_remove_node_now_p_1 (node, e))
 121     return false;
 122
 123   /* When we see same comdat group, we need to be sure that all
 124      items can be removed.  */
 125   if (!node->same_comdat_group || !node->externally_visible)
 126     return true;
 127   for (next = dyn_cast<cgraph_node *> (node->same_comdat_group);
 128        next != node; next = dyn_cast<cgraph_node *> (next->same_comdat_group))
 129     {
 130       if (next->alias)
 131         continue;
 132       if ((next->callers && next->callers != e)
 133           || !can_remove_node_now_p_1 (next, e))
 134         return false;
 135     }
 136   return true;
 137 }
 138
 139 /* Return true if NODE is a master clone with non-inline clones.  */
 140
 141 static bool
 142 master_clone_with_noninline_clones_p (struct cgraph_node *node)
 143 {
 144   if (node->clone_of)
 145     return false;
 146
 147   for (struct cgraph_node *n = node->clones; n; n = n->next_sibling_clone)
 148     if (n->decl != node->decl)
 149       return true;
 150
 151   return false;
 152 }
 153
 154 /* E is expected to be an edge being inlined.  Clone destination node of
 155    the edge and redirect it to the new clone.
 156    DUPLICATE is used for bookkeeping on whether we are actually creating new
 157    clones or re-using node originally representing out-of-line function call.
 158    By default the offline copy is removed, when it appears dead after inlining.
 159    UPDATE_ORIGINAL prevents this transformation.
 160    If OVERALL_SIZE is non-NULL, the size is updated to reflect the
 161    transformation.  */
 162
 163 void
 164 clone_inlined_nodes (struct cgraph_edge *e, bool duplicate,
 165                      bool update_original, int *overall_size)
 166 {
 167   struct cgraph_node *inlining_into;
 168   struct cgraph_edge *next;
 169
 170   if (e->caller->inlined_to)
 171     inlining_into = e->caller->inlined_to;
 172   else
 173     inlining_into = e->caller;
 174
 175   if (duplicate)
 176     {
 177       /* We may eliminate the need for out-of-line copy to be output.
 178          In that case just go ahead and re-use it.  This is not just an
 179          memory optimization.  Making offline copy of function disappear
 180          from the program will improve future decisions on inlining.  */
 181       if (!e->callee->callers->next_caller
 182           /* Recursive inlining never wants the master clone to
 183              be overwritten.  */
 184           && update_original
 185           && can_remove_node_now_p (e->callee, e)
 186           /* We cannot overwrite a master clone with non-inline clones
 187              until after these clones are materialized.  */
 188           && !master_clone_with_noninline_clones_p (e->callee))
 189         {
 190           /* TODO: When callee is in a comdat group, we could remove all of it,
 191              including all inline clones inlined into it.  That would however
 192              need small function inlining to register edge removal hook to
 193              maintain the priority queue.
 194
 195              For now we keep the other functions in the group in program until
 196              cgraph_remove_unreachable_functions gets rid of them.  */
 197           gcc_assert (!e->callee->inlined_to);
 198           e->callee->remove_from_same_comdat_group ();
 199           if (e->callee->definition
 200               && inline_account_function_p (e->callee))
 201             {
 202               gcc_assert (!e->callee->alias);
 203               if (overall_size)
 204                 *overall_size -= ipa_size_summaries->get (e->callee)->size;
 205               nfunctions_inlined++;
 206             }
 207           duplicate = false;
 208           e->callee->externally_visible = false;
 209           update_noncloned_counts (e->callee, e->count, e->callee->count);
 210
 211           dump_callgraph_transformation (e->callee, inlining_into,
 212                                          "inlining to");
 213         }
 214       else
 215         {
 216           struct cgraph_node *n;
 217
 218           n = e->callee->create_clone (e->callee->decl,
 219                                        e->count,
 220                                        update_original, vNULL, true,
 221                                        inlining_into,
 222                                        NULL);
 223           n->used_as_abstract_origin = e->callee->used_as_abstract_origin;
 224           e->redirect_callee (n);
 225         }
 226     }
 227   else
 228     e->callee->remove_from_same_comdat_group ();
 229
 230   e->callee->inlined_to = inlining_into;
 231
 232   /* Recursively clone all bodies.  */
 233   for (e = e->callee->callees; e; e = next)
 234     {
 235       next = e->next_callee;
 236       if (!e->inline_failed)
 237         clone_inlined_nodes (e, duplicate, update_original, overall_size);
 238     }
 239 }
 240
 241 /* Check all speculations in N and if any seem useless, resolve them.  When a
 242    first edge is resolved, pop all edges from NEW_EDGES and insert them to
 243    EDGE_SET.  Then remove each resolved edge from EDGE_SET, if it is there.  */
 244
 245 static bool
 246 check_speculations_1 (cgraph_node *n, vec<cgraph_edge *> *new_edges,
 247                       hash_set <cgraph_edge *> *edge_set)
 248 {
 249   bool speculation_removed = false;
 250   cgraph_edge *next;
 251
 252   for (cgraph_edge *e = n->callees; e; e = next)
 253     {
 254       next = e->next_callee;
 255       if (e->speculative && !speculation_useful_p (e, true))
 256         {
 257           while (new_edges && !new_edges->is_empty ())
 258             edge_set->add (new_edges->pop ());
 259           edge_set->remove (e);
 260
 261           e->resolve_speculation (NULL);
 262           speculation_removed = true;
 263         }
 264       else if (!e->inline_failed)
 265         speculation_removed |= check_speculations_1 (e->callee, new_edges,
 266                                                      edge_set);
 267     }
 268   return speculation_removed;
 269 }
 270
 271 /* Push E to NEW_EDGES.  Called from hash_set traverse method, which
 272    unfortunately means this function has to have external linkage, otherwise
 273    the code will not compile with gcc 4.8.  */
 274
 275 bool
 276 push_all_edges_in_set_to_vec (cgraph_edge * const &e,
 277                               vec<cgraph_edge *> *new_edges)
 278 {
 279   new_edges->safe_push (e);
 280   return true;
 281 }
 282
 283 /* Check all speculations in N and if any seem useless, resolve them and remove
 284    them from NEW_EDGES.  */
 285
 286 static bool
 287 check_speculations (cgraph_node *n, vec<cgraph_edge *> *new_edges)
 288 {
 289   hash_set <cgraph_edge *> edge_set;
 290   bool res = check_speculations_1 (n, new_edges, &edge_set);
 291   if (!edge_set.is_empty ())
 292     edge_set.traverse <vec<cgraph_edge *> *,
 293                        push_all_edges_in_set_to_vec> (new_edges);
 294   return res;
 295 }
 296
 297 /* Mark all call graph edges coming out of NODE and all nodes that have been
 298    inlined to it as in_polymorphic_cdtor.  */
 299
 300 static void
 301 mark_all_inlined_calls_cdtor (cgraph_node *node)
 302 {
 303   for (cgraph_edge *cs = node->callees; cs; cs = cs->next_callee)
 304     {
 305       cs->in_polymorphic_cdtor = true;
 306       if (!cs->inline_failed)
 307         mark_all_inlined_calls_cdtor (cs->callee);
 308     }
 309   for (cgraph_edge *cs = node->indirect_calls; cs; cs = cs->next_callee)
 310     cs->in_polymorphic_cdtor = true;
 311 }
 312
 313
 314 /* Mark edge E as inlined and update callgraph accordingly.  UPDATE_ORIGINAL
 315    specify whether profile of original function should be updated.  If any new
 316    indirect edges are discovered in the process, add them to NEW_EDGES, unless
 317    it is NULL. If UPDATE_OVERALL_SUMMARY is false, do not bother to recompute overall
 318    size of caller after inlining. Caller is required to eventually do it via
 319    ipa_update_overall_fn_summary.
 320    If callee_removed is non-NULL, set it to true if we removed callee node.
 321
 322    Return true iff any new callgraph edges were discovered as a
 323    result of inlining.  */
 324
 325 bool
 326 inline_call (struct cgraph_edge *e, bool update_original,
 327              vec<cgraph_edge *> *new_edges,
 328              int *overall_size, bool update_overall_summary,
 329              bool *callee_removed)
 330 {
 331   int old_size = 0, new_size = 0;
 332   struct cgraph_node *to = NULL;
 333   struct cgraph_edge *curr = e;
 334   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 335   bool new_edges_found = false;
 336
 337   int estimated_growth = 0;
 338   if (! update_overall_summary)
 339     estimated_growth = estimate_edge_growth (e);
 340   /* This is used only for assert bellow.  */
 341 #if 0
 342   bool predicated = inline_edge_summary (e)->predicate != NULL;
 343 #endif
 344
 345   /* Don't inline inlined edges.  */
 346   gcc_assert (e->inline_failed);
 347   /* Don't even think of inlining inline clone.  */
 348   gcc_assert (!callee->inlined_to);
 349
 350   to = e->caller;
 351   if (to->inlined_to)
 352     to = to->inlined_to;
 353   if (to->thunk.thunk_p)
 354     {
 355       struct cgraph_node *target = to->callees->callee;
 356       thunk_expansion = true;
 357       symtab->call_cgraph_removal_hooks (to);
 358       if (in_lto_p)
 359         to->get_untransformed_body ();
 360       to->expand_thunk (false, true);
 361       /* When thunk is instrumented we may have multiple callees.  */
 362       for (e = to->callees; e && e->callee != target; e = e->next_callee)
 363         ;
 364       symtab->call_cgraph_insertion_hooks (to);
 365       thunk_expansion = false;
 366       gcc_assert (e);
 367     }
 368
 369
 370   e->inline_failed = CIF_OK;
 371   DECL_POSSIBLY_INLINED (callee->decl) = true;
 372
 373   if (DECL_FUNCTION_PERSONALITY (callee->decl))
 374     DECL_FUNCTION_PERSONALITY (to->decl)
 375       = DECL_FUNCTION_PERSONALITY (callee->decl);
 376
 377   bool reload_optimization_node = false;
 378   if (!opt_for_fn (callee->decl, flag_strict_aliasing)
 379       && opt_for_fn (to->decl, flag_strict_aliasing))
 380     {
 381       struct gcc_options opts = global_options;
 382
 383       cl_optimization_restore (&opts, opts_for_fn (to->decl));
 384       opts.x_flag_strict_aliasing = false;
 385       if (dump_file)
 386         fprintf (dump_file, "Dropping flag_strict_aliasing on %s\n",
 387                  to->dump_name ());
 388       DECL_FUNCTION_SPECIFIC_OPTIMIZATION (to->decl)
 389          = build_optimization_node (&opts);
 390       reload_optimization_node = true;
 391     }
 392
 393   ipa_fn_summary *caller_info = ipa_fn_summaries->get (to);
 394   ipa_fn_summary *callee_info = ipa_fn_summaries->get (callee);
 395   if (!caller_info->fp_expressions && callee_info->fp_expressions)
 396     {
 397       caller_info->fp_expressions = true;
 398       if (opt_for_fn (callee->decl, flag_rounding_math)
 399           != opt_for_fn (to->decl, flag_rounding_math)
 400           || opt_for_fn (callee->decl, flag_trapping_math)
 401              != opt_for_fn (to->decl, flag_trapping_math)
 402           || opt_for_fn (callee->decl, flag_unsafe_math_optimizations)
 403              != opt_for_fn (to->decl, flag_unsafe_math_optimizations)
 404           || opt_for_fn (callee->decl, flag_finite_math_only)
 405              != opt_for_fn (to->decl, flag_finite_math_only)
 406           || opt_for_fn (callee->decl, flag_signaling_nans)
 407              != opt_for_fn (to->decl, flag_signaling_nans)
 408           || opt_for_fn (callee->decl, flag_cx_limited_range)
 409              != opt_for_fn (to->decl, flag_cx_limited_range)
 410           || opt_for_fn (callee->decl, flag_signed_zeros)
 411              != opt_for_fn (to->decl, flag_signed_zeros)
 412           || opt_for_fn (callee->decl, flag_associative_math)
 413              != opt_for_fn (to->decl, flag_associative_math)
 414           || opt_for_fn (callee->decl, flag_reciprocal_math)
 415              != opt_for_fn (to->decl, flag_reciprocal_math)
 416           || opt_for_fn (callee->decl, flag_fp_int_builtin_inexact)
 417              != opt_for_fn (to->decl, flag_fp_int_builtin_inexact)
 418           || opt_for_fn (callee->decl, flag_errno_math)
 419              != opt_for_fn (to->decl, flag_errno_math))
 420         {
 421           struct gcc_options opts = global_options;
 422
 423           cl_optimization_restore (&opts, opts_for_fn (to->decl));
 424           opts.x_flag_rounding_math
 425             = opt_for_fn (callee->decl, flag_rounding_math);
 426           opts.x_flag_trapping_math
 427             = opt_for_fn (callee->decl, flag_trapping_math);
 428           opts.x_flag_unsafe_math_optimizations
 429             = opt_for_fn (callee->decl, flag_unsafe_math_optimizations);
 430           opts.x_flag_finite_math_only
 431             = opt_for_fn (callee->decl, flag_finite_math_only);
 432           opts.x_flag_signaling_nans
 433             = opt_for_fn (callee->decl, flag_signaling_nans);
 434           opts.x_flag_cx_limited_range
 435             = opt_for_fn (callee->decl, flag_cx_limited_range);
 436           opts.x_flag_signed_zeros
 437             = opt_for_fn (callee->decl, flag_signed_zeros);
 438           opts.x_flag_associative_math
 439             = opt_for_fn (callee->decl, flag_associative_math);
 440           opts.x_flag_reciprocal_math
 441             = opt_for_fn (callee->decl, flag_reciprocal_math);
 442           opts.x_flag_fp_int_builtin_inexact
 443             = opt_for_fn (callee->decl, flag_fp_int_builtin_inexact);
 444           opts.x_flag_errno_math
 445             = opt_for_fn (callee->decl, flag_errno_math);
 446           if (dump_file)
 447             fprintf (dump_file, "Copying FP flags from %s to %s\n",
 448                      callee->dump_name (), to->dump_name ());
 449           DECL_FUNCTION_SPECIFIC_OPTIMIZATION (to->decl)
 450              = build_optimization_node (&opts);
 451           reload_optimization_node = true;
 452         }
 453     }
 454
 455   /* Reload global optimization flags.  */
 456   if (reload_optimization_node && DECL_STRUCT_FUNCTION (to->decl) == cfun)
 457     set_cfun (cfun, true);
 458
 459   /* If aliases are involved, redirect edge to the actual destination and
 460      possibly remove the aliases.  */
 461   if (e->callee != callee)
 462     {
 463       struct cgraph_node *alias = e->callee, *next_alias;
 464       e->redirect_callee (callee);
 465       while (alias && alias != callee)
 466         {
 467           if (!alias->callers
 468               && can_remove_node_now_p (alias,
 469                                         !e->next_caller && !e->prev_caller ? e : NULL))
 470             {
 471               next_alias = alias->get_alias_target ();
 472               alias->remove ();
 473               if (callee_removed)
 474                 *callee_removed = true;
 475               alias = next_alias;
 476             }
 477           else
 478             break;
 479         }
 480     }
 481
 482   clone_inlined_nodes (e, true, update_original, overall_size);
 483
 484   gcc_assert (curr->callee->inlined_to == to);
 485
 486   old_size = ipa_size_summaries->get (to)->size;
 487   ipa_merge_fn_summary_after_inlining (e);
 488   if (e->in_polymorphic_cdtor)
 489     mark_all_inlined_calls_cdtor (e->callee);
 490   if (opt_for_fn (e->caller->decl, optimize))
 491     new_edges_found = ipa_propagate_indirect_call_infos (curr, new_edges);
 492   bool removed_p = check_speculations (e->callee, new_edges);
 493   if (update_overall_summary)
 494     ipa_update_overall_fn_summary (to, new_edges_found || removed_p);
 495   else
 496     /* Update self size by the estimate so overall function growth limits
 497        work for further inlining into this function.  Before inlining
 498        the function we inlined to again we expect the caller to update
 499        the overall summary.  */
 500     ipa_size_summaries->get (to)->size += estimated_growth;
 501   new_size = ipa_size_summaries->get (to)->size;
 502
 503   if (callee->calls_comdat_local)
 504     to->calls_comdat_local = true;
 505   else if (to->calls_comdat_local && callee->comdat_local_p ())
 506     {
 507       struct cgraph_edge *se = to->callees;
 508       for (; se; se = se->next_callee)
 509         if (se->inline_failed && se->callee->comdat_local_p ())
 510           break;
 511       if (se == NULL)
 512         to->calls_comdat_local = false;
 513     }
 514
 515   /* FIXME: This assert suffers from roundoff errors, disable it for GCC 5
 516      and revisit it after conversion to sreals in GCC 6.
 517      See PR 65654.  */
 518 #if 0
 519   /* Verify that estimated growth match real growth.  Allow off-by-one
 520      error due to ipa_fn_summary::size_scale roudoff errors.  */
 521   gcc_assert (!update_overall_summary || !overall_size || new_edges_found
 522               || abs (estimated_growth - (new_size - old_size)) <= 1
 523               || speculation_removed
 524               /* FIXME: a hack.  Edges with false predicate are accounted
 525                  wrong, we should remove them from callgraph.  */
 526               || predicated);
 527 #endif
 528
 529   /* Account the change of overall unit size; external functions will be
 530      removed and are thus not accounted.  */
 531   if (overall_size && inline_account_function_p (to))
 532     *overall_size += new_size - old_size;
 533   ncalls_inlined++;
 534
 535   /* This must happen after ipa_merge_fn_summary_after_inlining that rely on jump
 536      functions of callee to not be updated.  */
 537   return new_edges_found;
 538 }
 539
 540
 541 /* Copy function body of NODE and redirect all inline clones to it.
 542    This is done before inline plan is applied to NODE when there are
 543    still some inline clones if it.
 544
 545    This is necessary because inline decisions are not really transitive
 546    and the other inline clones may have different bodies.  */
 547
 548 static struct cgraph_node *
 549 save_inline_function_body (struct cgraph_node *node)
 550 {
 551   struct cgraph_node *first_clone, *n;
 552
 553   if (dump_file)
 554     fprintf (dump_file, "\nSaving body of %s for later reuse\n",
 555              node->name ());
 556
 557   gcc_assert (node == cgraph_node::get (node->decl));
 558
 559   /* first_clone will be turned into real function.  */
 560   first_clone = node->clones;
 561
 562   /* Arrange first clone to not be thunk as those do not have bodies.  */
 563   if (first_clone->thunk.thunk_p)
 564     {
 565       while (first_clone->thunk.thunk_p)
 566         first_clone = first_clone->next_sibling_clone;
 567       first_clone->prev_sibling_clone->next_sibling_clone
 568         = first_clone->next_sibling_clone;
 569       if (first_clone->next_sibling_clone)
 570         first_clone->next_sibling_clone->prev_sibling_clone
 571            = first_clone->prev_sibling_clone;
 572       first_clone->next_sibling_clone = node->clones;
 573       first_clone->prev_sibling_clone = NULL;
 574       node->clones->prev_sibling_clone = first_clone;
 575       node->clones = first_clone;
 576     }
 577   first_clone->decl = copy_node (node->decl);
 578   first_clone->decl->decl_with_vis.symtab_node = first_clone;
 579   gcc_assert (first_clone == cgraph_node::get (first_clone->decl));
 580
 581   /* Now reshape the clone tree, so all other clones descends from
 582      first_clone.  */
 583   if (first_clone->next_sibling_clone)
 584     {
 585       for (n = first_clone->next_sibling_clone; n->next_sibling_clone;
 586            n = n->next_sibling_clone)
 587         n->clone_of = first_clone;
 588       n->clone_of = first_clone;
 589       n->next_sibling_clone = first_clone->clones;
 590       if (first_clone->clones)
 591         first_clone->clones->prev_sibling_clone = n;
 592       first_clone->clones = first_clone->next_sibling_clone;
 593       first_clone->next_sibling_clone->prev_sibling_clone = NULL;
 594       first_clone->next_sibling_clone = NULL;
 595       gcc_assert (!first_clone->prev_sibling_clone);
 596     }
 597   first_clone->clone_of = NULL;
 598
 599   /* Now node in question has no clones.  */
 600   node->clones = NULL;
 601
 602   /* Inline clones share decl with the function they are cloned
 603      from.  Walk the whole clone tree and redirect them all to the
 604      new decl.  */
 605   if (first_clone->clones)
 606     for (n = first_clone->clones; n != first_clone;)
 607       {
 608         gcc_assert (n->decl == node->decl);
 609         n->decl = first_clone->decl;
 610         if (n->clones)
 611           n = n->clones;
 612         else if (n->next_sibling_clone)
 613           n = n->next_sibling_clone;
 614         else
 615           {
 616             while (n != first_clone && !n->next_sibling_clone)
 617               n = n->clone_of;
 618             if (n != first_clone)
 619               n = n->next_sibling_clone;
 620           }
 621       }
 622
 623   /* Copy the OLD_VERSION_NODE function tree to the new version.  */
 624   tree_function_versioning (node->decl, first_clone->decl,
 625                             NULL, NULL, true, NULL, NULL);
 626
 627   /* The function will be short lived and removed after we inline all the clones,
 628      but make it internal so we won't confuse ourself.  */
 629   DECL_EXTERNAL (first_clone->decl) = 0;
 630   TREE_PUBLIC (first_clone->decl) = 0;
 631   DECL_COMDAT (first_clone->decl) = 0;
 632   first_clone->ipa_transforms_to_apply.release ();
 633
 634   /* When doing recursive inlining, the clone may become unnecessary.
 635      This is possible i.e. in the case when the recursive function is proved to be
 636      non-throwing and the recursion happens only in the EH landing pad.
 637      We cannot remove the clone until we are done with saving the body.
 638      Remove it now.  */
 639   if (!first_clone->callers)
 640     {
 641       first_clone->remove_symbol_and_inline_clones ();
 642       first_clone = NULL;
 643     }
 644   else if (flag_checking)
 645     first_clone->verify ();
 646
 647   return first_clone;
 648 }
 649
 650 /* Return true when function body of DECL still needs to be kept around
 651    for later re-use.  */
 652 static bool
 653 preserve_function_body_p (struct cgraph_node *node)
 654 {
 655   gcc_assert (symtab->global_info_ready);
 656   gcc_assert (!node->alias && !node->thunk.thunk_p);
 657
 658   /* Look if there is any non-thunk clone around.  */
 659   for (node = node->clones; node; node = node->next_sibling_clone)
 660     if (!node->thunk.thunk_p)
 661       return true;
 662   return false;
 663 }
 664
 665 /* Apply inline plan to function.  */
 666
 667 unsigned int
 668 inline_transform (struct cgraph_node *node)
 669 {
 670   unsigned int todo = 0;
 671   struct cgraph_edge *e, *next;
 672   bool has_inline = false;
 673
 674   /* FIXME: Currently the pass manager is adding inline transform more than
 675      once to some clones.  This needs revisiting after WPA cleanups.  */
 676   if (cfun->after_inlining)
 677     return 0;
 678
 679   /* We might need the body of this function so that we can expand
 680      it inline somewhere else.  */
 681   if (preserve_function_body_p (node))
 682     save_inline_function_body (node);
 683
 684   profile_count num = node->count;
 685   profile_count den = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
 686   bool scale = num.initialized_p () && !(num == den);
 687   if (scale)
 688     {
 689       profile_count::adjust_for_ipa_scaling (&num, &den);
 690       if (dump_file)
 691         {
 692           fprintf (dump_file, "Applying count scale ");
 693           num.dump (dump_file);
 694           fprintf (dump_file, "/");
 695           den.dump (dump_file);
 696           fprintf (dump_file, "\n");
 697         }
 698
 699       basic_block bb;
 700       cfun->cfg->count_max = profile_count::uninitialized ();
 701       FOR_ALL_BB_FN (bb, cfun)
 702         {
 703           bb->count = bb->count.apply_scale (num, den);
 704           cfun->cfg->count_max = cfun->cfg->count_max.max (bb->count);
 705         }
 706       ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = node->count;
 707     }
 708
 709   for (e = node->callees; e; e = next)
 710     {
 711       if (!e->inline_failed)
 712         has_inline = true;
 713       next = e->next_callee;
 714       e->redirect_call_stmt_to_callee ();
 715     }
 716   node->remove_all_references ();
 717
 718   timevar_push (TV_INTEGRATION);
 719   if (node->callees && (opt_for_fn (node->decl, optimize) || has_inline))
 720     {
 721       todo = optimize_inline_calls (current_function_decl);
 722     }
 723   timevar_pop (TV_INTEGRATION);
 724
 725   cfun->always_inline_functions_inlined = true;
 726   cfun->after_inlining = true;
 727   todo |= execute_fixup_cfg ();
 728
 729   if (!(todo & TODO_update_ssa_any))
 730     /* Redirecting edges might lead to a need for vops to be recomputed.  */
 731     todo |= TODO_update_ssa_only_virtuals;
 732
 733   return todo;
 734 }