]> git.ipfire.org Git - thirdparty/gcc.git/blame - gcc/lto/lto-partition.c
IPA REF refactoring
[thirdparty/gcc.git] / gcc / lto / lto-partition.c
CommitLineData
a66dc285 1/* LTO partitioning logic routines.
23a5b65a 2 Copyright (C) 2009-2014 Free Software Foundation, Inc.
a66dc285
JH
3
4This file is part of GCC.
5
6GCC is free software; you can redistribute it and/or modify it under
7the terms of the GNU General Public License as published by the Free
8Software Foundation; either version 3, or (at your option) any later
9version.
10
11GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12WARRANTY; without even the implied warranty of MERCHANTABILITY or
13FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14for more details.
15
16You should have received a copy of the GNU General Public License
17along with GCC; see the file COPYING3. If not see
18<http://www.gnu.org/licenses/>. */
19
20#include "config.h"
21#include "system.h"
22#include "coretypes.h"
23#include "toplev.h"
24#include "tree.h"
d8a2d370 25#include "gcc-symtab.h"
2fb9a547
AM
26#include "basic-block.h"
27#include "tree-ssa-alias.h"
28#include "internal-fn.h"
29#include "gimple-expr.h"
30#include "is-a.h"
8e9055ae 31#include "gimple.h"
a66dc285
JH
32#include "tm.h"
33#include "cgraph.h"
34#include "lto-streamer.h"
35#include "timevar.h"
36#include "params.h"
37#include "ipa-inline.h"
38#include "ipa-utils.h"
39#include "lto-partition.h"
40
9771b263 41vec<ltrans_partition> ltrans_partitions;
a66dc285 42
5e20cdc9 43static void add_symbol_to_partition (ltrans_partition part, symtab_node *node);
c3c445e1 44
a66dc285
JH
45
46/* Create new partition with name NAME. */
c3c445e1 47
a66dc285
JH
48static ltrans_partition
49new_partition (const char *name)
50{
51 ltrans_partition part = XCNEW (struct ltrans_partition_def);
e75f8f79 52 part->encoder = lto_symtab_encoder_new (false);
a66dc285
JH
53 part->name = name;
54 part->insns = 0;
9771b263 55 ltrans_partitions.safe_push (part);
a66dc285
JH
56 return part;
57}
58
59/* Free memory used by ltrans datastructures. */
c3c445e1 60
a66dc285
JH
61void
62free_ltrans_partitions (void)
63{
64 unsigned int idx;
65 ltrans_partition part;
9771b263 66 for (idx = 0; ltrans_partitions.iterate (idx, &part); idx++)
a66dc285 67 {
c3c445e1
JH
68 if (part->initializers_visited)
69 pointer_set_destroy (part->initializers_visited);
7b99cca4 70 /* Symtab encoder is freed after streaming. */
a66dc285
JH
71 free (part);
72 }
9771b263 73 ltrans_partitions.release ();
a66dc285
JH
74}
75
c3c445e1
JH
76/* Return true if symbol is already in some partition. */
77
78static inline bool
5e20cdc9 79symbol_partitioned_p (symtab_node *node)
a66dc285 80{
67348ccc 81 return node->aux;
1cdbb3f9
JH
82}
83
c3c445e1 84/* Add references into the partition. */
1cdbb3f9 85static void
5e20cdc9 86add_references_to_partition (ltrans_partition part, symtab_node *node)
1cdbb3f9
JH
87{
88 int i;
d122681a 89 struct ipa_ref *ref = NULL;
1cdbb3f9 90
c3c445e1 91 /* Add all duplicated references to the partition. */
d122681a 92 for (i = 0; node->iterate_reference (i, ref); i++)
96451279 93 if (symtab_get_symbol_partitioning_class (ref->referred) == SYMBOL_DUPLICATE)
c3c445e1
JH
94 add_symbol_to_partition (part, ref->referred);
95 /* References to a readonly variable may be constant foled into its value.
96 Recursively look into the initializers of the constant variable and add
97 references, too. */
7de90a6c 98 else if (is_a <varpool_node *> (ref->referred)
67348ccc 99 && ctor_for_folding (ref->referred->decl) != error_mark_node
c3c445e1 100 && !lto_symtab_encoder_in_partition_p (part->encoder, ref->referred))
1cdbb3f9 101 {
c3c445e1
JH
102 if (!part->initializers_visited)
103 part->initializers_visited = pointer_set_create ();
104 if (!pointer_set_insert (part->initializers_visited, ref->referred))
105 add_references_to_partition (part, ref->referred);
1cdbb3f9 106 }
a66dc285
JH
107}
108
c3c445e1
JH
109/* Helper function for add_symbol_to_partition doing the actual dirty work
110 of adding NODE to PART. */
a66dc285
JH
111
112static bool
5e20cdc9 113add_symbol_to_partition_1 (ltrans_partition part, symtab_node *node)
a66dc285 114{
96451279 115 enum symbol_partitioning_class c = symtab_get_symbol_partitioning_class (node);
c3c445e1 116 int i;
d122681a 117 struct ipa_ref *ref = NULL;
5e20cdc9 118 symtab_node *node1;
a66dc285 119
c3c445e1 120 /* If NODE is already there, we have nothing to do. */
67348ccc 121 if (lto_symtab_encoder_in_partition_p (part->encoder, node))
c3c445e1
JH
122 return true;
123
124 /* non-duplicated aliases or tunks of a duplicated symbol needs to be output
125 just once.
126
127 Be lax about comdats; they may or may not be duplicated and we may
128 end up in need to duplicate keyed comdat because it has unkeyed alias. */
67348ccc 129 if (c == SYMBOL_PARTITION && !DECL_COMDAT (node->decl)
c3c445e1 130 && symbol_partitioned_p (node))
1cdbb3f9
JH
131 return false;
132
c3c445e1
JH
133 /* Be sure that we never try to duplicate partitioned symbol
134 or add external symbol. */
135 gcc_assert (c != SYMBOL_EXTERNAL
136 && (c == SYMBOL_DUPLICATE || !symbol_partitioned_p (node)));
137
67348ccc 138 lto_set_symtab_encoder_in_partition (part->encoder, node);
a66dc285 139
c3c445e1 140 if (symbol_partitioned_p (node))
a66dc285 141 {
67348ccc 142 node->in_other_partition = 1;
a66dc285 143 if (cgraph_dump_file)
c3c445e1 144 fprintf (cgraph_dump_file, "Symbol node %s now used in multiple partitions\n",
fec39fa6 145 node->name ());
a66dc285 146 }
67348ccc 147 node->aux = (void *)((size_t)node->aux + 1);
a66dc285 148
7de90a6c 149 if (cgraph_node *cnode = dyn_cast <cgraph_node *> (node))
c3c445e1 150 {
c3c445e1 151 struct cgraph_edge *e;
39434bce
JH
152 if (!node->alias)
153 part->insns += inline_summary (cnode)->self_size;
c3c445e1
JH
154
155 /* Add all inline clones and callees that are duplicated. */
156 for (e = cnode->callees; e; e = e->next_callee)
157 if (!e->inline_failed)
67348ccc 158 add_symbol_to_partition_1 (part, e->callee);
96451279 159 else if (symtab_get_symbol_partitioning_class (e->callee) == SYMBOL_DUPLICATE)
67348ccc 160 add_symbol_to_partition (part, e->callee);
c3c445e1
JH
161
162 /* Add all thunks associated with the function. */
163 for (e = cnode->callers; e; e = e->next_caller)
164 if (e->caller->thunk.thunk_p)
67348ccc 165 add_symbol_to_partition_1 (part, e->caller);
c3c445e1 166 }
a66dc285 167
c3c445e1 168 add_references_to_partition (part, node);
a66dc285 169
c3c445e1 170 /* Add all aliases associated with the symbol. */
d122681a 171 for (i = 0; node->iterate_referring (i, ref); i++)
67348ccc 172 if (ref->use == IPA_REF_ALIAS && !node->weakref)
c3c445e1 173 add_symbol_to_partition_1 (part, ref->referring);
a66dc285 174
c3c445e1 175 /* Ensure that SAME_COMDAT_GROUP lists all allways added in a group. */
67348ccc
DM
176 if (node->same_comdat_group)
177 for (node1 = node->same_comdat_group;
178 node1 != node; node1 = node1->same_comdat_group)
96451279
JH
179 if (!node->alias)
180 {
181 bool added = add_symbol_to_partition_1 (part, node1);
182 gcc_assert (added);
183 }
c3c445e1 184 return true;
a66dc285
JH
185}
186
c3c445e1
JH
187/* If symbol NODE is really part of other symbol's definition (i.e. it is
188 internal label, thunk, alias or so), return the outer symbol.
189 When add_symbol_to_partition_1 is called on the outer symbol it must
190 eventually add NODE, too. */
5e20cdc9
DM
191static symtab_node *
192contained_in_symbol (symtab_node *node)
c3c445e1
JH
193{
194 /* Weakrefs are never contained in anything. */
67348ccc 195 if (node->weakref)
c3c445e1 196 return node;
7de90a6c 197 if (cgraph_node *cnode = dyn_cast <cgraph_node *> (node))
c3c445e1 198 {
5d59b5e1 199 cnode = cgraph_function_node (cnode, NULL);
c3c445e1
JH
200 if (cnode->global.inlined_to)
201 cnode = cnode->global.inlined_to;
67348ccc 202 return cnode;
c3c445e1 203 }
7de90a6c 204 else if (varpool_node *vnode = dyn_cast <varpool_node *> (node))
67348ccc 205 return varpool_variable_node (vnode, NULL);
c3c445e1
JH
206 return node;
207}
208
209/* Add symbol NODE to partition. When definition of NODE is part
210 of other symbol definition, add the other symbol, too. */
a66dc285
JH
211
212static void
5e20cdc9 213add_symbol_to_partition (ltrans_partition part, symtab_node *node)
a66dc285 214{
5e20cdc9 215 symtab_node *node1;
a66dc285 216
c3c445e1 217 /* Verify that we do not try to duplicate something that can not be. */
96451279 218 gcc_checking_assert (symtab_get_symbol_partitioning_class (node) == SYMBOL_DUPLICATE
c3c445e1 219 || !symbol_partitioned_p (node));
a66dc285 220
c3c445e1
JH
221 while ((node1 = contained_in_symbol (node)) != node)
222 node = node1;
a66dc285 223
c3c445e1
JH
224 /* If we have duplicated symbol contained in something we can not duplicate,
225 we are very badly screwed. The other way is possible, so we do not
226 assert this in add_symbol_to_partition_1.
227
228 Be lax about comdats; they may or may not be duplicated and we may
229 end up in need to duplicate keyed comdat because it has unkeyed alias. */
9cec31f4 230
96451279 231 gcc_assert (symtab_get_symbol_partitioning_class (node) == SYMBOL_DUPLICATE
67348ccc 232 || DECL_COMDAT (node->decl)
c3c445e1 233 || !symbol_partitioned_p (node));
9cec31f4 234
c3c445e1 235 add_symbol_to_partition_1 (part, node);
a66dc285
JH
236}
237
238/* Undo all additions until number of cgraph nodes in PARITION is N_CGRAPH_NODES
239 and number of varpool nodes is N_VARPOOL_NODES. */
240
241static void
7b99cca4 242undo_partition (ltrans_partition partition, unsigned int n_nodes)
a66dc285 243{
7b99cca4 244 while (lto_symtab_encoder_size (partition->encoder) > (int)n_nodes)
a66dc285 245 {
5e20cdc9 246 symtab_node *node = lto_symtab_encoder_deref (partition->encoder,
7b99cca4 247 n_nodes);
39434bce 248 cgraph_node *cnode;
c3c445e1
JH
249
250 /* After UNDO we no longer know what was visited. */
251 if (partition->initializers_visited)
252 pointer_set_destroy (partition->initializers_visited);
253 partition->initializers_visited = NULL;
254
7de90a6c 255 if (!node->alias && (cnode = dyn_cast <cgraph_node *> (node)))
5d59b5e1 256 partition->insns -= inline_summary (cnode)->self_size;
7b99cca4 257 lto_symtab_encoder_delete_node (partition->encoder, node);
67348ccc 258 node->aux = (void *)((size_t)node->aux - 1);
a66dc285
JH
259 }
260}
261
a66dc285
JH
262/* Group cgrah nodes by input files. This is used mainly for testing
263 right now. */
264
265void
266lto_1_to_1_map (void)
267{
5e20cdc9 268 symtab_node *node;
a66dc285
JH
269 struct lto_file_decl_data *file_data;
270 struct pointer_map_t *pmap;
271 ltrans_partition partition;
272 void **slot;
273 int npartitions = 0;
274
a66dc285
JH
275 pmap = pointer_map_create ();
276
c3c445e1 277 FOR_EACH_SYMBOL (node)
a66dc285 278 {
96451279 279 if (symtab_get_symbol_partitioning_class (node) != SYMBOL_PARTITION
c3c445e1 280 || symbol_partitioned_p (node))
a66dc285
JH
281 continue;
282
67348ccc 283 file_data = node->lto_file_data;
a66dc285
JH
284
285 if (file_data)
286 {
287 slot = pointer_map_contains (pmap, file_data);
288 if (slot)
289 partition = (ltrans_partition) *slot;
290 else
291 {
292 partition = new_partition (file_data->file_name);
293 slot = pointer_map_insert (pmap, file_data);
294 *slot = partition;
295 npartitions++;
296 }
297 }
9771b263
DN
298 else if (!file_data && ltrans_partitions.length ())
299 partition = ltrans_partitions[0];
a66dc285
JH
300 else
301 {
302 partition = new_partition ("");
303 slot = pointer_map_insert (pmap, NULL);
304 *slot = partition;
305 npartitions++;
306 }
307
67348ccc 308 add_symbol_to_partition (partition, node);
a66dc285 309 }
a66dc285
JH
310
311 /* If the cgraph is empty, create one cgraph node set so that there is still
312 an output file for any variables that need to be exported in a DSO. */
313 if (!npartitions)
314 new_partition ("empty");
315
316 pointer_map_destroy (pmap);
317
c3c445e1
JH
318}
319
320/* Maximal partitioning. Put every new symbol into new partition if possible. */
a66dc285 321
c3c445e1
JH
322void
323lto_max_map (void)
324{
5e20cdc9 325 symtab_node *node;
c3c445e1
JH
326 ltrans_partition partition;
327 int npartitions = 0;
328
329 FOR_EACH_SYMBOL (node)
330 {
96451279 331 if (symtab_get_symbol_partitioning_class (node) != SYMBOL_PARTITION
c3c445e1
JH
332 || symbol_partitioned_p (node))
333 continue;
fec39fa6 334 partition = new_partition (node->asm_name ());
67348ccc 335 add_symbol_to_partition (partition, node);
c3c445e1
JH
336 npartitions++;
337 }
338 if (!npartitions)
339 new_partition ("empty");
a66dc285
JH
340}
341
342/* Helper function for qsort; sort nodes by order. */
343static int
344node_cmp (const void *pa, const void *pb)
345{
346 const struct cgraph_node *a = *(const struct cgraph_node * const *) pa;
347 const struct cgraph_node *b = *(const struct cgraph_node * const *) pb;
9cec31f4
ML
348
349 /* Profile reorder flag enables function reordering based on first execution
350 of a function. All functions with profile are placed in ascending
351 order at the beginning. */
352
353 if (flag_profile_reorder_functions)
354 {
355 /* Functions with time profile are sorted in ascending order. */
356 if (a->tp_first_run && b->tp_first_run)
357 return a->tp_first_run != b->tp_first_run
358 ? a->tp_first_run - b->tp_first_run
359 : a->order - b->order;
360
361 /* Functions with time profile are sorted before the functions
362 that do not have the profile. */
363 if (a->tp_first_run || b->tp_first_run)
364 return b->tp_first_run - a->tp_first_run;
365 }
366
67348ccc 367 return b->order - a->order;
a66dc285
JH
368}
369
370/* Helper function for qsort; sort nodes by order. */
371static int
372varpool_node_cmp (const void *pa, const void *pb)
373{
2c8326a5
OE
374 const varpool_node *a = *(const varpool_node * const *) pa;
375 const varpool_node *b = *(const varpool_node * const *) pb;
67348ccc 376 return b->order - a->order;
a66dc285
JH
377}
378
379/* Group cgraph nodes into equally-sized partitions.
380
381 The partitioning algorithm is simple: nodes are taken in predefined order.
382 The order corresponds to the order we want functions to have in the final
383 output. In the future this will be given by function reordering pass, but
384 at the moment we use the topological order, which is a good approximation.
385
386 The goal is to partition this linear order into intervals (partitions) so
387 that all the partitions have approximately the same size and the number of
388 callgraph or IPA reference edges crossing boundaries is minimal.
389
390 This is a lot faster (O(n) in size of callgraph) than algorithms doing
391 priority-based graph clustering that are generally O(n^2) and, since
392 WHOPR is designed to make things go well across partitions, it leads
393 to good results.
394
395 We compute the expected size of a partition as:
396
397 max (total_size / lto_partitions, min_partition_size)
398
399 We use dynamic expected size of partition so small programs are partitioned
400 into enough partitions to allow use of multiple CPUs, while large programs
401 are not partitioned too much. Creating too many partitions significantly
402 increases the streaming overhead.
403
404 In the future, we would like to bound the maximal size of partitions so as
405 to prevent the LTRANS stage from consuming too much memory. At the moment,
406 however, the WPA stage is the most memory intensive for large benchmarks,
407 since too many types and declarations are read into memory.
408
409 The function implements a simple greedy algorithm. Nodes are being added
410 to the current partition until after 3/4 of the expected partition size is
411 reached. Past this threshold, we keep track of boundary size (number of
412 edges going to other partitions) and continue adding functions until after
413 the current partition has grown to twice the expected partition size. Then
414 the process is undone to the point where the minimal ratio of boundary size
415 and in-partition calls was reached. */
416
417void
783dab6b 418lto_balanced_map (int n_lto_partitions)
a66dc285
JH
419{
420 int n_nodes = 0;
c525ba9a 421 int n_varpool_nodes = 0, varpool_pos = 0, best_varpool_pos = 0;
a66dc285 422 struct cgraph_node **order = XNEWVEC (struct cgraph_node *, cgraph_max_uid);
2c8326a5 423 varpool_node **varpool_order = NULL;
6a49f3c9 424 int i;
a66dc285
JH
425 struct cgraph_node *node;
426 int total_size = 0, best_total_size = 0;
427 int partition_size;
428 ltrans_partition partition;
7b99cca4 429 int last_visited_node = 0;
2c8326a5 430 varpool_node *vnode;
a66dc285 431 int cost = 0, internal = 0;
7b99cca4 432 int best_n_nodes = 0, best_i = 0, best_cost =
a66dc285
JH
433 INT_MAX, best_internal = 0;
434 int npartitions;
435 int current_order = -1;
436
65c70e6b 437 FOR_EACH_VARIABLE (vnode)
67348ccc 438 gcc_assert (!vnode->aux);
a66dc285 439
6a49f3c9 440 FOR_EACH_DEFINED_FUNCTION (node)
96451279 441 if (symtab_get_symbol_partitioning_class (node) == SYMBOL_PARTITION)
6a49f3c9
JH
442 {
443 order[n_nodes++] = node;
39434bce
JH
444 if (!node->alias)
445 total_size += inline_summary (node)->size;
6a49f3c9 446 }
a66dc285 447
6a49f3c9
JH
448 /* Streaming works best when the source units do not cross partition
449 boundaries much. This is because importing function from a source
450 unit tends to import a lot of global trees defined there. We should
451 get better about minimizing the function bounday, but until that
452 things works smoother if we order in source order. */
453 qsort (order, n_nodes, sizeof (struct cgraph_node *), node_cmp);
9cec31f4
ML
454
455 if (cgraph_dump_file)
456 for(i = 0; i < n_nodes; i++)
457 fprintf (cgraph_dump_file, "Balanced map symbol order:%s:%u\n", order[i]->name (), order[i]->tp_first_run);
458
a66dc285
JH
459 if (!flag_toplevel_reorder)
460 {
65c70e6b 461 FOR_EACH_VARIABLE (vnode)
96451279 462 if (symtab_get_symbol_partitioning_class (vnode) == SYMBOL_PARTITION)
a66dc285 463 n_varpool_nodes++;
2c8326a5 464 varpool_order = XNEWVEC (varpool_node *, n_varpool_nodes);
a66dc285
JH
465
466 n_varpool_nodes = 0;
65c70e6b 467 FOR_EACH_VARIABLE (vnode)
96451279 468 if (symtab_get_symbol_partitioning_class (vnode) == SYMBOL_PARTITION)
a66dc285 469 varpool_order[n_varpool_nodes++] = vnode;
2c8326a5 470 qsort (varpool_order, n_varpool_nodes, sizeof (varpool_node *),
a66dc285
JH
471 varpool_node_cmp);
472 }
473
474 /* Compute partition size and create the first partition. */
783dab6b 475 partition_size = total_size / n_lto_partitions;
a66dc285
JH
476 if (partition_size < PARAM_VALUE (MIN_PARTITION_SIZE))
477 partition_size = PARAM_VALUE (MIN_PARTITION_SIZE);
478 npartitions = 1;
479 partition = new_partition ("");
480 if (cgraph_dump_file)
481 fprintf (cgraph_dump_file, "Total unit size: %i, partition size: %i\n",
482 total_size, partition_size);
483
484 for (i = 0; i < n_nodes; i++)
485 {
67348ccc 486 if (symbol_partitioned_p (order[i]))
a66dc285
JH
487 continue;
488
67348ccc 489 current_order = order[i]->order;
a66dc285
JH
490
491 if (!flag_toplevel_reorder)
960bfb69 492 while (varpool_pos < n_varpool_nodes
67348ccc 493 && varpool_order[varpool_pos]->order < current_order)
a66dc285 494 {
67348ccc
DM
495 if (!symbol_partitioned_p (varpool_order[varpool_pos]))
496 add_symbol_to_partition (partition, varpool_order[varpool_pos]);
a66dc285
JH
497 varpool_pos++;
498 }
499
67348ccc 500 add_symbol_to_partition (partition, order[i]);
39434bce
JH
501 if (!order[i]->alias)
502 total_size -= inline_summary (order[i])->size;
a66dc285
JH
503
504
505 /* Once we added a new node to the partition, we also want to add
506 all referenced variables unless they was already added into some
507 earlier partition.
c3c445e1 508 add_symbol_to_partition adds possibly multiple nodes and
a66dc285
JH
509 variables that are needed to satisfy needs of ORDER[i].
510 We remember last visited cgraph and varpool node from last iteration
511 of outer loop that allows us to process every new addition.
512
513 At the same time we compute size of the boundary into COST. Every
514 callgraph or IPA reference edge leaving the partition contributes into
515 COST. Every edge inside partition was earlier computed as one leaving
516 it and thus we need to subtract it from COST. */
7b99cca4 517 while (last_visited_node < lto_symtab_encoder_size (partition->encoder))
a66dc285 518 {
d122681a 519 symtab_node *refs_node;
a66dc285 520 int j;
d122681a 521 struct ipa_ref *ref = NULL;
5e20cdc9 522 symtab_node *snode = lto_symtab_encoder_deref (partition->encoder,
7b99cca4 523 last_visited_node);
a66dc285 524
7de90a6c 525 if (cgraph_node *node = dyn_cast <cgraph_node *> (snode))
a66dc285
JH
526 {
527 struct cgraph_edge *edge;
528
d122681a 529 refs_node = node;
a66dc285 530
7b99cca4 531 last_visited_node++;
a66dc285 532
67348ccc 533 gcc_assert (node->definition || node->weakref);
a66dc285
JH
534
535 /* Compute boundary cost of callgraph edges. */
536 for (edge = node->callees; edge; edge = edge->next_callee)
67348ccc 537 if (edge->callee->definition)
a66dc285
JH
538 {
539 int edge_cost = edge->frequency;
7b99cca4 540 int index;
a66dc285
JH
541
542 if (!edge_cost)
543 edge_cost = 1;
544 gcc_assert (edge_cost > 0);
7b99cca4 545 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 546 edge->callee);
7b99cca4
JH
547 if (index != LCC_NOT_FOUND
548 && index < last_visited_node - 1)
549 cost -= edge_cost, internal += edge_cost;
a66dc285
JH
550 else
551 cost += edge_cost;
552 }
553 for (edge = node->callers; edge; edge = edge->next_caller)
554 {
555 int edge_cost = edge->frequency;
7b99cca4 556 int index;
a66dc285 557
67348ccc 558 gcc_assert (edge->caller->definition);
a66dc285
JH
559 if (!edge_cost)
560 edge_cost = 1;
561 gcc_assert (edge_cost > 0);
7b99cca4 562 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 563 edge->caller);
7b99cca4
JH
564 if (index != LCC_NOT_FOUND
565 && index < last_visited_node - 1)
a66dc285
JH
566 cost -= edge_cost;
567 else
568 cost += edge_cost;
569 }
570 }
571 else
572 {
d122681a 573 refs_node = snode;
7b99cca4 574 last_visited_node++;
a66dc285
JH
575 }
576
577 /* Compute boundary cost of IPA REF edges and at the same time look into
578 variables referenced from current partition and try to add them. */
d122681a 579 for (j = 0; refs_node->iterate_reference (j, ref); j++)
7de90a6c 580 if (is_a <varpool_node *> (ref->referred))
a66dc285 581 {
7b99cca4 582 int index;
a66dc285 583
d122681a 584 vnode = dyn_cast <varpool_node *> (ref->referred);
67348ccc 585 if (!vnode->definition)
a66dc285 586 continue;
67348ccc 587 if (!symbol_partitioned_p (vnode) && flag_toplevel_reorder
96451279 588 && symtab_get_symbol_partitioning_class (vnode) == SYMBOL_PARTITION)
67348ccc 589 add_symbol_to_partition (partition, vnode);
7b99cca4 590 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 591 vnode);
7b99cca4
JH
592 if (index != LCC_NOT_FOUND
593 && index < last_visited_node - 1)
a66dc285
JH
594 cost--, internal++;
595 else
596 cost++;
597 }
598 else
599 {
7b99cca4 600 int index;
a66dc285 601
d122681a 602 node = dyn_cast <cgraph_node *> (ref->referred);
67348ccc 603 if (!node->definition)
a66dc285 604 continue;
7b99cca4 605 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 606 node);
7b99cca4
JH
607 if (index != LCC_NOT_FOUND
608 && index < last_visited_node - 1)
a66dc285
JH
609 cost--, internal++;
610 else
611 cost++;
612 }
d122681a 613 for (j = 0; refs_node->iterate_referring (j, ref); j++)
7de90a6c 614 if (is_a <varpool_node *> (ref->referring))
a66dc285 615 {
7b99cca4 616 int index;
a66dc285 617
d122681a 618 vnode = dyn_cast <varpool_node *> (ref->referring);
67348ccc 619 gcc_assert (vnode->definition);
39434bce
JH
620 /* It is better to couple variables with their users, because it allows them
621 to be removed. Coupling with objects they refer to only helps to reduce
622 number of symbols promoted to hidden. */
67348ccc 623 if (!symbol_partitioned_p (vnode) && flag_toplevel_reorder
39434bce 624 && !varpool_can_remove_if_no_refs (vnode)
96451279 625 && symtab_get_symbol_partitioning_class (vnode) == SYMBOL_PARTITION)
67348ccc 626 add_symbol_to_partition (partition, vnode);
7b99cca4 627 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 628 vnode);
7b99cca4
JH
629 if (index != LCC_NOT_FOUND
630 && index < last_visited_node - 1)
a66dc285
JH
631 cost--;
632 else
633 cost++;
634 }
635 else
636 {
7b99cca4 637 int index;
a66dc285 638
d122681a 639 node = dyn_cast <cgraph_node *> (ref->referring);
67348ccc 640 gcc_assert (node->definition);
7b99cca4 641 index = lto_symtab_encoder_lookup (partition->encoder,
67348ccc 642 node);
7b99cca4
JH
643 if (index != LCC_NOT_FOUND
644 && index < last_visited_node - 1)
a66dc285
JH
645 cost--;
646 else
647 cost++;
648 }
649 }
650
651 /* If the partition is large enough, start looking for smallest boundary cost. */
652 if (partition->insns < partition_size * 3 / 4
653 || best_cost == INT_MAX
654 || ((!cost
655 || (best_internal * (HOST_WIDE_INT) cost
656 > (internal * (HOST_WIDE_INT)best_cost)))
657 && partition->insns < partition_size * 5 / 4))
658 {
659 best_cost = cost;
660 best_internal = internal;
661 best_i = i;
7b99cca4 662 best_n_nodes = lto_symtab_encoder_size (partition->encoder);
a66dc285 663 best_total_size = total_size;
c525ba9a 664 best_varpool_pos = varpool_pos;
a66dc285
JH
665 }
666 if (cgraph_dump_file)
9de04252
MJ
667 fprintf (cgraph_dump_file, "Step %i: added %s/%i, size %i, cost %i/%i "
668 "best %i/%i, step %i\n", i,
fec39fa6 669 order[i]->name (), order[i]->order,
9de04252 670 partition->insns, cost, internal,
a66dc285
JH
671 best_cost, best_internal, best_i);
672 /* Partition is too large, unwind into step when best cost was reached and
673 start new partition. */
674 if (partition->insns > 2 * partition_size)
675 {
676 if (best_i != i)
677 {
678 if (cgraph_dump_file)
679 fprintf (cgraph_dump_file, "Unwinding %i insertions to step %i\n",
680 i - best_i, best_i);
7b99cca4 681 undo_partition (partition, best_n_nodes);
c525ba9a 682 varpool_pos = best_varpool_pos;
a66dc285
JH
683 }
684 i = best_i;
685 /* When we are finished, avoid creating empty partition. */
67348ccc 686 while (i < n_nodes - 1 && symbol_partitioned_p (order[i + 1]))
a66dc285
JH
687 i++;
688 if (i == n_nodes - 1)
689 break;
690 partition = new_partition ("");
7b99cca4 691 last_visited_node = 0;
a66dc285
JH
692 total_size = best_total_size;
693 cost = 0;
694
695 if (cgraph_dump_file)
696 fprintf (cgraph_dump_file, "New partition\n");
697 best_n_nodes = 0;
a66dc285
JH
698 best_cost = INT_MAX;
699
700 /* Since the size of partitions is just approximate, update the size after
701 we finished current one. */
783dab6b
RB
702 if (npartitions < n_lto_partitions)
703 partition_size = total_size / (n_lto_partitions - npartitions);
a66dc285
JH
704 else
705 partition_size = INT_MAX;
706
707 if (partition_size < PARAM_VALUE (MIN_PARTITION_SIZE))
708 partition_size = PARAM_VALUE (MIN_PARTITION_SIZE);
709 npartitions ++;
710 }
711 }
712
713 /* Varables that are not reachable from the code go into last partition. */
714 if (flag_toplevel_reorder)
715 {
65c70e6b 716 FOR_EACH_VARIABLE (vnode)
96451279 717 if (symtab_get_symbol_partitioning_class (vnode) == SYMBOL_PARTITION
67348ccc
DM
718 && !symbol_partitioned_p (vnode))
719 add_symbol_to_partition (partition, vnode);
a66dc285
JH
720 }
721 else
722 {
723 while (varpool_pos < n_varpool_nodes)
724 {
67348ccc
DM
725 if (!symbol_partitioned_p (varpool_order[varpool_pos]))
726 add_symbol_to_partition (partition, varpool_order[varpool_pos]);
a66dc285
JH
727 varpool_pos++;
728 }
729 free (varpool_order);
730 }
731 free (order);
732}
733
64cfa6c0
JH
734/* Mangle NODE symbol name into a local name.
735 This is necessary to do
736 1) if two or more static vars of same assembler name
737 are merged into single ltrans unit.
738 2) if prevoiusly static var was promoted hidden to avoid possible conflict
739 with symbols defined out of the LTO world.
740*/
741
8ee05051 742static bool
5e20cdc9 743privatize_symbol_name (symtab_node *node)
64cfa6c0 744{
67348ccc 745 tree decl = node->decl;
64cfa6c0 746 const char *name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl));
64cfa6c0
JH
747
748 /* Our renaming machinery do not handle more than one change of assembler name.
749 We should not need more than one anyway. */
67348ccc
DM
750 if (node->lto_file_data
751 && lto_get_decl_name_mapping (node->lto_file_data, name) != name)
64cfa6c0
JH
752 {
753 if (cgraph_dump_file)
754 fprintf (cgraph_dump_file,
755 "Not privatizing symbol name: %s. It privatized already.\n",
756 name);
8ee05051 757 return false;
64cfa6c0
JH
758 }
759 /* Avoid mangling of already mangled clones.
760 ??? should have a flag whether a symbol has a 'private' name already,
761 since we produce some symbols like that i.e. for global constructors
762 that are not really clones. */
67348ccc 763 if (node->unique_name)
64cfa6c0
JH
764 {
765 if (cgraph_dump_file)
766 fprintf (cgraph_dump_file,
767 "Not privatizing symbol name: %s. Has unique name.\n",
768 name);
8ee05051 769 return false;
64cfa6c0 770 }
64cfa6c0 771 change_decl_assembler_name (decl, clone_function_name (decl, "lto_priv"));
67348ccc
DM
772 if (node->lto_file_data)
773 lto_record_renamed_decl (node->lto_file_data, name,
64cfa6c0
JH
774 IDENTIFIER_POINTER
775 (DECL_ASSEMBLER_NAME (decl)));
776 if (cgraph_dump_file)
777 fprintf (cgraph_dump_file,
778 "Privatizing symbol name: %s -> %s\n",
779 name, IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl)));
8ee05051 780 return true;
64cfa6c0
JH
781}
782
a66dc285
JH
783/* Promote variable VNODE to be static. */
784
b4661bfe 785static void
5e20cdc9 786promote_symbol (symtab_node *node)
a66dc285 787{
b4661bfe 788 /* We already promoted ... */
67348ccc
DM
789 if (DECL_VISIBILITY (node->decl) == VISIBILITY_HIDDEN
790 && DECL_VISIBILITY_SPECIFIED (node->decl)
791 && TREE_PUBLIC (node->decl))
b4661bfe 792 return;
a66dc285 793
67348ccc
DM
794 gcc_checking_assert (!TREE_PUBLIC (node->decl)
795 && !DECL_EXTERNAL (node->decl));
64cfa6c0
JH
796 /* Be sure that newly public symbol does not conflict with anything already
797 defined by the non-LTO part. */
798 privatize_symbol_name (node);
67348ccc
DM
799 TREE_PUBLIC (node->decl) = 1;
800 DECL_VISIBILITY (node->decl) = VISIBILITY_HIDDEN;
801 DECL_VISIBILITY_SPECIFIED (node->decl) = true;
a66dc285
JH
802 if (cgraph_dump_file)
803 fprintf (cgraph_dump_file,
fec39fa6 804 "Promoting as hidden: %s\n", node->name ());
a66dc285
JH
805}
806
64cfa6c0
JH
807/* Return true if NODE needs named section even if it won't land in the partition
808 symbol table.
809 FIXME: we should really not use named sections for inline clones and master clones. */
810
811static bool
5e20cdc9 812may_need_named_section_p (lto_symtab_encoder_t encoder, symtab_node *node)
64cfa6c0 813{
7de90a6c 814 struct cgraph_node *cnode = dyn_cast <cgraph_node *> (node);
64cfa6c0
JH
815 if (!cnode)
816 return false;
817 if (symtab_real_symbol_p (node))
818 return false;
64cfa6c0
JH
819 return (!encoder
820 || (lto_symtab_encoder_lookup (encoder, node) != LCC_NOT_FOUND
821 && lto_symtab_encoder_encode_body_p (encoder,
822 cnode)));
823}
824
825/* If NODE represents a static variable. See if there are other variables
826 of the same name in partition ENCODER (or in whole compilation unit if
827 ENCODER is NULL) and if so, mangle the statics. Always mangle all
828 conflicting statics, so we reduce changes of silently miscompiling
9cec31f4 829 asm statements referring to them by symbol name. */
64cfa6c0
JH
830
831static void
5e20cdc9 832rename_statics (lto_symtab_encoder_t encoder, symtab_node *node)
64cfa6c0 833{
67348ccc 834 tree decl = node->decl;
5e20cdc9 835 symtab_node *s;
64cfa6c0
JH
836 tree name = DECL_ASSEMBLER_NAME (decl);
837
838 /* See if this is static symbol. */
67348ccc 839 if ((node->externally_visible
64cfa6c0
JH
840 /* FIXME: externally_visible is somewhat illogically not set for
841 external symbols (i.e. those not defined). Remove this test
842 once this is fixed. */
67348ccc 843 || DECL_EXTERNAL (node->decl)
64cfa6c0 844 || !symtab_real_symbol_p (node))
08346abd 845 && !may_need_named_section_p (encoder, node))
64cfa6c0
JH
846 return;
847
848 /* Now walk symbols sharing the same name and see if there are any conflicts.
849 (all types of symbols counts here, since we can not have static of the
850 same name as external or public symbol.) */
851 for (s = symtab_node_for_asm (name);
67348ccc 852 s; s = s->next_sharing_asm_name)
64cfa6c0 853 if ((symtab_real_symbol_p (s) || may_need_named_section_p (encoder, s))
67348ccc 854 && s->decl != node->decl
64cfa6c0
JH
855 && (!encoder
856 || lto_symtab_encoder_lookup (encoder, s) != LCC_NOT_FOUND))
857 break;
858
859 /* OK, no confict, so we have nothing to do. */
860 if (!s)
861 return;
862
863 if (cgraph_dump_file)
864 fprintf (cgraph_dump_file,
fec39fa6 865 "Renaming statics with asm name: %s\n", node->name ());
64cfa6c0
JH
866
867 /* Assign every symbol in the set that shares the same ASM name an unique
868 mangled name. */
869 for (s = symtab_node_for_asm (name); s;)
67348ccc 870 if (!s->externally_visible
64cfa6c0 871 && ((symtab_real_symbol_p (s)
67348ccc
DM
872 && !DECL_EXTERNAL (node->decl)
873 && !TREE_PUBLIC (node->decl))
64cfa6c0
JH
874 || may_need_named_section_p (encoder, s))
875 && (!encoder
876 || lto_symtab_encoder_lookup (encoder, s) != LCC_NOT_FOUND))
877 {
8ee05051 878 if (privatize_symbol_name (s))
1aa95df7 879 /* Re-start from beginning since we do not know how many symbols changed a name. */
8ee05051 880 s = symtab_node_for_asm (name);
67348ccc 881 else s = s->next_sharing_asm_name;
64cfa6c0 882 }
67348ccc 883 else s = s->next_sharing_asm_name;
64cfa6c0 884}
b4661bfe 885
a66dc285
JH
886/* Find out all static decls that need to be promoted to global because
887 of cross file sharing. This function must be run in the WPA mode after
888 all inlinees are added. */
889
890void
891lto_promote_cross_file_statics (void)
892{
a66dc285 893 unsigned i, n_sets;
a66dc285
JH
894
895 gcc_assert (flag_wpa);
896
b4661bfe 897 /* First compute boundaries. */
9771b263 898 n_sets = ltrans_partitions.length ();
a66dc285
JH
899 for (i = 0; i < n_sets; i++)
900 {
901 ltrans_partition part
9771b263 902 = ltrans_partitions[i];
b4661bfe
JH
903 part->encoder = compute_ltrans_boundary (part->encoder);
904 }
a66dc285 905
b4661bfe
JH
906 /* Look at boundaries and promote symbols as needed. */
907 for (i = 0; i < n_sets; i++)
908 {
909 lto_symtab_encoder_iterator lsei;
64cfa6c0 910 lto_symtab_encoder_t encoder = ltrans_partitions[i]->encoder;
a66dc285 911
b4661bfe
JH
912 for (lsei = lsei_start (encoder); !lsei_end_p (lsei);
913 lsei_next (&lsei))
914 {
5e20cdc9 915 symtab_node *node = lsei_node (lsei);
b4661bfe 916
64cfa6c0
JH
917 /* If symbol is static, rename it if its assembler name clash with
918 anything else in this unit. */
919 rename_statics (encoder, node);
920
b4661bfe 921 /* No need to promote if symbol already is externally visible ... */
67348ccc 922 if (node->externally_visible
b4661bfe
JH
923 /* ... or if it is part of current partition ... */
924 || lto_symtab_encoder_in_partition_p (encoder, node)
925 /* ... or if we do not partition it. This mean that it will
926 appear in every partition refernecing it. */
96451279 927 || symtab_get_symbol_partitioning_class (node) != SYMBOL_PARTITION)
b4661bfe 928 continue;
a66dc285 929
b4661bfe
JH
930 promote_symbol (node);
931 }
a66dc285 932 }
a66dc285 933}
64cfa6c0
JH
934
935/* Rename statics in the whole unit in the case that
936 we do -flto-partition=none. */
937
938void
939lto_promote_statics_nonwpa (void)
940{
5e20cdc9 941 symtab_node *node;
64cfa6c0
JH
942 FOR_EACH_SYMBOL (node)
943 rename_statics (NULL, node);
944}