]>
Commit | Line | Data |
---|---|---|
5d94cf4d | 1 | /* Tree inlining. |
711789cc | 2 | Copyright (C) 2001-2013 Free Software Foundation, Inc. |
1431bff6 | 3 | Contributed by Alexandre Oliva <aoliva@redhat.com> |
4 | ||
5a8b6e6a | 5 | This file is part of GCC. |
1431bff6 | 6 | |
5a8b6e6a | 7 | GCC is free software; you can redistribute it and/or modify |
1431bff6 | 8 | it under the terms of the GNU General Public License as published by |
8c4c00c1 | 9 | the Free Software Foundation; either version 3, or (at your option) |
1431bff6 | 10 | any later version. |
11 | ||
5a8b6e6a | 12 | GCC is distributed in the hope that it will be useful, |
1431bff6 | 13 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | GNU General Public License for more details. | |
16 | ||
17 | You should have received a copy of the GNU General Public License | |
8c4c00c1 | 18 | along with GCC; see the file COPYING3. If not see |
19 | <http://www.gnu.org/licenses/>. */ | |
1431bff6 | 20 | |
21 | #include "config.h" | |
22 | #include "system.h" | |
805e22b2 | 23 | #include "coretypes.h" |
24 | #include "tm.h" | |
0b205f4c | 25 | #include "diagnostic-core.h" |
1431bff6 | 26 | #include "tree.h" |
9ed99284 | 27 | #include "stor-layout.h" |
28 | #include "calls.h" | |
1431bff6 | 29 | #include "tree-inline.h" |
e343483a | 30 | #include "flags.h" |
31 | #include "params.h" | |
32 | #include "input.h" | |
33 | #include "insn-config.h" | |
e343483a | 34 | #include "hashtab.h" |
b0278d39 | 35 | #include "langhooks.h" |
e27482aa | 36 | #include "basic-block.h" |
37 | #include "tree-iterator.h" | |
9bc3739f | 38 | #include "intl.h" |
bc61cadb | 39 | #include "pointer-set.h" |
40 | #include "tree-ssa-alias.h" | |
41 | #include "internal-fn.h" | |
42 | #include "gimple-fold.h" | |
43 | #include "tree-eh.h" | |
44 | #include "gimple-expr.h" | |
45 | #include "is-a.h" | |
e795d6e1 | 46 | #include "gimple.h" |
a8783bee | 47 | #include "gimplify.h" |
dcf1a1ec | 48 | #include "gimple-iterator.h" |
e795d6e1 | 49 | #include "gimplify-me.h" |
dcf1a1ec | 50 | #include "gimple-walk.h" |
073c1fd5 | 51 | #include "gimple-ssa.h" |
52 | #include "tree-cfg.h" | |
53 | #include "tree-phinodes.h" | |
54 | #include "ssa-iterators.h" | |
9ed99284 | 55 | #include "stringpool.h" |
073c1fd5 | 56 | #include "tree-ssanames.h" |
57 | #include "tree-into-ssa.h" | |
9ed99284 | 58 | #include "expr.h" |
073c1fd5 | 59 | #include "tree-dfa.h" |
69ee5dbb | 60 | #include "tree-ssa.h" |
b0cdf642 | 61 | #include "function.h" |
ce084dfc | 62 | #include "tree-pretty-print.h" |
e27482aa | 63 | #include "except.h" |
9e45f419 | 64 | #include "debug.h" |
c5235c0b | 65 | #include "ipa-prop.h" |
4992f399 | 66 | #include "value-prof.h" |
deff5ffd | 67 | #include "tree-pass.h" |
7cc6d7a8 | 68 | #include "target.h" |
f6568ea4 | 69 | #include "cfgloop.h" |
e343483a | 70 | |
8e3cb73b | 71 | #include "rtl.h" /* FIXME: For asm_str_count. */ |
72 | ||
4ee9c684 | 73 | /* I'm not real happy about this, but we need to handle gimple and |
74 | non-gimple trees. */ | |
1431bff6 | 75 | |
51a48c27 | 76 | /* Inlining, Cloning, Versioning, Parallelization |
e27482aa | 77 | |
78 | Inlining: a function body is duplicated, but the PARM_DECLs are | |
79 | remapped into VAR_DECLs, and non-void RETURN_EXPRs become | |
75a70cf9 | 80 | MODIFY_EXPRs that store to a dedicated returned-value variable. |
e27482aa | 81 | The duplicated eh_region info of the copy will later be appended |
82 | to the info for the caller; the eh_region info in copied throwing | |
e38def9c | 83 | statements and RESX statements are adjusted accordingly. |
e27482aa | 84 | |
e27482aa | 85 | Cloning: (only in C++) We have one body for a con/de/structor, and |
86 | multiple function decls, each with a unique parameter list. | |
87 | Duplicate the body, using the given splay tree; some parameters | |
88 | will become constants (like 0 or 1). | |
89 | ||
51a48c27 | 90 | Versioning: a function body is duplicated and the result is a new |
91 | function, rather than being copied into blocks of an existing | |
92 | function as with inlining. Some parameters will become constants. | |
93 | ||
94 | Parallelization: a region of a function is duplicated resulting in | |
95 | a new function. Variables may be replaced with complex expressions | |
96 | to enable shared variable semantics. | |
97 | ||
e27482aa | 98 | All of these will simultaneously look up any callgraph edges. If |
99 | we're going to inline the duplicated function body, and the given | |
100 | function has some cloned callgraph nodes (one for each place this | |
101 | function will be inlined) those callgraph edges will be duplicated. | |
51a48c27 | 102 | If we're cloning the body, those callgraph edges will be |
e27482aa | 103 | updated to point into the new body. (Note that the original |
104 | callgraph node and edge list will not be altered.) | |
105 | ||
75a70cf9 | 106 | See the CALL_EXPR handling case in copy_tree_body_r (). */ |
e27482aa | 107 | |
e343483a | 108 | /* To Do: |
109 | ||
110 | o In order to make inlining-on-trees work, we pessimized | |
111 | function-local static constants. In particular, they are now | |
112 | always output, even when not addressed. Fix this by treating | |
113 | function-local static constants just like global static | |
114 | constants; the back-end already knows not to output them if they | |
115 | are not needed. | |
116 | ||
117 | o Provide heuristics to clamp inlining of recursive template | |
118 | calls? */ | |
119 | ||
bc8bb825 | 120 | |
bc8bb825 | 121 | /* Weights that estimate_num_insns uses to estimate the size of the |
122 | produced code. */ | |
123 | ||
124 | eni_weights eni_size_weights; | |
125 | ||
126 | /* Weights that estimate_num_insns uses to estimate the time necessary | |
127 | to execute the produced code. */ | |
128 | ||
129 | eni_weights eni_time_weights; | |
130 | ||
e343483a | 131 | /* Prototypes. */ |
132 | ||
524a0531 | 133 | static tree declare_return_variable (copy_body_data *, tree, tree, basic_block); |
51a48c27 | 134 | static void remap_block (tree *, copy_body_data *); |
51a48c27 | 135 | static void copy_bind_expr (tree *, int *, copy_body_data *); |
e27482aa | 136 | static void declare_inline_vars (tree, tree); |
8c143e71 | 137 | static void remap_save_expr (tree *, void *, int *); |
cb302f29 | 138 | static void prepend_lexical_block (tree current_block, tree new_block); |
51a48c27 | 139 | static tree copy_decl_to_var (tree, copy_body_data *); |
25b3017b | 140 | static tree copy_result_decl_to_var (tree, copy_body_data *); |
51a48c27 | 141 | static tree copy_decl_maybe_to_var (tree, copy_body_data *); |
75a70cf9 | 142 | static gimple remap_gimple_stmt (gimple, copy_body_data *); |
31359ae8 | 143 | static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id); |
e27482aa | 144 | |
fcc73461 | 145 | /* Insert a tree->tree mapping for ID. Despite the name suggests |
146 | that the trees should be variables, it is used for more than that. */ | |
147 | ||
51a48c27 | 148 | void |
149 | insert_decl_map (copy_body_data *id, tree key, tree value) | |
fcc73461 | 150 | { |
e3022db7 | 151 | *pointer_map_insert (id->decl_map, key) = value; |
fcc73461 | 152 | |
153 | /* Always insert an identity map as well. If we see this same new | |
154 | node again, we won't want to duplicate it a second time. */ | |
155 | if (key != value) | |
e3022db7 | 156 | *pointer_map_insert (id->decl_map, value) = value; |
fcc73461 | 157 | } |
158 | ||
9845d120 | 159 | /* Insert a tree->tree mapping for ID. This is only used for |
160 | variables. */ | |
161 | ||
162 | static void | |
163 | insert_debug_decl_map (copy_body_data *id, tree key, tree value) | |
164 | { | |
165 | if (!gimple_in_ssa_p (id->src_cfun)) | |
166 | return; | |
167 | ||
168 | if (!MAY_HAVE_DEBUG_STMTS) | |
169 | return; | |
170 | ||
171 | if (!target_for_debug_bind (key)) | |
172 | return; | |
173 | ||
174 | gcc_assert (TREE_CODE (key) == PARM_DECL); | |
175 | gcc_assert (TREE_CODE (value) == VAR_DECL); | |
176 | ||
177 | if (!id->debug_map) | |
178 | id->debug_map = pointer_map_create (); | |
179 | ||
180 | *pointer_map_insert (id->debug_map, key) = value; | |
181 | } | |
182 | ||
/* Nonzero while the contents of inlined debug statements are being
   remapped.  The remapping routines set it to a negative value to
   signal an error, such as a reference to a variable that is not
   available in the inlined context.  */
static int processing_debug_stmt = 0;
188 | ||
deff5ffd | 189 | /* Construct new SSA name for old NAME. ID is the inline context. */ |
190 | ||
191 | static tree | |
192 | remap_ssa_name (tree name, copy_body_data *id) | |
193 | { | |
ec11736b | 194 | tree new_tree, var; |
e3022db7 | 195 | tree *n; |
deff5ffd | 196 | |
197 | gcc_assert (TREE_CODE (name) == SSA_NAME); | |
198 | ||
e3022db7 | 199 | n = (tree *) pointer_map_contains (id->decl_map, name); |
deff5ffd | 200 | if (n) |
50828ed8 | 201 | return unshare_expr (*n); |
deff5ffd | 202 | |
9f28a7ee | 203 | if (processing_debug_stmt) |
204 | { | |
2f4ec87c | 205 | if (SSA_NAME_IS_DEFAULT_DEF (name) |
206 | && TREE_CODE (SSA_NAME_VAR (name)) == PARM_DECL | |
841424cc | 207 | && id->entry_bb == NULL |
34154e27 | 208 | && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun))) |
841424cc | 209 | { |
210 | tree vexpr = make_node (DEBUG_EXPR_DECL); | |
211 | gimple def_temp; | |
212 | gimple_stmt_iterator gsi; | |
213 | tree val = SSA_NAME_VAR (name); | |
214 | ||
215 | n = (tree *) pointer_map_contains (id->decl_map, val); | |
216 | if (n != NULL) | |
217 | val = *n; | |
218 | if (TREE_CODE (val) != PARM_DECL) | |
219 | { | |
220 | processing_debug_stmt = -1; | |
221 | return name; | |
222 | } | |
223 | def_temp = gimple_build_debug_source_bind (vexpr, val, NULL); | |
224 | DECL_ARTIFICIAL (vexpr) = 1; | |
225 | TREE_TYPE (vexpr) = TREE_TYPE (name); | |
226 | DECL_MODE (vexpr) = DECL_MODE (SSA_NAME_VAR (name)); | |
34154e27 | 227 | gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun))); |
841424cc | 228 | gsi_insert_before (&gsi, def_temp, GSI_SAME_STMT); |
229 | return vexpr; | |
230 | } | |
231 | ||
9f28a7ee | 232 | processing_debug_stmt = -1; |
233 | return name; | |
234 | } | |
235 | ||
ec11736b | 236 | /* Remap anonymous SSA names or SSA names of anonymous decls. */ |
237 | var = SSA_NAME_VAR (name); | |
238 | if (!var | |
239 | || (!SSA_NAME_IS_DEFAULT_DEF (name) | |
240 | && TREE_CODE (var) == VAR_DECL | |
241 | && !VAR_DECL_IS_VIRTUAL_OPERAND (var) | |
242 | && DECL_ARTIFICIAL (var) | |
243 | && DECL_IGNORED_P (var) | |
244 | && !DECL_NAME (var))) | |
245 | { | |
246 | struct ptr_info_def *pi; | |
247 | new_tree = make_ssa_name (remap_type (TREE_TYPE (name), id), NULL); | |
248 | if (!var && SSA_NAME_IDENTIFIER (name)) | |
249 | SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree, SSA_NAME_IDENTIFIER (name)); | |
250 | insert_decl_map (id, name, new_tree); | |
251 | SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree) | |
252 | = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name); | |
253 | /* At least IPA points-to info can be directly transferred. */ | |
254 | if (id->src_cfun->gimple_df | |
255 | && id->src_cfun->gimple_df->ipa_pta | |
256 | && (pi = SSA_NAME_PTR_INFO (name)) | |
257 | && !pi->pt.anything) | |
258 | { | |
259 | struct ptr_info_def *new_pi = get_ptr_info (new_tree); | |
260 | new_pi->pt = pi->pt; | |
261 | } | |
262 | return new_tree; | |
263 | } | |
264 | ||
deff5ffd | 265 | /* Do not set DEF_STMT yet as statement is not copied yet. We do that |
266 | in copy_bb. */ | |
ec11736b | 267 | new_tree = remap_decl (var, id); |
75a70cf9 | 268 | |
deff5ffd | 269 | /* We might've substituted constant or another SSA_NAME for |
48e1416a | 270 | the variable. |
deff5ffd | 271 | |
272 | Replace the SSA name representing RESULT_DECL by variable during | |
273 | inlining: this saves us from need to introduce PHI node in a case | |
274 | return value is just partly initialized. */ | |
f4e36c33 | 275 | if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL) |
ec11736b | 276 | && (!SSA_NAME_VAR (name) |
277 | || TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL | |
deff5ffd | 278 | || !id->transform_return_to_modify)) |
279 | { | |
1a981e1a | 280 | struct ptr_info_def *pi; |
f4e36c33 | 281 | new_tree = make_ssa_name (new_tree, NULL); |
282 | insert_decl_map (id, name, new_tree); | |
283 | SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree) | |
deff5ffd | 284 | = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name); |
1a981e1a | 285 | /* At least IPA points-to info can be directly transferred. */ |
286 | if (id->src_cfun->gimple_df | |
287 | && id->src_cfun->gimple_df->ipa_pta | |
288 | && (pi = SSA_NAME_PTR_INFO (name)) | |
289 | && !pi->pt.anything) | |
290 | { | |
291 | struct ptr_info_def *new_pi = get_ptr_info (new_tree); | |
292 | new_pi->pt = pi->pt; | |
293 | } | |
c6dfe037 | 294 | if (SSA_NAME_IS_DEFAULT_DEF (name)) |
186f5fff | 295 | { |
296 | /* By inlining function having uninitialized variable, we might | |
297 | extend the lifetime (variable might get reused). This cause | |
298 | ICE in the case we end up extending lifetime of SSA name across | |
f0b5f617 | 299 | abnormal edge, but also increase register pressure. |
186f5fff | 300 | |
75a70cf9 | 301 | We simply initialize all uninitialized vars by 0 except |
302 | for case we are inlining to very first BB. We can avoid | |
303 | this for all BBs that are not inside strongly connected | |
304 | regions of the CFG, but this is expensive to test. */ | |
305 | if (id->entry_bb | |
2e661451 | 306 | && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name) |
ec11736b | 307 | && (!SSA_NAME_VAR (name) |
308 | || TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL) | |
34154e27 | 309 | && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), |
310 | 0)->dest | |
186f5fff | 311 | || EDGE_COUNT (id->entry_bb->preds) != 1)) |
312 | { | |
75a70cf9 | 313 | gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb); |
314 | gimple init_stmt; | |
385f3f36 | 315 | tree zero = build_zero_cst (TREE_TYPE (new_tree)); |
48e1416a | 316 | |
385f3f36 | 317 | init_stmt = gimple_build_assign (new_tree, zero); |
75a70cf9 | 318 | gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT); |
f4e36c33 | 319 | SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0; |
186f5fff | 320 | } |
321 | else | |
322 | { | |
f4e36c33 | 323 | SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop (); |
c6dfe037 | 324 | set_ssa_default_def (cfun, SSA_NAME_VAR (new_tree), new_tree); |
186f5fff | 325 | } |
326 | } | |
deff5ffd | 327 | } |
328 | else | |
f4e36c33 | 329 | insert_decl_map (id, name, new_tree); |
330 | return new_tree; | |
deff5ffd | 331 | } |
332 | ||
e27482aa | 333 | /* Remap DECL during the copying of the BLOCK tree for the function. */ |
e343483a | 334 | |
51a48c27 | 335 | tree |
336 | remap_decl (tree decl, copy_body_data *id) | |
e343483a | 337 | { |
e3022db7 | 338 | tree *n; |
e27482aa | 339 | |
340 | /* We only remap local variables in the current function. */ | |
ecba2e4c | 341 | |
e27482aa | 342 | /* See if we have remapped this declaration. */ |
343 | ||
e3022db7 | 344 | n = (tree *) pointer_map_contains (id->decl_map, decl); |
e27482aa | 345 | |
9845d120 | 346 | if (!n && processing_debug_stmt) |
347 | { | |
348 | processing_debug_stmt = -1; | |
349 | return decl; | |
350 | } | |
351 | ||
e27482aa | 352 | /* If we didn't already have an equivalent for this declaration, |
353 | create one now. */ | |
e343483a | 354 | if (!n) |
355 | { | |
e343483a | 356 | /* Make a copy of the variable or label. */ |
51a48c27 | 357 | tree t = id->copy_decl (decl, id); |
48e1416a | 358 | |
f10b7a77 | 359 | /* Remember it, so that if we encounter this local entity again |
360 | we can reuse this copy. Do this early because remap_type may | |
361 | need this decl for TYPE_STUB_DECL. */ | |
362 | insert_decl_map (id, decl, t); | |
363 | ||
51a48c27 | 364 | if (!DECL_P (t)) |
365 | return t; | |
366 | ||
ecba2e4c | 367 | /* Remap types, if necessary. */ |
368 | TREE_TYPE (t) = remap_type (TREE_TYPE (t), id); | |
369 | if (TREE_CODE (t) == TYPE_DECL) | |
370 | DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id); | |
ecba2e4c | 371 | |
372 | /* Remap sizes as necessary. */ | |
75a70cf9 | 373 | walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL); |
374 | walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL); | |
e343483a | 375 | |
fbf0afd1 | 376 | /* If fields, do likewise for offset and qualifier. */ |
1f8a6ff8 | 377 | if (TREE_CODE (t) == FIELD_DECL) |
378 | { | |
75a70cf9 | 379 | walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL); |
1f8a6ff8 | 380 | if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE) |
75a70cf9 | 381 | walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL); |
1f8a6ff8 | 382 | } |
383 | ||
fcc73461 | 384 | return t; |
e343483a | 385 | } |
386 | ||
4189e677 | 387 | if (id->do_not_unshare) |
388 | return *n; | |
389 | else | |
390 | return unshare_expr (*n); | |
e343483a | 391 | } |
392 | ||
ecba2e4c | 393 | static tree |
51a48c27 | 394 | remap_type_1 (tree type, copy_body_data *id) |
ecba2e4c | 395 | { |
f4e36c33 | 396 | tree new_tree, t; |
ecba2e4c | 397 | |
a3575815 | 398 | /* We do need a copy. build and register it now. If this is a pointer or |
399 | reference type, remap the designated type and make a new pointer or | |
400 | reference type. */ | |
401 | if (TREE_CODE (type) == POINTER_TYPE) | |
402 | { | |
f4e36c33 | 403 | new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id), |
a3575815 | 404 | TYPE_MODE (type), |
405 | TYPE_REF_CAN_ALIAS_ALL (type)); | |
e1f1071c | 406 | if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type)) |
407 | new_tree = build_type_attribute_qual_variant (new_tree, | |
408 | TYPE_ATTRIBUTES (type), | |
409 | TYPE_QUALS (type)); | |
f4e36c33 | 410 | insert_decl_map (id, type, new_tree); |
411 | return new_tree; | |
a3575815 | 412 | } |
413 | else if (TREE_CODE (type) == REFERENCE_TYPE) | |
414 | { | |
f4e36c33 | 415 | new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id), |
a3575815 | 416 | TYPE_MODE (type), |
417 | TYPE_REF_CAN_ALIAS_ALL (type)); | |
e1f1071c | 418 | if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type)) |
419 | new_tree = build_type_attribute_qual_variant (new_tree, | |
420 | TYPE_ATTRIBUTES (type), | |
421 | TYPE_QUALS (type)); | |
f4e36c33 | 422 | insert_decl_map (id, type, new_tree); |
423 | return new_tree; | |
a3575815 | 424 | } |
425 | else | |
f4e36c33 | 426 | new_tree = copy_node (type); |
a3575815 | 427 | |
f4e36c33 | 428 | insert_decl_map (id, type, new_tree); |
ecba2e4c | 429 | |
430 | /* This is a new type, not a copy of an old type. Need to reassociate | |
431 | variants. We can handle everything except the main variant lazily. */ | |
432 | t = TYPE_MAIN_VARIANT (type); | |
433 | if (type != t) | |
434 | { | |
435 | t = remap_type (t, id); | |
f4e36c33 | 436 | TYPE_MAIN_VARIANT (new_tree) = t; |
437 | TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t); | |
438 | TYPE_NEXT_VARIANT (t) = new_tree; | |
ecba2e4c | 439 | } |
440 | else | |
441 | { | |
f4e36c33 | 442 | TYPE_MAIN_VARIANT (new_tree) = new_tree; |
443 | TYPE_NEXT_VARIANT (new_tree) = NULL; | |
ecba2e4c | 444 | } |
445 | ||
f10b7a77 | 446 | if (TYPE_STUB_DECL (type)) |
f4e36c33 | 447 | TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id); |
f10b7a77 | 448 | |
ecba2e4c | 449 | /* Lazily create pointer and reference types. */ |
f4e36c33 | 450 | TYPE_POINTER_TO (new_tree) = NULL; |
451 | TYPE_REFERENCE_TO (new_tree) = NULL; | |
ecba2e4c | 452 | |
f4e36c33 | 453 | switch (TREE_CODE (new_tree)) |
ecba2e4c | 454 | { |
455 | case INTEGER_TYPE: | |
456 | case REAL_TYPE: | |
06f0b99c | 457 | case FIXED_POINT_TYPE: |
ecba2e4c | 458 | case ENUMERAL_TYPE: |
459 | case BOOLEAN_TYPE: | |
f4e36c33 | 460 | t = TYPE_MIN_VALUE (new_tree); |
ecba2e4c | 461 | if (t && TREE_CODE (t) != INTEGER_CST) |
f4e36c33 | 462 | walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL); |
ab7083b0 | 463 | |
f4e36c33 | 464 | t = TYPE_MAX_VALUE (new_tree); |
ecba2e4c | 465 | if (t && TREE_CODE (t) != INTEGER_CST) |
f4e36c33 | 466 | walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL); |
467 | return new_tree; | |
b27ac6b5 | 468 | |
ecba2e4c | 469 | case FUNCTION_TYPE: |
f4e36c33 | 470 | TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id); |
471 | walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL); | |
472 | return new_tree; | |
ecba2e4c | 473 | |
474 | case ARRAY_TYPE: | |
f4e36c33 | 475 | TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id); |
476 | TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id); | |
ecba2e4c | 477 | break; |
478 | ||
479 | case RECORD_TYPE: | |
480 | case UNION_TYPE: | |
481 | case QUAL_UNION_TYPE: | |
03908818 | 482 | { |
483 | tree f, nf = NULL; | |
484 | ||
1767a056 | 485 | for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f)) |
03908818 | 486 | { |
487 | t = remap_decl (f, id); | |
f4e36c33 | 488 | DECL_CONTEXT (t) = new_tree; |
1767a056 | 489 | DECL_CHAIN (t) = nf; |
03908818 | 490 | nf = t; |
491 | } | |
f4e36c33 | 492 | TYPE_FIELDS (new_tree) = nreverse (nf); |
03908818 | 493 | } |
ecba2e4c | 494 | break; |
495 | ||
ecba2e4c | 496 | case OFFSET_TYPE: |
497 | default: | |
498 | /* Shouldn't have been thought variable sized. */ | |
8c0963c4 | 499 | gcc_unreachable (); |
ecba2e4c | 500 | } |
501 | ||
f4e36c33 | 502 | walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL); |
503 | walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL); | |
ecba2e4c | 504 | |
f4e36c33 | 505 | return new_tree; |
ecba2e4c | 506 | } |
507 | ||
51a48c27 | 508 | tree |
509 | remap_type (tree type, copy_body_data *id) | |
03908818 | 510 | { |
e3022db7 | 511 | tree *node; |
ed6049c8 | 512 | tree tmp; |
03908818 | 513 | |
514 | if (type == NULL) | |
515 | return type; | |
516 | ||
517 | /* See if we have remapped this type. */ | |
e3022db7 | 518 | node = (tree *) pointer_map_contains (id->decl_map, type); |
03908818 | 519 | if (node) |
e3022db7 | 520 | return *node; |
03908818 | 521 | |
522 | /* The type only needs remapping if it's variably modified. */ | |
51a48c27 | 523 | if (! variably_modified_type_p (type, id->src_fn)) |
03908818 | 524 | { |
525 | insert_decl_map (id, type, type); | |
526 | return type; | |
527 | } | |
528 | ||
ed6049c8 | 529 | id->remapping_type_depth++; |
530 | tmp = remap_type_1 (type, id); | |
531 | id->remapping_type_depth--; | |
532 | ||
533 | return tmp; | |
03908818 | 534 | } |
535 | ||
4b5d70fd | 536 | /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */ |
48e1416a | 537 | |
4b5d70fd | 538 | static bool |
539 | can_be_nonlocal (tree decl, copy_body_data *id) | |
540 | { | |
541 | /* We can not duplicate function decls. */ | |
542 | if (TREE_CODE (decl) == FUNCTION_DECL) | |
543 | return true; | |
544 | ||
545 | /* Local static vars must be non-local or we get multiple declaration | |
546 | problems. */ | |
547 | if (TREE_CODE (decl) == VAR_DECL | |
548 | && !auto_var_in_fn_p (decl, id->src_fn)) | |
549 | return true; | |
550 | ||
4ae5778c | 551 | return false; |
4b5d70fd | 552 | } |
553 | ||
4ee9c684 | 554 | static tree |
d66d56be | 555 | remap_decls (tree decls, vec<tree, va_gc> **nonlocalized_list, |
f1f41a6c | 556 | copy_body_data *id) |
e343483a | 557 | { |
4ee9c684 | 558 | tree old_var; |
559 | tree new_decls = NULL_TREE; | |
e343483a | 560 | |
4ee9c684 | 561 | /* Remap its variables. */ |
1767a056 | 562 | for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var)) |
e343483a | 563 | { |
4ee9c684 | 564 | tree new_var; |
565 | ||
4b5d70fd | 566 | if (can_be_nonlocal (old_var, id)) |
127d7f21 | 567 | { |
4ae5778c | 568 | /* We need to add this variable to the local decls as otherwise |
569 | nothing else will do so. */ | |
4b5d70fd | 570 | if (TREE_CODE (old_var) == VAR_DECL |
4ae5778c | 571 | && ! DECL_EXTERNAL (old_var)) |
2ab2ce89 | 572 | add_local_decl (cfun, old_var); |
0c1c155a | 573 | if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE) |
4b5d70fd | 574 | && !DECL_IGNORED_P (old_var) |
575 | && nonlocalized_list) | |
d66d56be | 576 | vec_safe_push (*nonlocalized_list, old_var); |
127d7f21 | 577 | continue; |
578 | } | |
579 | ||
4ee9c684 | 580 | /* Remap the variable. */ |
581 | new_var = remap_decl (old_var, id); | |
582 | ||
75a70cf9 | 583 | /* If we didn't remap this variable, we can't mess with its |
4ee9c684 | 584 | TREE_CHAIN. If we remapped this variable to the return slot, it's |
585 | already declared somewhere else, so don't declare it here. */ | |
48e1416a | 586 | |
4b5d70fd | 587 | if (new_var == id->retvar) |
4ee9c684 | 588 | ; |
4b5d70fd | 589 | else if (!new_var) |
590 | { | |
0c1c155a | 591 | if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE) |
4b5d70fd | 592 | && !DECL_IGNORED_P (old_var) |
593 | && nonlocalized_list) | |
d66d56be | 594 | vec_safe_push (*nonlocalized_list, old_var); |
4b5d70fd | 595 | } |
e343483a | 596 | else |
597 | { | |
8c0963c4 | 598 | gcc_assert (DECL_P (new_var)); |
1767a056 | 599 | DECL_CHAIN (new_var) = new_decls; |
4ee9c684 | 600 | new_decls = new_var; |
cd3ece53 | 601 | |
602 | /* Also copy value-expressions. */ | |
603 | if (TREE_CODE (new_var) == VAR_DECL | |
604 | && DECL_HAS_VALUE_EXPR_P (new_var)) | |
605 | { | |
606 | tree tem = DECL_VALUE_EXPR (new_var); | |
607 | bool old_regimplify = id->regimplify; | |
608 | id->remapping_type_depth++; | |
609 | walk_tree (&tem, copy_tree_body_r, id, NULL); | |
610 | id->remapping_type_depth--; | |
611 | id->regimplify = old_regimplify; | |
612 | SET_DECL_VALUE_EXPR (new_var, tem); | |
613 | } | |
e343483a | 614 | } |
e343483a | 615 | } |
e343483a | 616 | |
4ee9c684 | 617 | return nreverse (new_decls); |
618 | } | |
619 | ||
620 | /* Copy the BLOCK to contain remapped versions of the variables | |
621 | therein. And hook the new block into the block-tree. */ | |
622 | ||
623 | static void | |
51a48c27 | 624 | remap_block (tree *block, copy_body_data *id) |
4ee9c684 | 625 | { |
d57cd35f | 626 | tree old_block; |
627 | tree new_block; | |
d57cd35f | 628 | |
629 | /* Make the new block. */ | |
630 | old_block = *block; | |
631 | new_block = make_node (BLOCK); | |
632 | TREE_USED (new_block) = TREE_USED (old_block); | |
633 | BLOCK_ABSTRACT_ORIGIN (new_block) = old_block; | |
44276901 | 634 | BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block); |
4b5d70fd | 635 | BLOCK_NONLOCALIZED_VARS (new_block) |
f1f41a6c | 636 | = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block)); |
d57cd35f | 637 | *block = new_block; |
638 | ||
639 | /* Remap its variables. */ | |
4b5d70fd | 640 | BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block), |
d66d56be | 641 | &BLOCK_NONLOCALIZED_VARS (new_block), |
4b5d70fd | 642 | id); |
d57cd35f | 643 | |
51a48c27 | 644 | if (id->transform_lang_insert_block) |
32020b10 | 645 | id->transform_lang_insert_block (new_block); |
51a48c27 | 646 | |
d57cd35f | 647 | /* Remember the remapped block. */ |
4ee9c684 | 648 | insert_decl_map (id, old_block, new_block); |
e343483a | 649 | } |
650 | ||
b3d24a23 | 651 | /* Copy the whole block tree and root it in id->block. */ |
652 | static tree | |
51a48c27 | 653 | remap_blocks (tree block, copy_body_data *id) |
b3d24a23 | 654 | { |
655 | tree t; | |
f4e36c33 | 656 | tree new_tree = block; |
b3d24a23 | 657 | |
658 | if (!block) | |
659 | return NULL; | |
660 | ||
f4e36c33 | 661 | remap_block (&new_tree, id); |
662 | gcc_assert (new_tree != block); | |
b3d24a23 | 663 | for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t)) |
cb302f29 | 664 | prepend_lexical_block (new_tree, remap_blocks (t, id)); |
665 | /* Blocks are in arbitrary order, but make things slightly prettier and do | |
666 | not swap order when producing a copy. */ | |
667 | BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree)); | |
f4e36c33 | 668 | return new_tree; |
b3d24a23 | 669 | } |
670 | ||
c251ba7f | 671 | /* Remap the block tree rooted at BLOCK to nothing. */ |
672 | static void | |
673 | remap_blocks_to_null (tree block, copy_body_data *id) | |
674 | { | |
675 | tree t; | |
676 | insert_decl_map (id, block, NULL_TREE); | |
677 | for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t)) | |
678 | remap_blocks_to_null (t, id); | |
679 | } | |
680 | ||
e343483a | 681 | static void |
4ee9c684 | 682 | copy_statement_list (tree *tp) |
e343483a | 683 | { |
4ee9c684 | 684 | tree_stmt_iterator oi, ni; |
f4e36c33 | 685 | tree new_tree; |
4ee9c684 | 686 | |
f4e36c33 | 687 | new_tree = alloc_stmt_list (); |
688 | ni = tsi_start (new_tree); | |
4ee9c684 | 689 | oi = tsi_start (*tp); |
29f90295 | 690 | TREE_TYPE (new_tree) = TREE_TYPE (*tp); |
f4e36c33 | 691 | *tp = new_tree; |
4ee9c684 | 692 | |
693 | for (; !tsi_end_p (oi); tsi_next (&oi)) | |
bfec3452 | 694 | { |
695 | tree stmt = tsi_stmt (oi); | |
18642e81 | 696 | if (TREE_CODE (stmt) == STATEMENT_LIST) |
697 | /* This copy is not redundant; tsi_link_after will smash this | |
698 | STATEMENT_LIST into the end of the one we're building, and we | |
699 | don't want to do that with the original. */ | |
700 | copy_statement_list (&stmt); | |
bfec3452 | 701 | tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING); |
702 | } | |
4ee9c684 | 703 | } |
e343483a | 704 | |
4ee9c684 | 705 | static void |
51a48c27 | 706 | copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id) |
4ee9c684 | 707 | { |
708 | tree block = BIND_EXPR_BLOCK (*tp); | |
e343483a | 709 | /* Copy (and replace) the statement. */ |
710 | copy_tree_r (tp, walk_subtrees, NULL); | |
4ee9c684 | 711 | if (block) |
712 | { | |
713 | remap_block (&block, id); | |
714 | BIND_EXPR_BLOCK (*tp) = block; | |
715 | } | |
e343483a | 716 | |
4ee9c684 | 717 | if (BIND_EXPR_VARS (*tp)) |
cd3ece53 | 718 | /* This will remap a lot of the same decls again, but this should be |
719 | harmless. */ | |
720 | BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id); | |
e343483a | 721 | } |
722 | ||
75a70cf9 | 723 | |
724 | /* Create a new gimple_seq by remapping all the statements in BODY | |
725 | using the inlining information in ID. */ | |
726 | ||
6f932b06 | 727 | static gimple_seq |
75a70cf9 | 728 | remap_gimple_seq (gimple_seq body, copy_body_data *id) |
729 | { | |
730 | gimple_stmt_iterator si; | |
731 | gimple_seq new_body = NULL; | |
732 | ||
733 | for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si)) | |
734 | { | |
735 | gimple new_stmt = remap_gimple_stmt (gsi_stmt (si), id); | |
736 | gimple_seq_add_stmt (&new_body, new_stmt); | |
737 | } | |
738 | ||
739 | return new_body; | |
740 | } | |
741 | ||
742 | ||
743 | /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its | |
744 | block using the mapping information in ID. */ | |
745 | ||
746 | static gimple | |
747 | copy_gimple_bind (gimple stmt, copy_body_data *id) | |
748 | { | |
749 | gimple new_bind; | |
750 | tree new_block, new_vars; | |
751 | gimple_seq body, new_body; | |
752 | ||
753 | /* Copy the statement. Note that we purposely don't use copy_stmt | |
754 | here because we need to remap statements as we copy. */ | |
755 | body = gimple_bind_body (stmt); | |
756 | new_body = remap_gimple_seq (body, id); | |
757 | ||
758 | new_block = gimple_bind_block (stmt); | |
759 | if (new_block) | |
760 | remap_block (&new_block, id); | |
761 | ||
762 | /* This will remap a lot of the same decls again, but this should be | |
763 | harmless. */ | |
764 | new_vars = gimple_bind_vars (stmt); | |
765 | if (new_vars) | |
4b5d70fd | 766 | new_vars = remap_decls (new_vars, NULL, id); |
75a70cf9 | 767 | |
768 | new_bind = gimple_build_bind (new_vars, new_body, new_block); | |
769 | ||
770 | return new_bind; | |
771 | } | |
772 | ||
6b99cb5e | 773 | /* Return true if DECL is a parameter or a SSA_NAME for a parameter. */ |
774 | ||
775 | static bool | |
776 | is_parm (tree decl) | |
777 | { | |
778 | if (TREE_CODE (decl) == SSA_NAME) | |
779 | { | |
780 | decl = SSA_NAME_VAR (decl); | |
781 | if (!decl) | |
782 | return false; | |
783 | } | |
784 | ||
785 | return (TREE_CODE (decl) == PARM_DECL); | |
786 | } | |
75a70cf9 | 787 | |
788 | /* Remap the GIMPLE operand pointed to by *TP. DATA is really a | |
789 | 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'. | |
790 | WALK_SUBTREES is used to indicate walk_gimple_op whether to keep | |
791 | recursing into the children nodes of *TP. */ | |
792 | ||
793 | static tree | |
794 | remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data) | |
795 | { | |
796 | struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data; | |
797 | copy_body_data *id = (copy_body_data *) wi_p->info; | |
798 | tree fn = id->src_fn; | |
799 | ||
800 | if (TREE_CODE (*tp) == SSA_NAME) | |
801 | { | |
802 | *tp = remap_ssa_name (*tp, id); | |
803 | *walk_subtrees = 0; | |
804 | return NULL; | |
805 | } | |
806 | else if (auto_var_in_fn_p (*tp, fn)) | |
807 | { | |
808 | /* Local variables and labels need to be replaced by equivalent | |
809 | variables. We don't want to copy static variables; there's | |
810 | only one of those, no matter how many times we inline the | |
811 | containing function. Similarly for globals from an outer | |
812 | function. */ | |
813 | tree new_decl; | |
814 | ||
815 | /* Remap the declaration. */ | |
816 | new_decl = remap_decl (*tp, id); | |
817 | gcc_assert (new_decl); | |
818 | /* Replace this variable with the copy. */ | |
819 | STRIP_TYPE_NOPS (new_decl); | |
ae2a9b00 | 820 | /* ??? The C++ frontend uses void * pointer zero to initialize |
821 | any other type. This confuses the middle-end type verification. | |
822 | As cloned bodies do not go through gimplification again the fixup | |
823 | there doesn't trigger. */ | |
824 | if (TREE_CODE (new_decl) == INTEGER_CST | |
825 | && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl))) | |
826 | new_decl = fold_convert (TREE_TYPE (*tp), new_decl); | |
75a70cf9 | 827 | *tp = new_decl; |
828 | *walk_subtrees = 0; | |
829 | } | |
830 | else if (TREE_CODE (*tp) == STATEMENT_LIST) | |
831 | gcc_unreachable (); | |
832 | else if (TREE_CODE (*tp) == SAVE_EXPR) | |
833 | gcc_unreachable (); | |
834 | else if (TREE_CODE (*tp) == LABEL_DECL | |
835 | && (!DECL_CONTEXT (*tp) | |
836 | || decl_function_context (*tp) == id->src_fn)) | |
837 | /* These may need to be remapped for EH handling. */ | |
838 | *tp = remap_decl (*tp, id); | |
eaf1e576 | 839 | else if (TREE_CODE (*tp) == FIELD_DECL) |
840 | { | |
841 | /* If the enclosing record type is variably_modified_type_p, the field | |
842 | has already been remapped. Otherwise, it need not be. */ | |
843 | tree *n = (tree *) pointer_map_contains (id->decl_map, *tp); | |
844 | if (n) | |
845 | *tp = *n; | |
846 | *walk_subtrees = 0; | |
847 | } | |
75a70cf9 | 848 | else if (TYPE_P (*tp)) |
849 | /* Types may need remapping as well. */ | |
850 | *tp = remap_type (*tp, id); | |
851 | else if (CONSTANT_CLASS_P (*tp)) | |
852 | { | |
853 | /* If this is a constant, we have to copy the node iff the type | |
854 | will be remapped. copy_tree_r will not copy a constant. */ | |
855 | tree new_type = remap_type (TREE_TYPE (*tp), id); | |
856 | ||
857 | if (new_type == TREE_TYPE (*tp)) | |
858 | *walk_subtrees = 0; | |
859 | ||
860 | else if (TREE_CODE (*tp) == INTEGER_CST) | |
861 | *tp = build_int_cst_wide (new_type, TREE_INT_CST_LOW (*tp), | |
862 | TREE_INT_CST_HIGH (*tp)); | |
863 | else | |
864 | { | |
865 | *tp = copy_node (*tp); | |
866 | TREE_TYPE (*tp) = new_type; | |
867 | } | |
868 | } | |
869 | else | |
870 | { | |
871 | /* Otherwise, just copy the node. Note that copy_tree_r already | |
872 | knows not to copy VAR_DECLs, etc., so this is safe. */ | |
a37d97a5 | 873 | |
182cf5a9 | 874 | if (TREE_CODE (*tp) == MEM_REF) |
75a70cf9 | 875 | { |
182cf5a9 | 876 | /* We need to re-canonicalize MEM_REFs from inline substitutions |
7003a7e5 | 877 | that can happen when a pointer argument is an ADDR_EXPR. |
878 | Recurse here manually to allow that. */ | |
6b99cb5e | 879 | tree ptr = TREE_OPERAND (*tp, 0); |
880 | tree type = remap_type (TREE_TYPE (*tp), id); | |
881 | tree old = *tp; | |
7003a7e5 | 882 | walk_tree (&ptr, remap_gimple_op_r, data, NULL); |
6b99cb5e | 883 | *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1)); |
72dbeb36 | 884 | TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old); |
0adec5fc | 885 | TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old); |
7003a7e5 | 886 | TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old); |
6b99cb5e | 887 | /* We cannot propagate the TREE_THIS_NOTRAP flag if we have |
888 | remapped a parameter as the property might be valid only | |
889 | for the parameter itself. */ | |
890 | if (TREE_THIS_NOTRAP (old) | |
891 | && (!is_parm (TREE_OPERAND (old, 0)) | |
892 | || (!id->transform_parameter && is_parm (ptr)))) | |
893 | TREE_THIS_NOTRAP (*tp) = 1; | |
7003a7e5 | 894 | *walk_subtrees = 0; |
895 | return NULL; | |
75a70cf9 | 896 | } |
897 | ||
898 | /* Here is the "usual case". Copy this tree node, and then | |
899 | tweak some special cases. */ | |
900 | copy_tree_r (tp, walk_subtrees, NULL); | |
901 | ||
a37d97a5 | 902 | if (TREE_CODE (*tp) != OMP_CLAUSE) |
903 | TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id); | |
904 | ||
75a70cf9 | 905 | if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3)) |
906 | { | |
907 | /* The copied TARGET_EXPR has never been expanded, even if the | |
908 | original node was expanded already. */ | |
909 | TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3); | |
910 | TREE_OPERAND (*tp, 3) = NULL_TREE; | |
911 | } | |
912 | else if (TREE_CODE (*tp) == ADDR_EXPR) | |
913 | { | |
914 | /* Variable substitution need not be simple. In particular, | |
182cf5a9 | 915 | the MEM_REF substitution above. Make sure that |
5169661d | 916 | TREE_CONSTANT and friends are up-to-date. */ |
75a70cf9 | 917 | int invariant = is_gimple_min_invariant (*tp); |
d603fd86 | 918 | walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL); |
182cf5a9 | 919 | recompute_tree_invariant_for_addr_expr (*tp); |
75a70cf9 | 920 | |
921 | /* If this used to be invariant, but is not any longer, | |
922 | then regimplification is probably needed. */ | |
923 | if (invariant && !is_gimple_min_invariant (*tp)) | |
924 | id->regimplify = true; | |
925 | ||
926 | *walk_subtrees = 0; | |
927 | } | |
928 | } | |
929 | ||
5169661d | 930 | /* Update the TREE_BLOCK for the cloned expr. */ |
931 | if (EXPR_P (*tp)) | |
932 | { | |
933 | tree new_block = id->remapping_type_depth == 0 ? id->block : NULL; | |
934 | tree old_block = TREE_BLOCK (*tp); | |
935 | if (old_block) | |
936 | { | |
937 | tree *n; | |
938 | n = (tree *) pointer_map_contains (id->decl_map, | |
939 | TREE_BLOCK (*tp)); | |
940 | if (n) | |
941 | new_block = *n; | |
942 | } | |
943 | TREE_SET_BLOCK (*tp, new_block); | |
944 | } | |
945 | ||
75a70cf9 | 946 | /* Keep iterating. */ |
947 | return NULL_TREE; | |
948 | } | |
949 | ||
950 | ||
951 | /* Called from copy_body_id via walk_tree. DATA is really a | |
51a48c27 | 952 | `copy_body_data *'. */ |
5ff0afa2 | 953 | |
51a48c27 | 954 | tree |
75a70cf9 | 955 | copy_tree_body_r (tree *tp, int *walk_subtrees, void *data) |
e343483a | 956 | { |
51a48c27 | 957 | copy_body_data *id = (copy_body_data *) data; |
958 | tree fn = id->src_fn; | |
b3d24a23 | 959 | tree new_block; |
e343483a | 960 | |
e27482aa | 961 | /* Begin by recognizing trees that we'll completely rewrite for the |
962 | inlining context. Our output for these trees is completely | |
963 | different from out input (e.g. RETURN_EXPR is deleted, and morphs | |
964 | into an edge). Further down, we'll handle trees that get | |
965 | duplicated and/or tweaked. */ | |
e343483a | 966 | |
51a48c27 | 967 | /* When requested, RETURN_EXPRs should be transformed to just the |
75a70cf9 | 968 | contained MODIFY_EXPR. The branch semantics of the return will |
51a48c27 | 969 | be handled elsewhere by manipulating the CFG rather than a statement. */ |
970 | if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify) | |
e343483a | 971 | { |
e27482aa | 972 | tree assignment = TREE_OPERAND (*tp, 0); |
e343483a | 973 | |
974 | /* If we're returning something, just turn that into an | |
e27482aa | 975 | assignment into the equivalent of the original RESULT_DECL. |
976 | If the "assignment" is just the result decl, the result | |
977 | decl has already been set (e.g. a recent "foo (&result_decl, | |
978 | ...)"); just toss the entire RETURN_EXPR. */ | |
75a70cf9 | 979 | if (assignment && TREE_CODE (assignment) == MODIFY_EXPR) |
e27482aa | 980 | { |
981 | /* Replace the RETURN_EXPR with (a copy of) the | |
75a70cf9 | 982 | MODIFY_EXPR hanging underneath. */ |
e27482aa | 983 | *tp = copy_node (assignment); |
984 | } | |
985 | else /* Else the RETURN_EXPR returns no value. */ | |
986 | { | |
987 | *tp = NULL; | |
a9c6c0e3 | 988 | return (tree) (void *)1; |
e27482aa | 989 | } |
e343483a | 990 | } |
deff5ffd | 991 | else if (TREE_CODE (*tp) == SSA_NAME) |
992 | { | |
993 | *tp = remap_ssa_name (*tp, id); | |
994 | *walk_subtrees = 0; | |
995 | return NULL; | |
996 | } | |
e27482aa | 997 | |
e343483a | 998 | /* Local variables and labels need to be replaced by equivalent |
999 | variables. We don't want to copy static variables; there's only | |
1000 | one of those, no matter how many times we inline the containing | |
1f8a6ff8 | 1001 | function. Similarly for globals from an outer function. */ |
2ef41604 | 1002 | else if (auto_var_in_fn_p (*tp, fn)) |
e343483a | 1003 | { |
1004 | tree new_decl; | |
1005 | ||
1006 | /* Remap the declaration. */ | |
1007 | new_decl = remap_decl (*tp, id); | |
8c0963c4 | 1008 | gcc_assert (new_decl); |
e343483a | 1009 | /* Replace this variable with the copy. */ |
1010 | STRIP_TYPE_NOPS (new_decl); | |
1011 | *tp = new_decl; | |
db7439ff | 1012 | *walk_subtrees = 0; |
e343483a | 1013 | } |
4ee9c684 | 1014 | else if (TREE_CODE (*tp) == STATEMENT_LIST) |
1015 | copy_statement_list (tp); | |
bfec3452 | 1016 | else if (TREE_CODE (*tp) == SAVE_EXPR |
1017 | || TREE_CODE (*tp) == TARGET_EXPR) | |
67c155cb | 1018 | remap_save_expr (tp, id->decl_map, walk_subtrees); |
8266b8c5 | 1019 | else if (TREE_CODE (*tp) == LABEL_DECL |
1020 | && (! DECL_CONTEXT (*tp) | |
51a48c27 | 1021 | || decl_function_context (*tp) == id->src_fn)) |
e27482aa | 1022 | /* These may need to be remapped for EH handling. */ |
8266b8c5 | 1023 | *tp = remap_decl (*tp, id); |
4ee9c684 | 1024 | else if (TREE_CODE (*tp) == BIND_EXPR) |
1025 | copy_bind_expr (tp, walk_subtrees, id); | |
ecba2e4c | 1026 | /* Types may need remapping as well. */ |
1027 | else if (TYPE_P (*tp)) | |
1028 | *tp = remap_type (*tp, id); | |
1029 | ||
bfc01d24 | 1030 | /* If this is a constant, we have to copy the node iff the type will be |
1031 | remapped. copy_tree_r will not copy a constant. */ | |
0b7784b5 | 1032 | else if (CONSTANT_CLASS_P (*tp)) |
bfc01d24 | 1033 | { |
1034 | tree new_type = remap_type (TREE_TYPE (*tp), id); | |
1035 | ||
1036 | if (new_type == TREE_TYPE (*tp)) | |
1037 | *walk_subtrees = 0; | |
1038 | ||
1039 | else if (TREE_CODE (*tp) == INTEGER_CST) | |
1040 | *tp = build_int_cst_wide (new_type, TREE_INT_CST_LOW (*tp), | |
1041 | TREE_INT_CST_HIGH (*tp)); | |
1042 | else | |
1043 | { | |
1044 | *tp = copy_node (*tp); | |
1045 | TREE_TYPE (*tp) = new_type; | |
1046 | } | |
1047 | } | |
1048 | ||
e343483a | 1049 | /* Otherwise, just copy the node. Note that copy_tree_r already |
1050 | knows not to copy VAR_DECLs, etc., so this is safe. */ | |
1051 | else | |
1052 | { | |
e27482aa | 1053 | /* Here we handle trees that are not completely rewritten. |
1054 | First we detect some inlining-induced bogosities for | |
1055 | discarding. */ | |
75a70cf9 | 1056 | if (TREE_CODE (*tp) == MODIFY_EXPR |
1057 | && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1) | |
1058 | && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn))) | |
e343483a | 1059 | { |
1060 | /* Some assignments VAR = VAR; don't generate any rtl code | |
1061 | and thus don't count as variable modification. Avoid | |
1062 | keeping bogosities like 0 = 0. */ | |
75a70cf9 | 1063 | tree decl = TREE_OPERAND (*tp, 0), value; |
e3022db7 | 1064 | tree *n; |
e343483a | 1065 | |
e3022db7 | 1066 | n = (tree *) pointer_map_contains (id->decl_map, decl); |
e343483a | 1067 | if (n) |
1068 | { | |
e3022db7 | 1069 | value = *n; |
e343483a | 1070 | STRIP_TYPE_NOPS (value); |
9c2a0c05 | 1071 | if (TREE_CONSTANT (value) || TREE_READONLY (value)) |
ffee01dc | 1072 | { |
e60a6f7b | 1073 | *tp = build_empty_stmt (EXPR_LOCATION (*tp)); |
75a70cf9 | 1074 | return copy_tree_body_r (tp, walk_subtrees, data); |
ffee01dc | 1075 | } |
e343483a | 1076 | } |
1077 | } | |
51a48c27 | 1078 | else if (TREE_CODE (*tp) == INDIRECT_REF) |
4ee9c684 | 1079 | { |
1080 | /* Get rid of *& from inline substitutions that can happen when a | |
1081 | pointer argument is an ADDR_EXPR. */ | |
eb0fefdb | 1082 | tree decl = TREE_OPERAND (*tp, 0); |
6b99cb5e | 1083 | tree *n = (tree *) pointer_map_contains (id->decl_map, decl); |
4ee9c684 | 1084 | if (n) |
1085 | { | |
51fc648f | 1086 | /* If we happen to get an ADDR_EXPR in n->value, strip |
1087 | it manually here as we'll eventually get ADDR_EXPRs | |
1088 | which lie about their types pointed to. In this case | |
1089 | build_fold_indirect_ref wouldn't strip the INDIRECT_REF, | |
9ea9fcf0 | 1090 | but we absolutely rely on that. As fold_indirect_ref |
1091 | does other useful transformations, try that first, though. */ | |
6b99cb5e | 1092 | tree type = TREE_TYPE (*tp); |
1093 | tree ptr = id->do_not_unshare ? *n : unshare_expr (*n); | |
1094 | tree old = *tp; | |
1095 | *tp = gimple_fold_indirect_ref (ptr); | |
9ea9fcf0 | 1096 | if (! *tp) |
1097 | { | |
6b99cb5e | 1098 | if (TREE_CODE (ptr) == ADDR_EXPR) |
db812c94 | 1099 | { |
6b99cb5e | 1100 | *tp |
1101 | = fold_indirect_ref_1 (EXPR_LOCATION (ptr), type, ptr); | |
db812c94 | 1102 | /* ??? We should either assert here or build |
1103 | a VIEW_CONVERT_EXPR instead of blindly leaking | |
1104 | incompatible types to our IL. */ | |
1105 | if (! *tp) | |
6b99cb5e | 1106 | *tp = TREE_OPERAND (ptr, 0); |
db812c94 | 1107 | } |
9ea9fcf0 | 1108 | else |
e4a492cd | 1109 | { |
6b99cb5e | 1110 | *tp = build1 (INDIRECT_REF, type, ptr); |
e4a492cd | 1111 | TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old); |
74cbc691 | 1112 | TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old); |
a67e70de | 1113 | TREE_READONLY (*tp) = TREE_READONLY (old); |
6b99cb5e | 1114 | /* We cannot propagate the TREE_THIS_NOTRAP flag if we |
1115 | have remapped a parameter as the property might be | |
1116 | valid only for the parameter itself. */ | |
1117 | if (TREE_THIS_NOTRAP (old) | |
1118 | && (!is_parm (TREE_OPERAND (old, 0)) | |
1119 | || (!id->transform_parameter && is_parm (ptr)))) | |
1120 | TREE_THIS_NOTRAP (*tp) = 1; | |
e4a492cd | 1121 | } |
9ea9fcf0 | 1122 | } |
eb0fefdb | 1123 | *walk_subtrees = 0; |
1124 | return NULL; | |
ffee01dc | 1125 | } |
1126 | } | |
182cf5a9 | 1127 | else if (TREE_CODE (*tp) == MEM_REF) |
1128 | { | |
b94b4cf4 | 1129 | /* We need to re-canonicalize MEM_REFs from inline substitutions |
1130 | that can happen when a pointer argument is an ADDR_EXPR. | |
1131 | Recurse here manually to allow that. */ | |
6b99cb5e | 1132 | tree ptr = TREE_OPERAND (*tp, 0); |
1133 | tree type = remap_type (TREE_TYPE (*tp), id); | |
1134 | tree old = *tp; | |
b94b4cf4 | 1135 | walk_tree (&ptr, copy_tree_body_r, data, NULL); |
6b99cb5e | 1136 | *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1)); |
b94b4cf4 | 1137 | TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old); |
1138 | TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old); | |
1139 | TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old); | |
6b99cb5e | 1140 | /* We cannot propagate the TREE_THIS_NOTRAP flag if we have |
1141 | remapped a parameter as the property might be valid only | |
1142 | for the parameter itself. */ | |
1143 | if (TREE_THIS_NOTRAP (old) | |
1144 | && (!is_parm (TREE_OPERAND (old, 0)) | |
1145 | || (!id->transform_parameter && is_parm (ptr)))) | |
1146 | TREE_THIS_NOTRAP (*tp) = 1; | |
b94b4cf4 | 1147 | *walk_subtrees = 0; |
1148 | return NULL; | |
182cf5a9 | 1149 | } |
ffee01dc | 1150 | |
e27482aa | 1151 | /* Here is the "usual case". Copy this tree node, and then |
1152 | tweak some special cases. */ | |
51a48c27 | 1153 | copy_tree_r (tp, walk_subtrees, NULL); |
deff5ffd | 1154 | |
b3d24a23 | 1155 | /* If EXPR has block defined, map it to newly constructed block. |
1156 | When inlining we want EXPRs without block appear in the block | |
edbb328f | 1157 | of function call if we are not remapping a type. */ |
75a70cf9 | 1158 | if (EXPR_P (*tp)) |
b3d24a23 | 1159 | { |
edbb328f | 1160 | new_block = id->remapping_type_depth == 0 ? id->block : NULL; |
b3d24a23 | 1161 | if (TREE_BLOCK (*tp)) |
1162 | { | |
e3022db7 | 1163 | tree *n; |
1164 | n = (tree *) pointer_map_contains (id->decl_map, | |
1165 | TREE_BLOCK (*tp)); | |
cd3ece53 | 1166 | if (n) |
1167 | new_block = *n; | |
b3d24a23 | 1168 | } |
5169661d | 1169 | TREE_SET_BLOCK (*tp, new_block); |
b3d24a23 | 1170 | } |
ffee01dc | 1171 | |
75a70cf9 | 1172 | if (TREE_CODE (*tp) != OMP_CLAUSE) |
35cc02b5 | 1173 | TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id); |
ecba2e4c | 1174 | |
ffee01dc | 1175 | /* The copied TARGET_EXPR has never been expanded, even if the |
1176 | original node was expanded already. */ | |
1177 | if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3)) | |
1178 | { | |
1179 | TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3); | |
1180 | TREE_OPERAND (*tp, 3) = NULL_TREE; | |
1181 | } | |
579a1f45 | 1182 | |
1183 | /* Variable substitution need not be simple. In particular, the | |
1184 | INDIRECT_REF substitution above. Make sure that TREE_CONSTANT | |
1185 | and friends are up-to-date. */ | |
1186 | else if (TREE_CODE (*tp) == ADDR_EXPR) | |
1187 | { | |
71d9af81 | 1188 | int invariant = is_gimple_min_invariant (*tp); |
75a70cf9 | 1189 | walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL); |
1190 | ||
52a7bd0e | 1191 | /* Handle the case where we substituted an INDIRECT_REF |
1192 | into the operand of the ADDR_EXPR. */ | |
1193 | if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF) | |
1194 | *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0); | |
1195 | else | |
1196 | recompute_tree_invariant_for_addr_expr (*tp); | |
75a70cf9 | 1197 | |
3d053ea5 | 1198 | /* If this used to be invariant, but is not any longer, |
1199 | then regimplification is probably needed. */ | |
71d9af81 | 1200 | if (invariant && !is_gimple_min_invariant (*tp)) |
3d053ea5 | 1201 | id->regimplify = true; |
75a70cf9 | 1202 | |
579a1f45 | 1203 | *walk_subtrees = 0; |
1204 | } | |
e343483a | 1205 | } |
1206 | ||
1207 | /* Keep iterating. */ | |
1208 | return NULL_TREE; | |
1209 | } | |
1210 | ||
e38def9c | 1211 | /* Helper for remap_gimple_stmt. Given an EH region number for the |
1212 | source function, map that to the duplicate EH region number in | |
1213 | the destination function. */ | |
1214 | ||
1215 | static int | |
1216 | remap_eh_region_nr (int old_nr, copy_body_data *id) | |
1217 | { | |
1218 | eh_region old_r, new_r; | |
1219 | void **slot; | |
1220 | ||
1221 | old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr); | |
1222 | slot = pointer_map_contains (id->eh_map, old_r); | |
1223 | new_r = (eh_region) *slot; | |
1224 | ||
1225 | return new_r->index; | |
1226 | } | |
1227 | ||
1228 | /* Similar, but operate on INTEGER_CSTs. */ | |
1229 | ||
1230 | static tree | |
1231 | remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id) | |
1232 | { | |
1233 | int old_nr, new_nr; | |
1234 | ||
fcb97e84 | 1235 | old_nr = tree_to_shwi (old_t_nr); |
e38def9c | 1236 | new_nr = remap_eh_region_nr (old_nr, id); |
1237 | ||
b3d480fb | 1238 | return build_int_cst (integer_type_node, new_nr); |
e38def9c | 1239 | } |
75a70cf9 | 1240 | |
1241 | /* Helper for copy_bb. Remap statement STMT using the inlining | |
1242 | information in ID. Return the new statement copy. */ | |
1243 | ||
1244 | static gimple | |
1245 | remap_gimple_stmt (gimple stmt, copy_body_data *id) | |
1246 | { | |
1247 | gimple copy = NULL; | |
1248 | struct walk_stmt_info wi; | |
508d0d3f | 1249 | bool skip_first = false; |
75a70cf9 | 1250 | |
1251 | /* Begin by recognizing trees that we'll completely rewrite for the | |
1252 | inlining context. Our output for these trees is completely | |
1253 | different from out input (e.g. RETURN_EXPR is deleted, and morphs | |
1254 | into an edge). Further down, we'll handle trees that get | |
1255 | duplicated and/or tweaked. */ | |
1256 | ||
1257 | /* When requested, GIMPLE_RETURNs should be transformed to just the | |
1258 | contained GIMPLE_ASSIGN. The branch semantics of the return will | |
1259 | be handled elsewhere by manipulating the CFG rather than the | |
1260 | statement. */ | |
1261 | if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify) | |
1262 | { | |
1263 | tree retval = gimple_return_retval (stmt); | |
1264 | ||
1265 | /* If we're returning something, just turn that into an | |
1266 | assignment into the equivalent of the original RESULT_DECL. | |
1267 | If RETVAL is just the result decl, the result decl has | |
1268 | already been set (e.g. a recent "foo (&result_decl, ...)"); | |
1269 | just toss the entire GIMPLE_RETURN. */ | |
524a0531 | 1270 | if (retval |
1271 | && (TREE_CODE (retval) != RESULT_DECL | |
1272 | && (TREE_CODE (retval) != SSA_NAME | |
ec11736b | 1273 | || ! SSA_NAME_VAR (retval) |
524a0531 | 1274 | || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL))) |
508d0d3f | 1275 | { |
1276 | copy = gimple_build_assign (id->retvar, retval); | |
1277 | /* id->retvar is already substituted. Skip it on later remapping. */ | |
1278 | skip_first = true; | |
1279 | } | |
75a70cf9 | 1280 | else |
1281 | return gimple_build_nop (); | |
1282 | } | |
1283 | else if (gimple_has_substatements (stmt)) | |
1284 | { | |
1285 | gimple_seq s1, s2; | |
1286 | ||
1287 | /* When cloning bodies from the C++ front end, we will be handed bodies | |
1288 | in High GIMPLE form. Handle here all the High GIMPLE statements that | |
1289 | have embedded statements. */ | |
1290 | switch (gimple_code (stmt)) | |
1291 | { | |
1292 | case GIMPLE_BIND: | |
1293 | copy = copy_gimple_bind (stmt, id); | |
1294 | break; | |
1295 | ||
1296 | case GIMPLE_CATCH: | |
1297 | s1 = remap_gimple_seq (gimple_catch_handler (stmt), id); | |
1298 | copy = gimple_build_catch (gimple_catch_types (stmt), s1); | |
1299 | break; | |
1300 | ||
1301 | case GIMPLE_EH_FILTER: | |
1302 | s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id); | |
1303 | copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1); | |
1304 | break; | |
1305 | ||
1306 | case GIMPLE_TRY: | |
1307 | s1 = remap_gimple_seq (gimple_try_eval (stmt), id); | |
1308 | s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id); | |
48e1416a | 1309 | copy = gimple_build_try (s1, s2, gimple_try_kind (stmt)); |
75a70cf9 | 1310 | break; |
1311 | ||
1312 | case GIMPLE_WITH_CLEANUP_EXPR: | |
1313 | s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id); | |
1314 | copy = gimple_build_wce (s1); | |
1315 | break; | |
1316 | ||
1317 | case GIMPLE_OMP_PARALLEL: | |
1318 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1319 | copy = gimple_build_omp_parallel | |
1320 | (s1, | |
1321 | gimple_omp_parallel_clauses (stmt), | |
1322 | gimple_omp_parallel_child_fn (stmt), | |
1323 | gimple_omp_parallel_data_arg (stmt)); | |
1324 | break; | |
1325 | ||
1326 | case GIMPLE_OMP_TASK: | |
1327 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1328 | copy = gimple_build_omp_task | |
1329 | (s1, | |
1330 | gimple_omp_task_clauses (stmt), | |
1331 | gimple_omp_task_child_fn (stmt), | |
1332 | gimple_omp_task_data_arg (stmt), | |
1333 | gimple_omp_task_copy_fn (stmt), | |
1334 | gimple_omp_task_arg_size (stmt), | |
1335 | gimple_omp_task_arg_align (stmt)); | |
1336 | break; | |
1337 | ||
1338 | case GIMPLE_OMP_FOR: | |
1339 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1340 | s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id); | |
3d483a94 | 1341 | copy = gimple_build_omp_for (s1, gimple_omp_for_kind (stmt), |
1342 | gimple_omp_for_clauses (stmt), | |
75a70cf9 | 1343 | gimple_omp_for_collapse (stmt), s2); |
1344 | { | |
1345 | size_t i; | |
1346 | for (i = 0; i < gimple_omp_for_collapse (stmt); i++) | |
1347 | { | |
1348 | gimple_omp_for_set_index (copy, i, | |
1349 | gimple_omp_for_index (stmt, i)); | |
1350 | gimple_omp_for_set_initial (copy, i, | |
1351 | gimple_omp_for_initial (stmt, i)); | |
1352 | gimple_omp_for_set_final (copy, i, | |
1353 | gimple_omp_for_final (stmt, i)); | |
1354 | gimple_omp_for_set_incr (copy, i, | |
1355 | gimple_omp_for_incr (stmt, i)); | |
1356 | gimple_omp_for_set_cond (copy, i, | |
1357 | gimple_omp_for_cond (stmt, i)); | |
1358 | } | |
1359 | } | |
1360 | break; | |
1361 | ||
1362 | case GIMPLE_OMP_MASTER: | |
1363 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1364 | copy = gimple_build_omp_master (s1); | |
1365 | break; | |
1366 | ||
bc7bff74 | 1367 | case GIMPLE_OMP_TASKGROUP: |
1368 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1369 | copy = gimple_build_omp_taskgroup (s1); | |
1370 | break; | |
1371 | ||
75a70cf9 | 1372 | case GIMPLE_OMP_ORDERED: |
1373 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1374 | copy = gimple_build_omp_ordered (s1); | |
1375 | break; | |
1376 | ||
1377 | case GIMPLE_OMP_SECTION: | |
1378 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1379 | copy = gimple_build_omp_section (s1); | |
1380 | break; | |
1381 | ||
1382 | case GIMPLE_OMP_SECTIONS: | |
1383 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1384 | copy = gimple_build_omp_sections | |
1385 | (s1, gimple_omp_sections_clauses (stmt)); | |
1386 | break; | |
1387 | ||
1388 | case GIMPLE_OMP_SINGLE: | |
1389 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1390 | copy = gimple_build_omp_single | |
1391 | (s1, gimple_omp_single_clauses (stmt)); | |
1392 | break; | |
1393 | ||
bc7bff74 | 1394 | case GIMPLE_OMP_TARGET: |
1395 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1396 | copy = gimple_build_omp_target | |
1397 | (s1, gimple_omp_target_kind (stmt), | |
1398 | gimple_omp_target_clauses (stmt)); | |
1399 | break; | |
1400 | ||
1401 | case GIMPLE_OMP_TEAMS: | |
1402 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1403 | copy = gimple_build_omp_teams | |
1404 | (s1, gimple_omp_teams_clauses (stmt)); | |
1405 | break; | |
1406 | ||
12d3d5cb | 1407 | case GIMPLE_OMP_CRITICAL: |
1408 | s1 = remap_gimple_seq (gimple_omp_body (stmt), id); | |
1409 | copy | |
1410 | = gimple_build_omp_critical (s1, gimple_omp_critical_name (stmt)); | |
1411 | break; | |
1412 | ||
4c0315d0 | 1413 | case GIMPLE_TRANSACTION: |
1414 | s1 = remap_gimple_seq (gimple_transaction_body (stmt), id); | |
1415 | copy = gimple_build_transaction (s1, gimple_transaction_label (stmt)); | |
1416 | gimple_transaction_set_subcode (copy, gimple_transaction_subcode (stmt)); | |
1417 | break; | |
1418 | ||
75a70cf9 | 1419 | default: |
1420 | gcc_unreachable (); | |
1421 | } | |
1422 | } | |
1423 | else | |
1424 | { | |
1425 | if (gimple_assign_copy_p (stmt) | |
1426 | && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt) | |
1427 | && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn)) | |
1428 | { | |
1429 | /* Here we handle statements that are not completely rewritten. | |
1430 | First we detect some inlining-induced bogosities for | |
1431 | discarding. */ | |
1432 | ||
1433 | /* Some assignments VAR = VAR; don't generate any rtl code | |
1434 | and thus don't count as variable modification. Avoid | |
1435 | keeping bogosities like 0 = 0. */ | |
1436 | tree decl = gimple_assign_lhs (stmt), value; | |
1437 | tree *n; | |
1438 | ||
1439 | n = (tree *) pointer_map_contains (id->decl_map, decl); | |
1440 | if (n) | |
1441 | { | |
1442 | value = *n; | |
1443 | STRIP_TYPE_NOPS (value); | |
1444 | if (TREE_CONSTANT (value) || TREE_READONLY (value)) | |
1445 | return gimple_build_nop (); | |
1446 | } | |
1447 | } | |
1448 | ||
da51794e | 1449 | /* For *ptr_N ={v} {CLOBBER}, if ptr_N is SSA_NAME defined |
1450 | in a block that we aren't copying during tree_function_versioning, | |
1451 | just drop the clobber stmt. */ | |
1452 | if (id->blocks_to_copy && gimple_clobber_p (stmt)) | |
1453 | { | |
1454 | tree lhs = gimple_assign_lhs (stmt); | |
1455 | if (TREE_CODE (lhs) == MEM_REF | |
1456 | && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME) | |
1457 | { | |
1458 | gimple def_stmt = SSA_NAME_DEF_STMT (TREE_OPERAND (lhs, 0)); | |
1459 | if (gimple_bb (def_stmt) | |
1460 | && !bitmap_bit_p (id->blocks_to_copy, | |
1461 | gimple_bb (def_stmt)->index)) | |
1462 | return gimple_build_nop (); | |
1463 | } | |
1464 | } | |
1465 | ||
9845d120 | 1466 | if (gimple_debug_bind_p (stmt)) |
1467 | { | |
1468 | copy = gimple_build_debug_bind (gimple_debug_bind_get_var (stmt), | |
1469 | gimple_debug_bind_get_value (stmt), | |
1470 | stmt); | |
f1f41a6c | 1471 | id->debug_stmts.safe_push (copy); |
9845d120 | 1472 | return copy; |
1473 | } | |
841424cc | 1474 | if (gimple_debug_source_bind_p (stmt)) |
1475 | { | |
1476 | copy = gimple_build_debug_source_bind | |
1477 | (gimple_debug_source_bind_get_var (stmt), | |
1478 | gimple_debug_source_bind_get_value (stmt), stmt); | |
f1f41a6c | 1479 | id->debug_stmts.safe_push (copy); |
841424cc | 1480 | return copy; |
1481 | } | |
e38def9c | 1482 | |
1483 | /* Create a new deep copy of the statement. */ | |
1484 | copy = gimple_copy (stmt); | |
1485 | ||
1486 | /* Remap the region numbers for __builtin_eh_{pointer,filter}, | |
1487 | RESX and EH_DISPATCH. */ | |
1488 | if (id->eh_map) | |
1489 | switch (gimple_code (copy)) | |
1490 | { | |
1491 | case GIMPLE_CALL: | |
1492 | { | |
1493 | tree r, fndecl = gimple_call_fndecl (copy); | |
1494 | if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL) | |
1495 | switch (DECL_FUNCTION_CODE (fndecl)) | |
1496 | { | |
1497 | case BUILT_IN_EH_COPY_VALUES: | |
1498 | r = gimple_call_arg (copy, 1); | |
1499 | r = remap_eh_region_tree_nr (r, id); | |
1500 | gimple_call_set_arg (copy, 1, r); | |
1501 | /* FALLTHRU */ | |
1502 | ||
1503 | case BUILT_IN_EH_POINTER: | |
1504 | case BUILT_IN_EH_FILTER: | |
1505 | r = gimple_call_arg (copy, 0); | |
1506 | r = remap_eh_region_tree_nr (r, id); | |
1507 | gimple_call_set_arg (copy, 0, r); | |
1508 | break; | |
1509 | ||
1510 | default: | |
1511 | break; | |
1512 | } | |
cb245216 | 1513 | |
1a981e1a | 1514 | /* Reset alias info if we didn't apply measures to |
1515 | keep it valid over inlining by setting DECL_PT_UID. */ | |
1516 | if (!id->src_cfun->gimple_df | |
1517 | || !id->src_cfun->gimple_df->ipa_pta) | |
1518 | gimple_call_reset_alias_info (copy); | |
e38def9c | 1519 | } |
1520 | break; | |
1521 | ||
1522 | case GIMPLE_RESX: | |
1523 | { | |
1524 | int r = gimple_resx_region (copy); | |
1525 | r = remap_eh_region_nr (r, id); | |
1526 | gimple_resx_set_region (copy, r); | |
1527 | } | |
1528 | break; | |
1529 | ||
1530 | case GIMPLE_EH_DISPATCH: | |
1531 | { | |
1532 | int r = gimple_eh_dispatch_region (copy); | |
1533 | r = remap_eh_region_nr (r, id); | |
1534 | gimple_eh_dispatch_set_region (copy, r); | |
1535 | } | |
1536 | break; | |
1537 | ||
1538 | default: | |
1539 | break; | |
1540 | } | |
75a70cf9 | 1541 | } |
1542 | ||
1543 | /* If STMT has a block defined, map it to the newly constructed | |
688b0b5b | 1544 | block. */ |
75a70cf9 | 1545 | if (gimple_block (copy)) |
1546 | { | |
1547 | tree *n; | |
1548 | n = (tree *) pointer_map_contains (id->decl_map, gimple_block (copy)); | |
1549 | gcc_assert (n); | |
688b0b5b | 1550 | gimple_set_block (copy, *n); |
75a70cf9 | 1551 | } |
1552 | ||
841424cc | 1553 | if (gimple_debug_bind_p (copy) || gimple_debug_source_bind_p (copy)) |
9845d120 | 1554 | return copy; |
1555 | ||
75a70cf9 | 1556 | /* Remap all the operands in COPY. */ |
1557 | memset (&wi, 0, sizeof (wi)); | |
1558 | wi.info = id; | |
508d0d3f | 1559 | if (skip_first) |
1560 | walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL); | |
1561 | else | |
48e1416a | 1562 | walk_gimple_op (copy, remap_gimple_op_r, &wi); |
75a70cf9 | 1563 | |
dd277d48 | 1564 | /* Clear the copied virtual operands. We are not remapping them here |
1565 | but are going to recreate them from scratch. */ | |
1566 | if (gimple_has_mem_ops (copy)) | |
1567 | { | |
1568 | gimple_set_vdef (copy, NULL_TREE); | |
1569 | gimple_set_vuse (copy, NULL_TREE); | |
1570 | } | |
1571 | ||
75a70cf9 | 1572 | return copy; |
1573 | } | |
1574 | ||
1575 | ||
e27482aa | 1576 | /* Copy basic block, scale profile accordingly. Edges will be taken care of |
1577 | later. */ | |
1578 | ||
1579 | static basic_block | |
5b17b7ae | 1580 | copy_bb (copy_body_data *id, basic_block bb, int frequency_scale, |
1581 | gcov_type count_scale) | |
e27482aa | 1582 | { |
b236ac0e | 1583 | gimple_stmt_iterator gsi, copy_gsi, seq_gsi; |
e27482aa | 1584 | basic_block copy_basic_block; |
75a70cf9 | 1585 | tree decl; |
e2d3f422 | 1586 | gcov_type freq; |
b06ab5fa | 1587 | basic_block prev; |
1588 | ||
1589 | /* Search for previous copied basic block. */ | |
1590 | prev = bb->prev_bb; | |
1591 | while (!prev->aux) | |
1592 | prev = prev->prev_bb; | |
e27482aa | 1593 | |
1594 | /* create_basic_block() will append every new block to | |
1595 | basic_block_info automatically. */ | |
a9c6c0e3 | 1596 | copy_basic_block = create_basic_block (NULL, (void *) 0, |
b06ab5fa | 1597 | (basic_block) prev->aux); |
70074000 | 1598 | copy_basic_block->count = apply_scale (bb->count, count_scale); |
4ae20857 | 1599 | |
75a70cf9 | 1600 | /* We are going to rebuild frequencies from scratch. These values |
1601 | are of only minor importance, for driving canonicalize_loop_headers. */ | |
70074000 | 1602 | freq = apply_scale ((gcov_type)bb->frequency, frequency_scale); |
75a70cf9 | 1603 | |
e2d3f422 | 1604 | /* We recompute frequencies after inlining, so this is quite safe. */ |
1605 | if (freq > BB_FREQ_MAX) | |
1606 | freq = BB_FREQ_MAX; | |
1607 | copy_basic_block->frequency = freq; | |
e27482aa | 1608 | |
75a70cf9 | 1609 | copy_gsi = gsi_start_bb (copy_basic_block); |
1610 | ||
1611 | for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi)) | |
e27482aa | 1612 | { |
75a70cf9 | 1613 | gimple stmt = gsi_stmt (gsi); |
1614 | gimple orig_stmt = stmt; | |
e27482aa | 1615 | |
3d053ea5 | 1616 | id->regimplify = false; |
75a70cf9 | 1617 | stmt = remap_gimple_stmt (stmt, id); |
1618 | if (gimple_nop_p (stmt)) | |
1619 | continue; | |
1620 | ||
1621 | gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun, orig_stmt); | |
b236ac0e | 1622 | seq_gsi = copy_gsi; |
75a70cf9 | 1623 | |
1624 | /* With return slot optimization we can end up with | |
1625 | non-gimple (foo *)&this->m, fix that here. */ | |
da143e71 | 1626 | if (is_gimple_assign (stmt) |
1627 | && gimple_assign_rhs_code (stmt) == NOP_EXPR | |
1628 | && !is_gimple_val (gimple_assign_rhs1 (stmt))) | |
e27482aa | 1629 | { |
75a70cf9 | 1630 | tree new_rhs; |
b236ac0e | 1631 | new_rhs = force_gimple_operand_gsi (&seq_gsi, |
567cd518 | 1632 | gimple_assign_rhs1 (stmt), |
09cfc275 | 1633 | true, NULL, false, |
1634 | GSI_CONTINUE_LINKING); | |
75a70cf9 | 1635 | gimple_assign_set_rhs1 (stmt, new_rhs); |
b236ac0e | 1636 | id->regimplify = false; |
75a70cf9 | 1637 | } |
5bfb60b4 | 1638 | |
b236ac0e | 1639 | gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT); |
1640 | ||
1641 | if (id->regimplify) | |
1642 | gimple_regimplify_operands (stmt, &seq_gsi); | |
1643 | ||
1644 | /* If copy_basic_block has been empty at the start of this iteration, | |
1645 | call gsi_start_bb again to get at the newly added statements. */ | |
1646 | if (gsi_end_p (copy_gsi)) | |
1647 | copy_gsi = gsi_start_bb (copy_basic_block); | |
1648 | else | |
1649 | gsi_next (&copy_gsi); | |
deff5ffd | 1650 | |
75a70cf9 | 1651 | /* Process the new statement. The call to gimple_regimplify_operands |
1652 | possibly turned the statement into multiple statements, we | |
1653 | need to process all of them. */ | |
b236ac0e | 1654 | do |
75a70cf9 | 1655 | { |
ccf4ab6b | 1656 | tree fn; |
1657 | ||
b236ac0e | 1658 | stmt = gsi_stmt (copy_gsi); |
75a70cf9 | 1659 | if (is_gimple_call (stmt) |
1660 | && gimple_call_va_arg_pack_p (stmt) | |
1661 | && id->gimple_call) | |
1662 | { | |
1663 | /* __builtin_va_arg_pack () should be replaced by | |
1664 | all arguments corresponding to ... in the caller. */ | |
1665 | tree p; | |
1666 | gimple new_call; | |
f1f41a6c | 1667 | vec<tree> argarray; |
75a70cf9 | 1668 | size_t nargs = gimple_call_num_args (id->gimple_call); |
1669 | size_t n; | |
1670 | ||
1767a056 | 1671 | for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p)) |
75a70cf9 | 1672 | nargs--; |
1673 | ||
1674 | /* Create the new array of arguments. */ | |
1675 | n = nargs + gimple_call_num_args (stmt); | |
f1f41a6c | 1676 | argarray.create (n); |
1677 | argarray.safe_grow_cleared (n); | |
75a70cf9 | 1678 | |
1679 | /* Copy all the arguments before '...' */ | |
f1f41a6c | 1680 | memcpy (argarray.address (), |
75a70cf9 | 1681 | gimple_call_arg_ptr (stmt, 0), |
1682 | gimple_call_num_args (stmt) * sizeof (tree)); | |
1683 | ||
1684 | /* Append the arguments passed in '...' */ | |
f1f41a6c | 1685 | memcpy (argarray.address () + gimple_call_num_args (stmt), |
75a70cf9 | 1686 | gimple_call_arg_ptr (id->gimple_call, 0) |
1687 | + (gimple_call_num_args (id->gimple_call) - nargs), | |
1688 | nargs * sizeof (tree)); | |
1689 | ||
1690 | new_call = gimple_build_call_vec (gimple_call_fn (stmt), | |
1691 | argarray); | |
1692 | ||
f1f41a6c | 1693 | argarray.release (); |
75a70cf9 | 1694 | |
1695 | /* Copy all GIMPLE_CALL flags, location and block, except | |
1696 | GF_CALL_VA_ARG_PACK. */ | |
1697 | gimple_call_copy_flags (new_call, stmt); | |
1698 | gimple_call_set_va_arg_pack (new_call, false); | |
1699 | gimple_set_location (new_call, gimple_location (stmt)); | |
1700 | gimple_set_block (new_call, gimple_block (stmt)); | |
1701 | gimple_call_set_lhs (new_call, gimple_call_lhs (stmt)); | |
1702 | ||
1703 | gsi_replace (&copy_gsi, new_call, false); | |
1704 | stmt = new_call; | |
1705 | } | |
1706 | else if (is_gimple_call (stmt) | |
1707 | && id->gimple_call | |
1708 | && (decl = gimple_call_fndecl (stmt)) | |
1709 | && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL | |
1710 | && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN) | |
9bfec7c2 | 1711 | { |
75a70cf9 | 1712 | /* __builtin_va_arg_pack_len () should be replaced by |
1713 | the number of anonymous arguments. */ | |
1714 | size_t nargs = gimple_call_num_args (id->gimple_call); | |
1715 | tree count, p; | |
1716 | gimple new_stmt; | |
1717 | ||
1767a056 | 1718 | for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p)) |
75a70cf9 | 1719 | nargs--; |
1720 | ||
1721 | count = build_int_cst (integer_type_node, nargs); | |
1722 | new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count); | |
1723 | gsi_replace (&copy_gsi, new_stmt, false); | |
1724 | stmt = new_stmt; | |
1725 | } | |
3e9045dd | 1726 | |
75a70cf9 | 1727 | /* Statements produced by inlining can be unfolded, especially |
1728 | when we constant propagated some operands. We can't fold | |
1729 | them right now for two reasons: | |
1730 | 1) folding requires SSA_NAME_DEF_STMTs to be correct | |
1731 | 2) we can't change function calls to builtins. | |
1732 | So we just mark statements for later folding. We mark | |
1733 | all new statements, instead of just statements that have changed | |
1734 | by some nontrivial substitution, so even statements made | |
1735 | foldable indirectly are updated. If this turns out to be | |
1736 | expensive, copy_body can be told to watch for nontrivial | |
1737 | changes. */ | |
1738 | if (id->statements_to_fold) | |
1739 | pointer_set_insert (id->statements_to_fold, stmt); | |
1740 | ||
1741 | /* We're duplicating a CALL_EXPR. Find any corresponding | |
1742 | callgraph edges and update or duplicate them. */ | |
1743 | if (is_gimple_call (stmt)) | |
1744 | { | |
da50fe8f | 1745 | struct cgraph_edge *edge; |
28efe441 | 1746 | int flags; |
48dc2227 | 1747 | |
75a70cf9 | 1748 | switch (id->transform_call_graph_edges) |
9bfec7c2 | 1749 | { |
da50fe8f | 1750 | case CB_CGE_DUPLICATE: |
1751 | edge = cgraph_edge (id->src_node, orig_stmt); | |
1752 | if (edge) | |
e2d3f422 | 1753 | { |
1754 | int edge_freq = edge->frequency; | |
4d044066 | 1755 | int new_freq; |
1756 | struct cgraph_edge *old_edge = edge; | |
e2d3f422 | 1757 | edge = cgraph_clone_edge (edge, id->dst_node, stmt, |
1758 | gimple_uid (stmt), | |
1759 | REG_BR_PROB_BASE, CGRAPH_FREQ_BASE, | |
0835ad03 | 1760 | true); |
e2d3f422 | 1761 | /* We could also just rescale the frequency, but |
1762 | doing so would introduce roundoff errors and make | |
1763 | verifier unhappy. */ | |
02774f2d | 1764 | new_freq = compute_call_stmt_bb_frequency (id->dst_node->decl, |
4d044066 | 1765 | copy_basic_block); |
1766 | ||
1767 | /* Speculative calls consist of two edges - direct and indirect. | |
1768 | Duplicate the whole thing and distribute frequencies accordingly. */ | |
1769 | if (edge->speculative) | |
e2d3f422 | 1770 | { |
4d044066 | 1771 | struct cgraph_edge *direct, *indirect; |
1772 | struct ipa_ref *ref; | |
1773 | ||
1774 | gcc_assert (!edge->indirect_unknown_callee); | |
1775 | cgraph_speculative_call_info (old_edge, direct, indirect, ref); | |
1776 | indirect = cgraph_clone_edge (indirect, id->dst_node, stmt, | |
1777 | gimple_uid (stmt), | |
1778 | REG_BR_PROB_BASE, CGRAPH_FREQ_BASE, | |
1779 | true); | |
1780 | if (old_edge->frequency + indirect->frequency) | |
1781 | { | |
1782 | edge->frequency = MIN (RDIV ((gcov_type)new_freq * old_edge->frequency, | |
1783 | (old_edge->frequency + indirect->frequency)), | |
1784 | CGRAPH_FREQ_MAX); | |
1785 | indirect->frequency = MIN (RDIV ((gcov_type)new_freq * indirect->frequency, | |
1786 | (old_edge->frequency + indirect->frequency)), | |
1787 | CGRAPH_FREQ_MAX); | |
1788 | } | |
02774f2d | 1789 | ipa_clone_ref (ref, id->dst_node, stmt); |
4d044066 | 1790 | } |
1791 | else | |
1792 | { | |
1793 | edge->frequency = new_freq; | |
1794 | if (dump_file | |
1795 | && profile_status_for_function (cfun) != PROFILE_ABSENT | |
1796 | && (edge_freq > edge->frequency + 10 | |
1797 | || edge_freq < edge->frequency - 10)) | |
1798 | { | |
1799 | fprintf (dump_file, "Edge frequency estimated by " | |
1800 | "cgraph %i diverge from inliner's estimate %i\n", | |
1801 | edge_freq, | |
1802 | edge->frequency); | |
1803 | fprintf (dump_file, | |
1804 | "Orig bb: %i, orig bb freq %i, new bb freq %i\n", | |
1805 | bb->index, | |
1806 | bb->frequency, | |
1807 | copy_basic_block->frequency); | |
1808 | } | |
e2d3f422 | 1809 | } |
1810 | } | |
da50fe8f | 1811 | break; |
1812 | ||
1813 | case CB_CGE_MOVE_CLONES: | |
1814 | cgraph_set_call_stmt_including_clones (id->dst_node, | |
1815 | orig_stmt, stmt); | |
1816 | edge = cgraph_edge (id->dst_node, stmt); | |
1817 | break; | |
1818 | ||
1819 | case CB_CGE_MOVE: | |
1820 | edge = cgraph_edge (id->dst_node, orig_stmt); | |
1821 | if (edge) | |
1822 | cgraph_set_call_stmt (edge, stmt); | |
1823 | break; | |
1824 | ||
1825 | default: | |
1826 | gcc_unreachable (); | |
deff5ffd | 1827 | } |
28efe441 | 1828 | |
da50fe8f | 1829 | /* Constant propagation on argument done during inlining |
1830 | may create a new direct call. Produce an edge for it. */ | |
48e1416a | 1831 | if ((!edge |
799c8711 | 1832 | || (edge->indirect_inlining_edge |
da50fe8f | 1833 | && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)) |
02774f2d | 1834 | && id->dst_node->definition |
da50fe8f | 1835 | && (fn = gimple_call_fndecl (stmt)) != NULL) |
1836 | { | |
fd6a3c41 | 1837 | struct cgraph_node *dest = cgraph_get_node (fn); |
da50fe8f | 1838 | |
1839 | /* We have a missing edge in the callgraph. This can happen | |
1840 | when previous inlining turned an indirect call into a | |
6d1cc52c | 1841 | direct call by constant propagating arguments or we are |
292233cd | 1842 | producing a dead clone (for further cloning). In all |
da50fe8f | 1843 | other cases we hit a bug (incorrect node sharing is the |
1844 | most common reason for missing edges). */ | |
02774f2d | 1845 | gcc_assert (!dest->definition |
1846 | || dest->address_taken | |
1847 | || !id->src_node->definition | |
1848 | || !id->dst_node->definition); | |
da50fe8f | 1849 | if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES) |
1850 | cgraph_create_edge_including_clones | |
ee3f5fc0 | 1851 | (id->dst_node, dest, orig_stmt, stmt, bb->count, |
02774f2d | 1852 | compute_call_stmt_bb_frequency (id->dst_node->decl, |
e2d3f422 | 1853 | copy_basic_block), |
0835ad03 | 1854 | CIF_ORIGINALLY_INDIRECT_CALL); |
da50fe8f | 1855 | else |
1856 | cgraph_create_edge (id->dst_node, dest, stmt, | |
ee3f5fc0 | 1857 | bb->count, |
1858 | compute_call_stmt_bb_frequency | |
02774f2d | 1859 | (id->dst_node->decl, |
7d0d0ce1 | 1860 | copy_basic_block))->inline_failed |
da50fe8f | 1861 | = CIF_ORIGINALLY_INDIRECT_CALL; |
1862 | if (dump_file) | |
1863 | { | |
b06ab5fa | 1864 | fprintf (dump_file, "Created new direct edge to %s\n", |
f1c8b4d7 | 1865 | dest->name ()); |
da50fe8f | 1866 | } |
1867 | } | |
ccf4ab6b | 1868 | |
28efe441 | 1869 | flags = gimple_call_flags (stmt); |
28efe441 | 1870 | if (flags & ECF_MAY_BE_ALLOCA) |
1871 | cfun->calls_alloca = true; | |
1872 | if (flags & ECF_RETURNS_TWICE) | |
1873 | cfun->calls_setjmp = true; | |
75a70cf9 | 1874 | } |
e27482aa | 1875 | |
e38def9c | 1876 | maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt, |
1877 | id->eh_map, id->eh_lp_nr); | |
75a70cf9 | 1878 | |
9845d120 | 1879 | if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt)) |
75a70cf9 | 1880 | { |
1881 | ssa_op_iter i; | |
1882 | tree def; | |
1883 | ||
75a70cf9 | 1884 | FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF) |
1885 | if (TREE_CODE (def) == SSA_NAME) | |
1886 | SSA_NAME_DEF_STMT (def) = stmt; | |
1887 | } | |
1888 | ||
1889 | gsi_next (&copy_gsi); | |
e27482aa | 1890 | } |
b236ac0e | 1891 | while (!gsi_end_p (copy_gsi)); |
75a70cf9 | 1892 | |
1893 | copy_gsi = gsi_last_bb (copy_basic_block); | |
e27482aa | 1894 | } |
75a70cf9 | 1895 | |
e27482aa | 1896 | return copy_basic_block; |
1897 | } | |
1898 | ||
deff5ffd | 1899 | /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA |
1900 | form is quite easy, since dominator relationship for old basic blocks does | |
1901 | not change. | |
1902 | ||
1903 | There is, however, an exception where inlining might change dominator relations | |
1904 | across EH edges from basic blocks within inlined functions leading | |
060a1cf3 | 1905 | to landing pads in the function we inline into. |
deff5ffd | 1906 | |
fd71b542 | 1907 | The function fills in PHI_RESULTs of such PHI nodes if they refer |
1908 | to gimple regs. Otherwise, the function marks PHI_RESULT of such | |
1909 | PHI nodes for renaming. For non-gimple regs, renaming is safe: the | |
1910 | EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be | |
1911 | set, and this means that there will be no overlapping live ranges | |
deff5ffd | 1912 | for the underlying symbol. |
1913 | ||
1914 | This might change in the future if we allow redirecting of EH edges and | |
1915 | we might want to change the way we build the CFG pre-inlining to include | |
1916 | all the possible edges then. */ | |
1917 | static void | |
fd71b542 | 1918 | update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb, |
1919 | bool can_throw, bool nonlocal_goto) | |
deff5ffd | 1920 | { |
1921 | edge e; | |
1922 | edge_iterator ei; | |
1923 | ||
1924 | FOR_EACH_EDGE (e, ei, bb->succs) | |
1925 | if (!e->dest->aux | |
1926 | || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK) | |
1927 | { | |
75a70cf9 | 1928 | gimple phi; |
1929 | gimple_stmt_iterator si; | |
deff5ffd | 1930 | |
fd71b542 | 1931 | if (!nonlocal_goto) |
1932 | gcc_assert (e->flags & EDGE_EH); | |
75a70cf9 | 1933 | |
fd71b542 | 1934 | if (!can_throw) |
1935 | gcc_assert (!(e->flags & EDGE_EH)); | |
75a70cf9 | 1936 | |
1937 | for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si)) | |
deff5ffd | 1938 | { |
fd71b542 | 1939 | edge re; |
1940 | ||
75a70cf9 | 1941 | phi = gsi_stmt (si); |
1942 | ||
3621f68e | 1943 | /* For abnormal goto/call edges the receiver can be the |
1944 | ENTRY_BLOCK. Do not assert this cannot happen. */ | |
fd71b542 | 1945 | |
3d1eacdb | 1946 | gcc_assert ((e->flags & EDGE_EH) |
1947 | || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi))); | |
fd71b542 | 1948 | |
fd71b542 | 1949 | re = find_edge (ret_bb, e->dest); |
e2a6b9da | 1950 | gcc_checking_assert (re); |
fd71b542 | 1951 | gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL)) |
1952 | == (e->flags & (EDGE_EH | EDGE_ABNORMAL))); | |
1953 | ||
1954 | SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e), | |
1955 | USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re))); | |
deff5ffd | 1956 | } |
1957 | } | |
1958 | } | |
1959 | ||
75a70cf9 | 1960 | |
c78cbec8 | 1961 | /* Copy edges from BB into its copy constructed earlier, scale profile |
1962 | accordingly. Edges will be taken care of later. Assume aux | |
39a98435 | 1963 | pointers to point to the copies of each BB. Return true if any |
1964 | debug stmts are left after a statement that must end the basic block. */ | |
75a70cf9 | 1965 | |
39a98435 | 1966 | static bool |
5f0af0d8 | 1967 | copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb, |
1968 | bool can_make_abnormal_goto) | |
e27482aa | 1969 | { |
a9c6c0e3 | 1970 | basic_block new_bb = (basic_block) bb->aux; |
e27482aa | 1971 | edge_iterator ei; |
1972 | edge old_edge; | |
75a70cf9 | 1973 | gimple_stmt_iterator si; |
e27482aa | 1974 | int flags; |
39a98435 | 1975 | bool need_debug_cleanup = false; |
e27482aa | 1976 | |
1977 | /* Use the indices from the original blocks to create edges for the | |
1978 | new ones. */ | |
1979 | FOR_EACH_EDGE (old_edge, ei, bb->succs) | |
9bfec7c2 | 1980 | if (!(old_edge->flags & EDGE_EH)) |
1981 | { | |
f4e36c33 | 1982 | edge new_edge; |
e27482aa | 1983 | |
9bfec7c2 | 1984 | flags = old_edge->flags; |
e27482aa | 1985 | |
9bfec7c2 | 1986 | /* Return edges do get a FALLTHRU flag when they get inlined. */ |
1987 | if (old_edge->dest->index == EXIT_BLOCK && !old_edge->flags | |
34154e27 | 1988 | && old_edge->dest->aux != EXIT_BLOCK_PTR_FOR_FN (cfun)) |
9bfec7c2 | 1989 | flags |= EDGE_FALLTHRU; |
f4e36c33 | 1990 | new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags); |
70074000 | 1991 | new_edge->count = apply_scale (old_edge->count, count_scale); |
f4e36c33 | 1992 | new_edge->probability = old_edge->probability; |
9bfec7c2 | 1993 | } |
e27482aa | 1994 | |
1995 | if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK) | |
39a98435 | 1996 | return false; |
e27482aa | 1997 | |
75a70cf9 | 1998 | for (si = gsi_start_bb (new_bb); !gsi_end_p (si);) |
e27482aa | 1999 | { |
75a70cf9 | 2000 | gimple copy_stmt; |
fd71b542 | 2001 | bool can_throw, nonlocal_goto; |
e27482aa | 2002 | |
75a70cf9 | 2003 | copy_stmt = gsi_stmt (si); |
9845d120 | 2004 | if (!is_gimple_debug (copy_stmt)) |
a7745367 | 2005 | update_stmt (copy_stmt); |
75a70cf9 | 2006 | |
e27482aa | 2007 | /* Do this before the possible split_block. */ |
75a70cf9 | 2008 | gsi_next (&si); |
e27482aa | 2009 | |
2010 | /* If this tree could throw an exception, there are two | |
2011 | cases where we need to add abnormal edge(s): the | |
2012 | tree wasn't in a region and there is a "current | |
2013 | region" in the caller; or the original tree had | |
2014 | EH edges. In both cases split the block after the tree, | |
2015 | and add abnormal edge(s) as needed; we need both | |
2016 | those from the callee and the caller. | |
2017 | We check whether the copy can throw, because the const | |
2018 | propagation can change an INDIRECT_REF which throws | |
2019 | into a COMPONENT_REF which doesn't. If the copy | |
2020 | can throw, the original could also throw. */ | |
75a70cf9 | 2021 | can_throw = stmt_can_throw_internal (copy_stmt); |
caf1e632 | 2022 | nonlocal_goto = stmt_can_make_abnormal_goto (copy_stmt); |
fd71b542 | 2023 | |
2024 | if (can_throw || nonlocal_goto) | |
e27482aa | 2025 | { |
39a98435 | 2026 | if (!gsi_end_p (si)) |
2027 | { | |
2028 | while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si))) | |
2029 | gsi_next (&si); | |
2030 | if (gsi_end_p (si)) | |
2031 | need_debug_cleanup = true; | |
2032 | } | |
75a70cf9 | 2033 | if (!gsi_end_p (si)) |
e27482aa | 2034 | /* Note that bb's predecessor edges aren't necessarily |
2035 | right at this point; split_block doesn't care. */ | |
2036 | { | |
2037 | edge e = split_block (new_bb, copy_stmt); | |
deff5ffd | 2038 | |
e27482aa | 2039 | new_bb = e->dest; |
deff5ffd | 2040 | new_bb->aux = e->src->aux; |
75a70cf9 | 2041 | si = gsi_start_bb (new_bb); |
e27482aa | 2042 | } |
fd71b542 | 2043 | } |
e27482aa | 2044 | |
e38def9c | 2045 | if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH) |
2046 | make_eh_dispatch_edges (copy_stmt); | |
2047 | else if (can_throw) | |
fd71b542 | 2048 | make_eh_edges (copy_stmt); |
deff5ffd | 2049 | |
caf1e632 | 2050 | /* If the call we inline cannot make abnormal goto do not add |
2051 | additional abnormal edges but only retain those already present | |
2052 | in the original function body. */ | |
2053 | nonlocal_goto &= can_make_abnormal_goto; | |
fd71b542 | 2054 | if (nonlocal_goto) |
75a70cf9 | 2055 | make_abnormal_goto_edges (gimple_bb (copy_stmt), true); |
fd71b542 | 2056 | |
2057 | if ((can_throw || nonlocal_goto) | |
2058 | && gimple_in_ssa_p (cfun)) | |
75a70cf9 | 2059 | update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb, |
fd71b542 | 2060 | can_throw, nonlocal_goto); |
deff5ffd | 2061 | } |
39a98435 | 2062 | return need_debug_cleanup; |
deff5ffd | 2063 | } |
2064 | ||
2065 | /* Copy the PHIs. All blocks and edges are copied, some blocks | |
2066 | were possibly split and new outgoing EH edges inserted. | |
2067 | BB points to the block of the original function and AUX pointers link | |
2068 | the original and newly copied blocks. */ | |
2069 | ||
2070 | static void | |
2071 | copy_phis_for_bb (basic_block bb, copy_body_data *id) | |
2072 | { | |
45ba1503 | 2073 | basic_block const new_bb = (basic_block) bb->aux; |
deff5ffd | 2074 | edge_iterator ei; |
75a70cf9 | 2075 | gimple phi; |
2076 | gimple_stmt_iterator si; | |
10f8ddfc | 2077 | edge new_edge; |
2078 | bool inserted = false; | |
deff5ffd | 2079 | |
e3a19533 | 2080 | for (si = gsi_start_phis (bb); !gsi_end_p (si); gsi_next (&si)) |
deff5ffd | 2081 | { |
75a70cf9 | 2082 | tree res, new_res; |
2083 | gimple new_phi; | |
deff5ffd | 2084 | |
75a70cf9 | 2085 | phi = gsi_stmt (si); |
2086 | res = PHI_RESULT (phi); | |
2087 | new_res = res; | |
7c782c9b | 2088 | if (!virtual_operand_p (res)) |
deff5ffd | 2089 | { |
75a70cf9 | 2090 | walk_tree (&new_res, copy_tree_body_r, id, NULL); |
9c06f260 | 2091 | new_phi = create_phi_node (new_res, new_bb); |
deff5ffd | 2092 | FOR_EACH_EDGE (new_edge, ei, new_bb->preds) |
2093 | { | |
6a69e813 | 2094 | edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb); |
2095 | tree arg; | |
2096 | tree new_arg; | |
6a69e813 | 2097 | edge_iterator ei2; |
5169661d | 2098 | location_t locus; |
6a69e813 | 2099 | |
292233cd | 2100 | /* When doing partial cloning, we allow PHIs on the entry block |
6a69e813 | 2101 | as long as all the arguments are the same. Find any input |
2102 | edge to see argument to copy. */ | |
2103 | if (!old_edge) | |
2104 | FOR_EACH_EDGE (old_edge, ei2, bb->preds) | |
2105 | if (!old_edge->src->aux) | |
2106 | break; | |
2107 | ||
2108 | arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge); | |
2109 | new_arg = arg; | |
75a70cf9 | 2110 | walk_tree (&new_arg, copy_tree_body_r, id, NULL); |
deff5ffd | 2111 | gcc_assert (new_arg); |
9915e061 | 2112 | /* With return slot optimization we can end up with |
2113 | non-gimple (foo *)&this->m, fix that here. */ | |
2114 | if (TREE_CODE (new_arg) != SSA_NAME | |
2115 | && TREE_CODE (new_arg) != FUNCTION_DECL | |
2116 | && !is_gimple_val (new_arg)) | |
2117 | { | |
75a70cf9 | 2118 | gimple_seq stmts = NULL; |
2119 | new_arg = force_gimple_operand (new_arg, &stmts, true, NULL); | |
10f8ddfc | 2120 | gsi_insert_seq_on_edge (new_edge, stmts); |
2121 | inserted = true; | |
9915e061 | 2122 | } |
5169661d | 2123 | locus = gimple_phi_arg_location_from_edge (phi, old_edge); |
5169661d | 2124 | if (LOCATION_BLOCK (locus)) |
2125 | { | |
2126 | tree *n; | |
2127 | n = (tree *) pointer_map_contains (id->decl_map, | |
2128 | LOCATION_BLOCK (locus)); | |
2129 | gcc_assert (n); | |
2884d265 | 2130 | if (*n) |
2131 | locus = COMBINE_LOCATION_DATA (line_table, locus, *n); | |
2132 | else | |
2133 | locus = LOCATION_LOCUS (locus); | |
5169661d | 2134 | } |
688b0b5b | 2135 | else |
2136 | locus = LOCATION_LOCUS (locus); | |
5169661d | 2137 | |
688b0b5b | 2138 | add_phi_arg (new_phi, new_arg, new_edge, locus); |
deff5ffd | 2139 | } |
e27482aa | 2140 | } |
2141 | } | |
10f8ddfc | 2142 | |
2143 | /* Commit the delayed edge insertions. */ | |
2144 | if (inserted) | |
2145 | FOR_EACH_EDGE (new_edge, ei, new_bb->preds) | |
2146 | gsi_commit_one_edge_insert (new_edge, NULL); | |
e27482aa | 2147 | } |
2148 | ||
75a70cf9 | 2149 | |
e27482aa | 2150 | /* Wrapper for remap_decl so it can be used as a callback. */ |
75a70cf9 | 2151 | |
e27482aa | 2152 | static tree |
2153 | remap_decl_1 (tree decl, void *data) | |
2154 | { | |
51a48c27 | 2155 | return remap_decl (decl, (copy_body_data *) data); |
e27482aa | 2156 | } |
2157 | ||
deff5ffd | 2158 | /* Build struct function and associated datastructures for the new clone |
9078126c | 2159 | NEW_FNDECL to be built. CALLEE_FNDECL is the original. Function changes |
2160 | the cfun to the function of new_fndecl (and current_function_decl too). */ | |
deff5ffd | 2161 | |
2162 | static void | |
e2d3f422 | 2163 | initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count) |
deff5ffd | 2164 | { |
deff5ffd | 2165 | struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl); |
e2d3f422 | 2166 | gcov_type count_scale; |
deff5ffd | 2167 | |
79e830ee | 2168 | if (!DECL_ARGUMENTS (new_fndecl)) |
2169 | DECL_ARGUMENTS (new_fndecl) = DECL_ARGUMENTS (callee_fndecl); | |
2170 | if (!DECL_RESULT (new_fndecl)) | |
2171 | DECL_RESULT (new_fndecl) = DECL_RESULT (callee_fndecl); | |
2172 | ||
34154e27 | 2173 | if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count) |
70074000 | 2174 | count_scale |
2175 | = GCOV_COMPUTE_SCALE (count, | |
34154e27 | 2176 | ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count); |
deff5ffd | 2177 | else |
e2d3f422 | 2178 | count_scale = REG_BR_PROB_BASE; |
deff5ffd | 2179 | |
2180 | /* Register specific tree functions. */ | |
75a70cf9 | 2181 | gimple_register_cfg_hooks (); |
1a1a827a | 2182 | |
2183 | /* Get clean struct function. */ | |
2184 | push_struct_function (new_fndecl); | |
2185 | ||
2186 | /* We will rebuild these, so just sanity check that they are empty. */ | |
2187 | gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL); | |
2188 | gcc_assert (cfun->local_decls == NULL); | |
2189 | gcc_assert (cfun->cfg == NULL); | |
2190 | gcc_assert (cfun->decl == new_fndecl); | |
2191 | ||
292233cd | 2192 | /* Copy items we preserve during cloning. */ |
1a1a827a | 2193 | cfun->static_chain_decl = src_cfun->static_chain_decl; |
2194 | cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area; | |
2195 | cfun->function_end_locus = src_cfun->function_end_locus; | |
f6568ea4 | 2196 | cfun->curr_properties = src_cfun->curr_properties; |
1a1a827a | 2197 | cfun->last_verified = src_cfun->last_verified; |
1a1a827a | 2198 | cfun->va_list_gpr_size = src_cfun->va_list_gpr_size; |
2199 | cfun->va_list_fpr_size = src_cfun->va_list_fpr_size; | |
1a1a827a | 2200 | cfun->has_nonlocal_label = src_cfun->has_nonlocal_label; |
2201 | cfun->stdarg = src_cfun->stdarg; | |
1a1a827a | 2202 | cfun->after_inlining = src_cfun->after_inlining; |
cbeb677e | 2203 | cfun->can_throw_non_call_exceptions |
2204 | = src_cfun->can_throw_non_call_exceptions; | |
39e8019f | 2205 | cfun->can_delete_dead_exceptions = src_cfun->can_delete_dead_exceptions; |
1a1a827a | 2206 | cfun->returns_struct = src_cfun->returns_struct; |
2207 | cfun->returns_pcc_struct = src_cfun->returns_pcc_struct; | |
1a1a827a | 2208 | |
deff5ffd | 2209 | init_empty_tree_cfg (); |
2210 | ||
e2d3f422 | 2211 | profile_status_for_function (cfun) = profile_status_for_function (src_cfun); |
34154e27 | 2212 | ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = |
2213 | (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale / | |
deff5ffd | 2214 | REG_BR_PROB_BASE); |
34154e27 | 2215 | ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency |
2216 | = ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->frequency; | |
2217 | EXIT_BLOCK_PTR_FOR_FN (cfun)->count = | |
2218 | (EXIT_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale / | |
deff5ffd | 2219 | REG_BR_PROB_BASE); |
34154e27 | 2220 | EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency = |
2221 | EXIT_BLOCK_PTR_FOR_FN (src_cfun)->frequency; | |
deff5ffd | 2222 | if (src_cfun->eh) |
2223 | init_eh_for_function (); | |
2224 | ||
2225 | if (src_cfun->gimple_df) | |
2226 | { | |
bcaa2770 | 2227 | init_tree_ssa (cfun); |
deff5ffd | 2228 | cfun->gimple_df->in_ssa_p = true; |
5084b2e4 | 2229 | init_ssa_operands (cfun); |
deff5ffd | 2230 | } |
deff5ffd | 2231 | } |
2232 | ||
39a98435 | 2233 | /* Helper function for copy_cfg_body. Move debug stmts from the end |
2234 | of NEW_BB to the beginning of successor basic blocks when needed. If the | |
2235 | successor has multiple predecessors, reset them, otherwise keep | |
2236 | their value. */ | |
2237 | ||
2238 | static void | |
2239 | maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb) | |
2240 | { | |
2241 | edge e; | |
2242 | edge_iterator ei; | |
2243 | gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb); | |
2244 | ||
2245 | if (gsi_end_p (si) | |
2246 | || gsi_one_before_end_p (si) | |
2247 | || !(stmt_can_throw_internal (gsi_stmt (si)) | |
2248 | || stmt_can_make_abnormal_goto (gsi_stmt (si)))) | |
2249 | return; | |
2250 | ||
2251 | FOR_EACH_EDGE (e, ei, new_bb->succs) | |
2252 | { | |
2253 | gimple_stmt_iterator ssi = gsi_last_bb (new_bb); | |
2254 | gimple_stmt_iterator dsi = gsi_after_labels (e->dest); | |
2255 | while (is_gimple_debug (gsi_stmt (ssi))) | |
2256 | { | |
2257 | gimple stmt = gsi_stmt (ssi), new_stmt; | |
2258 | tree var; | |
2259 | tree value; | |
2260 | ||
2261 | /* For the last edge move the debug stmts instead of copying | |
2262 | them. */ | |
2263 | if (ei_one_before_end_p (ei)) | |
2264 | { | |
2265 | si = ssi; | |
2266 | gsi_prev (&ssi); | |
841424cc | 2267 | if (!single_pred_p (e->dest) && gimple_debug_bind_p (stmt)) |
39a98435 | 2268 | gimple_debug_bind_reset_value (stmt); |
2269 | gsi_remove (&si, false); | |
2270 | gsi_insert_before (&dsi, stmt, GSI_SAME_STMT); | |
2271 | continue; | |
2272 | } | |
2273 | ||
841424cc | 2274 | if (gimple_debug_bind_p (stmt)) |
39a98435 | 2275 | { |
841424cc | 2276 | var = gimple_debug_bind_get_var (stmt); |
2277 | if (single_pred_p (e->dest)) | |
2278 | { | |
2279 | value = gimple_debug_bind_get_value (stmt); | |
2280 | value = unshare_expr (value); | |
2281 | } | |
2282 | else | |
2283 | value = NULL_TREE; | |
2284 | new_stmt = gimple_build_debug_bind (var, value, stmt); | |
2285 | } | |
2286 | else if (gimple_debug_source_bind_p (stmt)) | |
2287 | { | |
2288 | var = gimple_debug_source_bind_get_var (stmt); | |
2289 | value = gimple_debug_source_bind_get_value (stmt); | |
2290 | new_stmt = gimple_build_debug_source_bind (var, value, stmt); | |
39a98435 | 2291 | } |
2292 | else | |
841424cc | 2293 | gcc_unreachable (); |
39a98435 | 2294 | gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT); |
f1f41a6c | 2295 | id->debug_stmts.safe_push (new_stmt); |
39a98435 | 2296 | gsi_prev (&ssi); |
2297 | } | |
2298 | } | |
2299 | } | |
2300 | ||
f6568ea4 | 2301 | /* Make a copy of the sub-loops of SRC_PARENT and place them |
2302 | as siblings of DEST_PARENT. */ | |
2303 | ||
2304 | static void | |
84cb1020 | 2305 | copy_loops (copy_body_data *id, |
f6568ea4 | 2306 | struct loop *dest_parent, struct loop *src_parent) |
2307 | { | |
2308 | struct loop *src_loop = src_parent->inner; | |
2309 | while (src_loop) | |
2310 | { | |
84cb1020 | 2311 | if (!id->blocks_to_copy |
2312 | || bitmap_bit_p (id->blocks_to_copy, src_loop->header->index)) | |
f6568ea4 | 2313 | { |
2314 | struct loop *dest_loop = alloc_loop (); | |
2315 | ||
2316 | /* Assign the new loop its header and latch and associate | |
2317 | those with the new loop. */ | |
92b43d63 | 2318 | if (src_loop->header != NULL) |
2319 | { | |
2320 | dest_loop->header = (basic_block)src_loop->header->aux; | |
2321 | dest_loop->header->loop_father = dest_loop; | |
2322 | } | |
f6568ea4 | 2323 | if (src_loop->latch != NULL) |
2324 | { | |
2325 | dest_loop->latch = (basic_block)src_loop->latch->aux; | |
2326 | dest_loop->latch->loop_father = dest_loop; | |
2327 | } | |
2328 | ||
2329 | /* Copy loop meta-data. */ | |
2330 | copy_loop_info (src_loop, dest_loop); | |
2331 | ||
2332 | /* Finally place it into the loop array and the loop tree. */ | |
41f75a99 | 2333 | place_new_loop (cfun, dest_loop); |
f6568ea4 | 2334 | flow_loop_tree_node_add (dest_parent, dest_loop); |
2335 | ||
84cb1020 | 2336 | if (src_loop->simduid) |
2337 | { | |
2338 | dest_loop->simduid = remap_decl (src_loop->simduid, id); | |
2339 | cfun->has_simduid_loops = true; | |
2340 | } | |
2341 | if (src_loop->force_vect) | |
2342 | { | |
2343 | dest_loop->force_vect = true; | |
2344 | cfun->has_force_vect_loops = true; | |
2345 | } | |
2346 | ||
f6568ea4 | 2347 | /* Recurse. */ |
84cb1020 | 2348 | copy_loops (id, dest_loop, src_loop); |
f6568ea4 | 2349 | } |
2350 | src_loop = src_loop->next; | |
2351 | } | |
2352 | } | |
2353 | ||
4d044066 | 2354 | /* Call cgraph_redirect_edge_call_stmt_to_callee on all calls in BB */ |
2355 | ||
2356 | void | |
2357 | redirect_all_calls (copy_body_data * id, basic_block bb) | |
2358 | { | |
2359 | gimple_stmt_iterator si; | |
2360 | for (si = gsi_start_bb (bb); !gsi_end_p (si); gsi_next (&si)) | |
2361 | { | |
2362 | if (is_gimple_call (gsi_stmt (si))) | |
2363 | { | |
2364 | struct cgraph_edge *edge = cgraph_edge (id->dst_node, gsi_stmt (si)); | |
2365 | if (edge) | |
2366 | cgraph_redirect_edge_call_stmt_to_callee (edge); | |
2367 | } | |
2368 | } | |
2369 | } | |
2370 | ||
38a65d4e | 2371 | /* Convert estimated frequencies into counts for NODE, scaling COUNT |
2372 | with each bb's frequency. Used when NODE has a 0-weight entry | |
2373 | but we are about to inline it into a non-zero count call bb. | |
2374 | See the comments for handle_missing_profiles() in predict.c for | |
2375 | when this can happen for COMDATs. */ | |
2376 | ||
2377 | void | |
2378 | freqs_to_counts (struct cgraph_node *node, gcov_type count) | |
2379 | { | |
2380 | basic_block bb; | |
2381 | edge_iterator ei; | |
2382 | edge e; | |
2383 | struct function *fn = DECL_STRUCT_FUNCTION (node->decl); | |
2384 | ||
2385 | FOR_ALL_BB_FN(bb, fn) | |
2386 | { | |
2387 | bb->count = apply_scale (count, | |
2388 | GCOV_COMPUTE_SCALE (bb->frequency, BB_FREQ_MAX)); | |
2389 | FOR_EACH_EDGE (e, ei, bb->succs) | |
2390 | e->count = apply_probability (e->src->count, e->probability); | |
2391 | } | |
2392 | } | |
2393 | ||
e27482aa | 2394 | /* Make a copy of the body of FN so that it can be inserted inline in |
2395 | another function. Walks FN via CFG, returns new fndecl. */ | |
2396 | ||
2397 | static tree | |
e2d3f422 | 2398 | copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale, |
b06ab5fa | 2399 | basic_block entry_block_map, basic_block exit_block_map, |
84cb1020 | 2400 | basic_block new_entry) |
e27482aa | 2401 | { |
51a48c27 | 2402 | tree callee_fndecl = id->src_fn; |
e27482aa | 2403 | /* Original cfun for the callee, doesn't change. */ |
51a48c27 | 2404 | struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl); |
deff5ffd | 2405 | struct function *cfun_to_copy; |
e27482aa | 2406 | basic_block bb; |
2407 | tree new_fndecl = NULL; | |
39a98435 | 2408 | bool need_debug_cleanup = false; |
e2d3f422 | 2409 | gcov_type count_scale; |
deff5ffd | 2410 | int last; |
292233cd | 2411 | int incoming_frequency = 0; |
2412 | gcov_type incoming_count = 0; | |
e27482aa | 2413 | |
38a65d4e | 2414 | /* This can happen for COMDAT routines that end up with 0 counts |
2415 | despite being called (see the comments for handle_missing_profiles() | |
2416 | in predict.c as to why). Apply counts to the blocks in the callee | |
2417 | before inlining, using the guessed edge frequencies, so that we don't | |
2418 | end up with a 0-count inline body which can confuse downstream | |
2419 | optimizations such as function splitting. */ | |
34154e27 | 2420 | if (!ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count && count) |
38a65d4e | 2421 | { |
2422 | /* Apply the larger of the call bb count and the total incoming | |
2423 | call edge count to the callee. */ | |
2424 | gcov_type in_count = 0; | |
2425 | struct cgraph_edge *in_edge; | |
2426 | for (in_edge = id->src_node->callers; in_edge; | |
2427 | in_edge = in_edge->next_caller) | |
2428 | in_count += in_edge->count; | |
2429 | freqs_to_counts (id->src_node, count > in_count ? count : in_count); | |
2430 | } | |
2431 | ||
34154e27 | 2432 | if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count) |
70074000 | 2433 | count_scale |
2434 | = GCOV_COMPUTE_SCALE (count, | |
34154e27 | 2435 | ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count); |
e27482aa | 2436 | else |
e2d3f422 | 2437 | count_scale = REG_BR_PROB_BASE; |
e27482aa | 2438 | |
2439 | /* Register specific tree functions. */ | |
75a70cf9 | 2440 | gimple_register_cfg_hooks (); |
e27482aa | 2441 | |
efee62d1 | 2442 | /* If we are inlining just region of the function, make sure to connect |
2443 | new entry to ENTRY_BLOCK_PTR_FOR_FN (cfun). Since new entry can be | |
2444 | part of loop, we must compute frequency and probability of | |
2445 | ENTRY_BLOCK_PTR_FOR_FN (cfun) based on the frequencies and | |
292233cd | 2446 | probabilities of edges incoming from nonduplicated region. */ |
555e8b05 | 2447 | if (new_entry) |
2448 | { | |
2449 | edge e; | |
2450 | edge_iterator ei; | |
2451 | ||
2452 | FOR_EACH_EDGE (e, ei, new_entry->preds) | |
2453 | if (!e->src->aux) | |
2454 | { | |
292233cd | 2455 | incoming_frequency += EDGE_FREQUENCY (e); |
2456 | incoming_count += e->count; | |
555e8b05 | 2457 | } |
70074000 | 2458 | incoming_count = apply_scale (incoming_count, count_scale); |
292233cd | 2459 | incoming_frequency |
70074000 | 2460 | = apply_scale ((gcov_type)incoming_frequency, frequency_scale); |
34154e27 | 2461 | ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = incoming_count; |
2462 | ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency = incoming_frequency; | |
555e8b05 | 2463 | } |
2464 | ||
e27482aa | 2465 | /* Must have a CFG here at this point. */ |
34154e27 | 2466 | gcc_assert (ENTRY_BLOCK_PTR_FOR_FN |
e27482aa | 2467 | (DECL_STRUCT_FUNCTION (callee_fndecl))); |
2468 | ||
deff5ffd | 2469 | cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl); |
2470 | ||
34154e27 | 2471 | ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = entry_block_map; |
2472 | EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = exit_block_map; | |
2473 | entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy); | |
2474 | exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy); | |
e27482aa | 2475 | |
e27482aa | 2476 | /* Duplicate any exception-handling regions. */ |
2477 | if (cfun->eh) | |
e38def9c | 2478 | id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr, |
2479 | remap_decl_1, id); | |
75a70cf9 | 2480 | |
e27482aa | 2481 | /* Use aux pointers to map the original blocks to copy. */ |
2482 | FOR_EACH_BB_FN (bb, cfun_to_copy) | |
84cb1020 | 2483 | if (!id->blocks_to_copy || bitmap_bit_p (id->blocks_to_copy, bb->index)) |
b06ab5fa | 2484 | { |
2485 | basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale); | |
2486 | bb->aux = new_bb; | |
2487 | new_bb->aux = bb; | |
f6568ea4 | 2488 | new_bb->loop_father = entry_block_map->loop_father; |
b06ab5fa | 2489 | } |
deff5ffd | 2490 | |
944cca50 | 2491 | last = last_basic_block; |
75a70cf9 | 2492 | |
e27482aa | 2493 | /* Now that we've duplicated the blocks, duplicate their edges. */ |
5f0af0d8 | 2494 | bool can_make_abormal_goto |
2495 | = id->gimple_call && stmt_can_make_abnormal_goto (id->gimple_call); | |
e27482aa | 2496 | FOR_ALL_BB_FN (bb, cfun_to_copy) |
84cb1020 | 2497 | if (!id->blocks_to_copy |
2498 | || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index))) | |
5f0af0d8 | 2499 | need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map, |
2500 | can_make_abormal_goto); | |
75a70cf9 | 2501 | |
b06ab5fa | 2502 | if (new_entry) |
deff5ffd | 2503 | { |
555e8b05 | 2504 | edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU); |
b06ab5fa | 2505 | e->probability = REG_BR_PROB_BASE; |
292233cd | 2506 | e->count = incoming_count; |
deff5ffd | 2507 | } |
75a70cf9 | 2508 | |
f6568ea4 | 2509 | /* Duplicate the loop tree, if available and wanted. */ |
41f75a99 | 2510 | if (loops_for_fn (src_cfun) != NULL |
f6568ea4 | 2511 | && current_loops != NULL) |
2512 | { | |
84cb1020 | 2513 | copy_loops (id, entry_block_map->loop_father, |
41f75a99 | 2514 | get_loop (src_cfun, 0)); |
f6568ea4 | 2515 | /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */ |
2516 | loops_state_set (LOOPS_NEED_FIXUP); | |
2517 | } | |
2518 | ||
92b43d63 | 2519 | /* If the loop tree in the source function needed fixup, mark the |
2520 | destination loop tree for fixup, too. */ | |
2521 | if (loops_for_fn (src_cfun)->state & LOOPS_NEED_FIXUP) | |
2522 | loops_state_set (LOOPS_NEED_FIXUP); | |
2523 | ||
6a69e813 | 2524 | if (gimple_in_ssa_p (cfun)) |
2525 | FOR_ALL_BB_FN (bb, cfun_to_copy) | |
84cb1020 | 2526 | if (!id->blocks_to_copy |
2527 | || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index))) | |
6a69e813 | 2528 | copy_phis_for_bb (bb, id); |
2529 | ||
b06ab5fa | 2530 | FOR_ALL_BB_FN (bb, cfun_to_copy) |
2531 | if (bb->aux) | |
2532 | { | |
2533 | if (need_debug_cleanup | |
2534 | && bb->index != ENTRY_BLOCK | |
2535 | && bb->index != EXIT_BLOCK) | |
2536 | maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux); | |
4d044066 | 2537 | /* Update call edge destinations. This can not be done before loop |
2538 | info is updated, because we may split basic blocks. */ | |
2539 | if (id->transform_call_graph_edges == CB_CGE_DUPLICATE) | |
2540 | redirect_all_calls (id, (basic_block)bb->aux); | |
b06ab5fa | 2541 | ((basic_block)bb->aux)->aux = NULL; |
2542 | bb->aux = NULL; | |
2543 | } | |
2544 | ||
deff5ffd | 2545 | /* Zero out AUX fields of newly created block during EH edge |
2546 | insertion. */ | |
944cca50 | 2547 | for (; last < last_basic_block; last++) |
39a98435 | 2548 | { |
2549 | if (need_debug_cleanup) | |
2550 | maybe_move_debug_stmts_to_successors (id, BASIC_BLOCK (last)); | |
2551 | BASIC_BLOCK (last)->aux = NULL; | |
4d044066 | 2552 | /* Update call edge destinations. This can not be done before loop |
2553 | info is updated, because we may split basic blocks. */ | |
2554 | if (id->transform_call_graph_edges == CB_CGE_DUPLICATE) | |
2555 | redirect_all_calls (id, BASIC_BLOCK (last)); | |
39a98435 | 2556 | } |
deff5ffd | 2557 | entry_block_map->aux = NULL; |
2558 | exit_block_map->aux = NULL; | |
e27482aa | 2559 | |
e38def9c | 2560 | if (id->eh_map) |
2561 | { | |
2562 | pointer_map_destroy (id->eh_map); | |
2563 | id->eh_map = NULL; | |
2564 | } | |
2565 | ||
e27482aa | 2566 | return new_fndecl; |
2567 | } | |
2568 | ||
9845d120 | 2569 | /* Copy the debug STMT using ID. We deal with these statements in a |
2570 | special way: if any variable in their VALUE expression wasn't | |
2571 | remapped yet, we won't remap it, because that would get decl uids | |
2572 | out of sync, causing codegen differences between -g and -g0. If | |
2573 | this arises, we drop the VALUE expression altogether. */ | |
2574 | ||
2575 | static void | |
2576 | copy_debug_stmt (gimple stmt, copy_body_data *id) | |
2577 | { | |
2578 | tree t, *n; | |
2579 | struct walk_stmt_info wi; | |
2580 | ||
9845d120 | 2581 | if (gimple_block (stmt)) |
2582 | { | |
9845d120 | 2583 | n = (tree *) pointer_map_contains (id->decl_map, gimple_block (stmt)); |
688b0b5b | 2584 | gimple_set_block (stmt, n ? *n : id->block); |
9845d120 | 2585 | } |
9845d120 | 2586 | |
2587 | /* Remap all the operands in COPY. */ | |
2588 | memset (&wi, 0, sizeof (wi)); | |
2589 | wi.info = id; | |
2590 | ||
2591 | processing_debug_stmt = 1; | |
2592 | ||
841424cc | 2593 | if (gimple_debug_source_bind_p (stmt)) |
2594 | t = gimple_debug_source_bind_get_var (stmt); | |
2595 | else | |
2596 | t = gimple_debug_bind_get_var (stmt); | |
9845d120 | 2597 | |
2598 | if (TREE_CODE (t) == PARM_DECL && id->debug_map | |
2599 | && (n = (tree *) pointer_map_contains (id->debug_map, t))) | |
2600 | { | |
2601 | gcc_assert (TREE_CODE (*n) == VAR_DECL); | |
2602 | t = *n; | |
2603 | } | |
e0667160 | 2604 | else if (TREE_CODE (t) == VAR_DECL |
4ae5778c | 2605 | && !is_global_var (t) |
2606 | && !pointer_map_contains (id->decl_map, t)) | |
e0667160 | 2607 | /* T is a non-localized variable. */; |
9845d120 | 2608 | else |
2609 | walk_tree (&t, remap_gimple_op_r, &wi, NULL); | |
2610 | ||
841424cc | 2611 | if (gimple_debug_bind_p (stmt)) |
2612 | { | |
2613 | gimple_debug_bind_set_var (stmt, t); | |
9845d120 | 2614 | |
841424cc | 2615 | if (gimple_debug_bind_has_value_p (stmt)) |
2616 | walk_tree (gimple_debug_bind_get_value_ptr (stmt), | |
2617 | remap_gimple_op_r, &wi, NULL); | |
9845d120 | 2618 | |
841424cc | 2619 | /* Punt if any decl couldn't be remapped. */ |
2620 | if (processing_debug_stmt < 0) | |
2621 | gimple_debug_bind_reset_value (stmt); | |
2622 | } | |
2623 | else if (gimple_debug_source_bind_p (stmt)) | |
2624 | { | |
2625 | gimple_debug_source_bind_set_var (stmt, t); | |
2626 | walk_tree (gimple_debug_source_bind_get_value_ptr (stmt), | |
2627 | remap_gimple_op_r, &wi, NULL); | |
eee0ea7c | 2628 | /* When inlining and source bind refers to one of the optimized |
2629 | away parameters, change the source bind into normal debug bind | |
2630 | referring to the corresponding DEBUG_EXPR_DECL that should have | |
2631 | been bound before the call stmt. */ | |
2632 | t = gimple_debug_source_bind_get_value (stmt); | |
2633 | if (t != NULL_TREE | |
2634 | && TREE_CODE (t) == PARM_DECL | |
2635 | && id->gimple_call) | |
2636 | { | |
f1f41a6c | 2637 | vec<tree, va_gc> **debug_args = decl_debug_args_lookup (id->src_fn); |
eee0ea7c | 2638 | unsigned int i; |
2639 | if (debug_args != NULL) | |
2640 | { | |
f1f41a6c | 2641 | for (i = 0; i < vec_safe_length (*debug_args); i += 2) |
2642 | if ((**debug_args)[i] == DECL_ORIGIN (t) | |
2643 | && TREE_CODE ((**debug_args)[i + 1]) == DEBUG_EXPR_DECL) | |
eee0ea7c | 2644 | { |
f1f41a6c | 2645 | t = (**debug_args)[i + 1]; |
de6bd75e | 2646 | stmt->subcode = GIMPLE_DEBUG_BIND; |
eee0ea7c | 2647 | gimple_debug_bind_set_value (stmt, t); |
2648 | break; | |
2649 | } | |
2650 | } | |
2651 | } | |
841424cc | 2652 | } |
9845d120 | 2653 | |
2654 | processing_debug_stmt = 0; | |
2655 | ||
2656 | update_stmt (stmt); | |
9845d120 | 2657 | } |
2658 | ||
2659 | /* Process deferred debug stmts. In order to give values better odds | |
2660 | of being successfully remapped, we delay the processing of debug | |
2661 | stmts until all other stmts that might require remapping are | |
2662 | processed. */ | |
2663 | ||
2664 | static void | |
2665 | copy_debug_stmts (copy_body_data *id) | |
2666 | { | |
2667 | size_t i; | |
2668 | gimple stmt; | |
2669 | ||
f1f41a6c | 2670 | if (!id->debug_stmts.exists ()) |
9845d120 | 2671 | return; |
2672 | ||
f1f41a6c | 2673 | FOR_EACH_VEC_ELT (id->debug_stmts, i, stmt) |
9845d120 | 2674 | copy_debug_stmt (stmt, id); |
2675 | ||
f1f41a6c | 2676 | id->debug_stmts.release (); |
9845d120 | 2677 | } |
2678 | ||
4189e677 | 2679 | /* Make a copy of the body of SRC_FN so that it can be inserted inline in |
2680 | another function. */ | |
2681 | ||
2682 | static tree | |
2683 | copy_tree_body (copy_body_data *id) | |
2684 | { | |
2685 | tree fndecl = id->src_fn; | |
2686 | tree body = DECL_SAVED_TREE (fndecl); | |
2687 | ||
2688 | walk_tree (&body, copy_tree_body_r, id, NULL); | |
2689 | ||
2690 | return body; | |
2691 | } | |
2692 | ||
9845d120 | 2693 | /* Make a copy of the body of FN so that it can be inserted inline in |
2694 | another function. */ | |
2695 | ||
e27482aa | 2696 | static tree |
e2d3f422 | 2697 | copy_body (copy_body_data *id, gcov_type count, int frequency_scale, |
b06ab5fa | 2698 | basic_block entry_block_map, basic_block exit_block_map, |
84cb1020 | 2699 | basic_block new_entry) |
e27482aa | 2700 | { |
51a48c27 | 2701 | tree fndecl = id->src_fn; |
e27482aa | 2702 | tree body; |
2703 | ||
2704 | /* If this body has a CFG, walk CFG and copy. */ | |
34154e27 | 2705 | gcc_assert (ENTRY_BLOCK_PTR_FOR_FN (DECL_STRUCT_FUNCTION (fndecl))); |
b06ab5fa | 2706 | body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map, |
84cb1020 | 2707 | new_entry); |
9845d120 | 2708 | copy_debug_stmts (id); |
e27482aa | 2709 | |
2710 | return body; | |
2711 | } | |
2712 | ||
78a289a9 | 2713 | /* Return true if VALUE is an ADDR_EXPR of an automatic variable |
2714 | defined in function FN, or of a data member thereof. */ | |
2715 | ||
2716 | static bool | |
2717 | self_inlining_addr_expr (tree value, tree fn) | |
2718 | { | |
2719 | tree var; | |
2720 | ||
2721 | if (TREE_CODE (value) != ADDR_EXPR) | |
2722 | return false; | |
2723 | ||
2724 | var = get_base_address (TREE_OPERAND (value, 0)); | |
e27482aa | 2725 | |
2ef41604 | 2726 | return var && auto_var_in_fn_p (var, fn); |
78a289a9 | 2727 | } |
2728 | ||
9845d120 | 2729 | /* Append to BB a debug annotation that binds VAR to VALUE, inheriting |
2730 | lexical block and line number information from base_stmt, if given, | |
2731 | or from the last stmt of the block otherwise. */ | |
2732 | ||
2733 | static gimple | |
2734 | insert_init_debug_bind (copy_body_data *id, | |
2735 | basic_block bb, tree var, tree value, | |
2736 | gimple base_stmt) | |
2737 | { | |
2738 | gimple note; | |
2739 | gimple_stmt_iterator gsi; | |
2740 | tree tracked_var; | |
2741 | ||
2742 | if (!gimple_in_ssa_p (id->src_cfun)) | |
2743 | return NULL; | |
2744 | ||
2745 | if (!MAY_HAVE_DEBUG_STMTS) | |
2746 | return NULL; | |
2747 | ||
2748 | tracked_var = target_for_debug_bind (var); | |
2749 | if (!tracked_var) | |
2750 | return NULL; | |
2751 | ||
2752 | if (bb) | |
2753 | { | |
2754 | gsi = gsi_last_bb (bb); | |
2755 | if (!base_stmt && !gsi_end_p (gsi)) | |
2756 | base_stmt = gsi_stmt (gsi); | |
2757 | } | |
2758 | ||
2759 | note = gimple_build_debug_bind (tracked_var, value, base_stmt); | |
2760 | ||
2761 | if (bb) | |
2762 | { | |
2763 | if (!gsi_end_p (gsi)) | |
2764 | gsi_insert_after (&gsi, note, GSI_SAME_STMT); | |
2765 | else | |
2766 | gsi_insert_before (&gsi, note, GSI_SAME_STMT); | |
2767 | } | |
2768 | ||
2769 | return note; | |
2770 | } | |
2771 | ||
4ee9c684 | 2772 | static void |
9845d120 | 2773 | insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt) |
13e50f08 | 2774 | { |
13e50f08 | 2775 | /* If VAR represents a zero-sized variable, it's possible that the |
2776 | assignment statement may result in no gimple statements. */ | |
2777 | if (init_stmt) | |
b236ac0e | 2778 | { |
2779 | gimple_stmt_iterator si = gsi_last_bb (bb); | |
13e50f08 | 2780 | |
8d41b0dd | 2781 | /* We can end up with init statements that store to a non-register |
2782 | from a rhs with a conversion. Handle that here by forcing the | |
2783 | rhs into a temporary. gimple_regimplify_operands is not | |
2784 | prepared to do this for us. */ | |
9845d120 | 2785 | if (!is_gimple_debug (init_stmt) |
2786 | && !is_gimple_reg (gimple_assign_lhs (init_stmt)) | |
8d41b0dd | 2787 | && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt))) |
2788 | && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS) | |
2789 | { | |
2790 | tree rhs = build1 (gimple_assign_rhs_code (init_stmt), | |
2791 | gimple_expr_type (init_stmt), | |
2792 | gimple_assign_rhs1 (init_stmt)); | |
2793 | rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false, | |
2794 | GSI_NEW_STMT); | |
2795 | gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs)); | |
2796 | gimple_assign_set_rhs1 (init_stmt, rhs); | |
2797 | } | |
b236ac0e | 2798 | gsi_insert_after (&si, init_stmt, GSI_NEW_STMT); |
2799 | gimple_regimplify_operands (init_stmt, &si); | |
9845d120 | 2800 | |
2801 | if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS) | |
2802 | { | |
ec11736b | 2803 | tree def = gimple_assign_lhs (init_stmt); |
2804 | insert_init_debug_bind (id, bb, def, def, init_stmt); | |
9845d120 | 2805 | } |
b236ac0e | 2806 | } |
13e50f08 | 2807 | } |
2808 | ||
2809 | /* Initialize parameter P with VALUE. If needed, produce init statement | |
2810 | at the end of BB. When BB is NULL, we return init statement to be | |
2811 | output later. */ | |
2812 | static gimple | |
51a48c27 | 2813 | setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn, |
e27482aa | 2814 | basic_block bb, tree *vars) |
4ee9c684 | 2815 | { |
13e50f08 | 2816 | gimple init_stmt = NULL; |
4ee9c684 | 2817 | tree var; |
c8ca3ee7 | 2818 | tree rhs = value; |
deff5ffd | 2819 | tree def = (gimple_in_ssa_p (cfun) |
c6dfe037 | 2820 | ? ssa_default_def (id->src_cfun, p) : NULL); |
4ee9c684 | 2821 | |
c8ca3ee7 | 2822 | if (value |
2823 | && value != error_mark_node | |
2824 | && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value))) | |
62437c86 | 2825 | { |
6e383d62 | 2826 | /* If we can match up types by promotion/demotion do so. */ |
62437c86 | 2827 | if (fold_convertible_p (TREE_TYPE (p), value)) |
6e383d62 | 2828 | rhs = fold_convert (TREE_TYPE (p), value); |
62437c86 | 2829 | else |
6e383d62 | 2830 | { |
2831 | /* ??? For valid programs we should not end up here. | |
2832 | Still if we end up with truly mismatched types here, fall back | |
2833 | to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid | |
2834 | GIMPLE to the following passes. */ | |
2835 | if (!is_gimple_reg_type (TREE_TYPE (value)) | |
2836 | || TYPE_SIZE (TREE_TYPE (p)) == TYPE_SIZE (TREE_TYPE (value))) | |
2837 | rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value); | |
2838 | else | |
2839 | rhs = build_zero_cst (TREE_TYPE (p)); | |
2840 | } | |
62437c86 | 2841 | } |
c8ca3ee7 | 2842 | |
9845d120 | 2843 | /* Make an equivalent VAR_DECL. Note that we must NOT remap the type |
2844 | here since the type of this decl must be visible to the calling | |
2845 | function. */ | |
2846 | var = copy_decl_to_var (p, id); | |
2847 | ||
9845d120 | 2848 | /* Declare this new variable. */ |
1767a056 | 2849 | DECL_CHAIN (var) = *vars; |
9845d120 | 2850 | *vars = var; |
2851 | ||
2852 | /* Make gimplifier happy about this variable. */ | |
2853 | DECL_SEEN_IN_BIND_EXPR_P (var) = 1; | |
2854 | ||
deff5ffd | 2855 | /* If the parameter is never assigned to, has no SSA_NAMEs created, |
9845d120 | 2856 | we would not need to create a new variable here at all, if it |
2857 | weren't for debug info. Still, we can just use the argument | |
2858 | value. */ | |
4ee9c684 | 2859 | if (TREE_READONLY (p) |
2860 | && !TREE_ADDRESSABLE (p) | |
deff5ffd | 2861 | && value && !TREE_SIDE_EFFECTS (value) |
2862 | && !def) | |
4ee9c684 | 2863 | { |
11fe6c8b | 2864 | /* We may produce non-gimple trees by adding NOPs or introduce |
2865 | invalid sharing when operand is not really constant. | |
2866 | It is not big deal to prohibit constant propagation here as | |
2867 | we will constant propagate in DOM1 pass anyway. */ | |
2868 | if (is_gimple_min_invariant (value) | |
c8ca3ee7 | 2869 | && useless_type_conversion_p (TREE_TYPE (p), |
2870 | TREE_TYPE (value)) | |
78a289a9 | 2871 | /* We have to be very careful about ADDR_EXPR. Make sure |
2872 | the base variable isn't a local variable of the inlined | |
2873 | function, e.g., when doing recursive inlining, direct or | |
2874 | mutually-recursive or whatever, which is why we don't | |
2875 | just test whether fn == current_function_decl. */ | |
2876 | && ! self_inlining_addr_expr (value, fn)) | |
4ee9c684 | 2877 | { |
4ee9c684 | 2878 | insert_decl_map (id, p, value); |
9845d120 | 2879 | insert_debug_decl_map (id, p, var); |
2880 | return insert_init_debug_bind (id, bb, var, value, NULL); | |
4ee9c684 | 2881 | } |
2882 | } | |
2883 | ||
4ee9c684 | 2884 | /* Register the VAR_DECL as the equivalent for the PARM_DECL; |
2885 | that way, when the PARM_DECL is encountered, it will be | |
2886 | automatically replaced by the VAR_DECL. */ | |
9609c446 | 2887 | insert_decl_map (id, p, var); |
4ee9c684 | 2888 | |
4ee9c684 | 2889 | /* Even if P was TREE_READONLY, the new VAR should not be. |
2890 | In the original code, we would have constructed a | |
2891 | temporary, and then the function body would have never | |
2892 | changed the value of P. However, now, we will be | |
2893 | constructing VAR directly. The constructor body may | |
2894 | change its value multiple times as it is being | |
2895 | constructed. Therefore, it must not be TREE_READONLY; | |
2896 | the back-end assumes that TREE_READONLY variable is | |
2897 | assigned to only once. */ | |
2898 | if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p))) | |
2899 | TREE_READONLY (var) = 0; | |
2900 | ||
deff5ffd | 2901 | /* If there is no setup required and we are in SSA, take the easy route |
2902 | replacing all SSA names representing the function parameter by the | |
2903 | SSA name passed to function. | |
2904 | ||
2905 | We need to construct map for the variable anyway as it might be used | |
2906 | in different SSA names when parameter is set in function. | |
2907 | ||
928059d5 | 2908 | Do replacement at -O0 for const arguments replaced by constant. |
2909 | This is important for builtin_constant_p and other construct requiring | |
9845d120 | 2910 | constant argument to be visible in inlined function body. */ |
deff5ffd | 2911 | if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p) |
928059d5 | 2912 | && (optimize |
2913 | || (TREE_READONLY (p) | |
2914 | && is_gimple_min_invariant (rhs))) | |
deff5ffd | 2915 | && (TREE_CODE (rhs) == SSA_NAME |
35b8d56b | 2916 | || is_gimple_min_invariant (rhs)) |
2917 | && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def)) | |
deff5ffd | 2918 | { |
2919 | insert_decl_map (id, def, rhs); | |
9845d120 | 2920 | return insert_init_debug_bind (id, bb, var, rhs, NULL); |
deff5ffd | 2921 | } |
2922 | ||
5dc57610 | 2923 | /* If the value of argument is never used, don't care about initializing |
2924 | it. */ | |
12e12890 | 2925 | if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p)) |
5dc57610 | 2926 | { |
2927 | gcc_assert (!value || !TREE_SIDE_EFFECTS (value)); | |
9845d120 | 2928 | return insert_init_debug_bind (id, bb, var, rhs, NULL); |
5dc57610 | 2929 | } |
2930 | ||
4ee9c684 | 2931 | /* Initialize this VAR_DECL from the equivalent argument. Convert |
2932 | the argument to the proper type in case it was promoted. */ | |
2933 | if (value) | |
2934 | { | |
4ee9c684 | 2935 | if (rhs == error_mark_node) |
deff5ffd | 2936 | { |
9609c446 | 2937 | insert_decl_map (id, p, var); |
9845d120 | 2938 | return insert_init_debug_bind (id, bb, var, rhs, NULL); |
deff5ffd | 2939 | } |
51ab7e35 | 2940 | |
aee8cc15 | 2941 | STRIP_USELESS_TYPE_CONVERSION (rhs); |
4ee9c684 | 2942 | |
cbbd431d | 2943 | /* If we are in SSA form properly remap the default definition |
6084b64c | 2944 | or assign to a dummy SSA name if the parameter is unused and |
2945 | we are not optimizing. */ | |
cbbd431d | 2946 | if (gimple_in_ssa_p (cfun) && is_gimple_reg (p)) |
deff5ffd | 2947 | { |
cbbd431d | 2948 | if (def) |
2949 | { | |
2950 | def = remap_ssa_name (def, id); | |
2951 | init_stmt = gimple_build_assign (def, rhs); | |
2952 | SSA_NAME_IS_DEFAULT_DEF (def) = 0; | |
c6dfe037 | 2953 | set_ssa_default_def (cfun, var, NULL); |
cbbd431d | 2954 | } |
6084b64c | 2955 | else if (!optimize) |
2956 | { | |
2957 | def = make_ssa_name (var, NULL); | |
2958 | init_stmt = gimple_build_assign (def, rhs); | |
2959 | } | |
deff5ffd | 2960 | } |
2961 | else | |
75a70cf9 | 2962 | init_stmt = gimple_build_assign (var, rhs); |
4ee9c684 | 2963 | |
13e50f08 | 2964 | if (bb && init_stmt) |
9845d120 | 2965 | insert_init_stmt (id, bb, init_stmt); |
4ee9c684 | 2966 | } |
13e50f08 | 2967 | return init_stmt; |
4ee9c684 | 2968 | } |
2969 | ||
e343483a | 2970 | /* Generate code to initialize the parameters of the function at the |
75a70cf9 | 2971 | top of the stack in ID from the GIMPLE_CALL STMT. */ |
e343483a | 2972 | |
e27482aa | 2973 | static void |
75a70cf9 | 2974 | initialize_inlined_parameters (copy_body_data *id, gimple stmt, |
e27482aa | 2975 | tree fn, basic_block bb) |
e343483a | 2976 | { |
e343483a | 2977 | tree parms; |
75a70cf9 | 2978 | size_t i; |
e343483a | 2979 | tree p; |
d57cd35f | 2980 | tree vars = NULL_TREE; |
75a70cf9 | 2981 | tree static_chain = gimple_call_chain (stmt); |
e343483a | 2982 | |
2983 | /* Figure out what the parameters are. */ | |
b0cdf642 | 2984 | parms = DECL_ARGUMENTS (fn); |
e343483a | 2985 | |
e343483a | 2986 | /* Loop through the parameter declarations, replacing each with an |
2987 | equivalent VAR_DECL, appropriately initialized. */ | |
1767a056 | 2988 | for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++) |
75a70cf9 | 2989 | { |
2990 | tree val; | |
2991 | val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL; | |
2992 | setup_one_parameter (id, p, val, fn, bb, &vars); | |
2993 | } | |
2f25e4ca | 2994 | /* After remapping parameters remap their types. This has to be done |
2995 | in a second loop over all parameters to appropriately remap | |
2996 | variable sized arrays when the size is specified in a | |
2997 | parameter following the array. */ | |
1767a056 | 2998 | for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++) |
2f25e4ca | 2999 | { |
3000 | tree *varp = (tree *) pointer_map_contains (id->decl_map, p); | |
3001 | if (varp | |
3002 | && TREE_CODE (*varp) == VAR_DECL) | |
3003 | { | |
bc6af3fe | 3004 | tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p) |
c6dfe037 | 3005 | ? ssa_default_def (id->src_cfun, p) : NULL); |
bc6af3fe | 3006 | tree var = *varp; |
3007 | TREE_TYPE (var) = remap_type (TREE_TYPE (var), id); | |
2f25e4ca | 3008 | /* Also remap the default definition if it was remapped |
3009 | to the default definition of the parameter replacement | |
3010 | by the parameter setup. */ | |
bc6af3fe | 3011 | if (def) |
2f25e4ca | 3012 | { |
3013 | tree *defp = (tree *) pointer_map_contains (id->decl_map, def); | |
3014 | if (defp | |
3015 | && TREE_CODE (*defp) == SSA_NAME | |
bc6af3fe | 3016 | && SSA_NAME_VAR (*defp) == var) |
3017 | TREE_TYPE (*defp) = TREE_TYPE (var); | |
2f25e4ca | 3018 | } |
3019 | } | |
3020 | } | |
e619d7b1 | 3021 | |
4ee9c684 | 3022 | /* Initialize the static chain. */ |
3023 | p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl; | |
469679ab | 3024 | gcc_assert (fn != current_function_decl); |
4ee9c684 | 3025 | if (p) |
3026 | { | |
3027 | /* No static chain? Seems like a bug in tree-nested.c. */ | |
8c0963c4 | 3028 | gcc_assert (static_chain); |
e619d7b1 | 3029 | |
e27482aa | 3030 | setup_one_parameter (id, p, static_chain, fn, bb, &vars); |
e619d7b1 | 3031 | } |
3032 | ||
e27482aa | 3033 | declare_inline_vars (id->block, vars); |
e343483a | 3034 | } |
3035 | ||
75a70cf9 | 3036 | |
e27482aa | 3037 | /* Declare a return variable to replace the RESULT_DECL for the |
3038 | function we are calling. An appropriate DECL_STMT is returned. | |
3039 | The USE_STMT is filled to contain a use of the declaration to | |
3040 | indicate the return value of the function. | |
3041 | ||
deff5ffd | 3042 | RETURN_SLOT, if non-null is place where to store the result. It |
3043 | is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null, | |
75a70cf9 | 3044 | was the LHS of the MODIFY_EXPR to which this call is the RHS. |
8e7912a5 | 3045 | |
f018d957 | 3046 | The return value is a (possibly null) value that holds the result |
3047 | as seen by the caller. */ | |
e343483a | 3048 | |
d57cd35f | 3049 | static tree |
524a0531 | 3050 | declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest, |
3051 | basic_block entry_bb) | |
e343483a | 3052 | { |
51a48c27 | 3053 | tree callee = id->src_fn; |
8e7912a5 | 3054 | tree result = DECL_RESULT (callee); |
3055 | tree callee_type = TREE_TYPE (result); | |
c21cf15c | 3056 | tree caller_type; |
8e7912a5 | 3057 | tree var, use; |
e343483a | 3058 | |
c21cf15c | 3059 | /* Handle type-mismatches in the function declaration return type |
3060 | vs. the call expression. */ | |
3061 | if (modify_dest) | |
3062 | caller_type = TREE_TYPE (modify_dest); | |
3063 | else | |
3064 | caller_type = TREE_TYPE (TREE_TYPE (callee)); | |
3065 | ||
7a3ec978 | 3066 | /* We don't need to do anything for functions that don't return anything. */ |
3067 | if (VOID_TYPE_P (callee_type)) | |
f018d957 | 3068 | return NULL_TREE; |
e343483a | 3069 | |
806e4c12 | 3070 | /* If there was a return slot, then the return value is the |
8e7912a5 | 3071 | dereferenced address of that object. */ |
deff5ffd | 3072 | if (return_slot) |
8e7912a5 | 3073 | { |
deff5ffd | 3074 | /* The front end shouldn't have used both return_slot and |
8e7912a5 | 3075 | a modify expression. */ |
8c0963c4 | 3076 | gcc_assert (!modify_dest); |
806e4c12 | 3077 | if (DECL_BY_REFERENCE (result)) |
deff5ffd | 3078 | { |
3079 | tree return_slot_addr = build_fold_addr_expr (return_slot); | |
3080 | STRIP_USELESS_TYPE_CONVERSION (return_slot_addr); | |
3081 | ||
3082 | /* We are going to construct *&return_slot and we can't do that | |
48e1416a | 3083 | for variables believed to be not addressable. |
deff5ffd | 3084 | |
3085 | FIXME: This check possibly can match, because values returned | |
3086 | via return slot optimization are not believed to have address | |
3087 | taken by alias analysis. */ | |
3088 | gcc_assert (TREE_CODE (return_slot) != SSA_NAME); | |
deff5ffd | 3089 | var = return_slot_addr; |
3090 | } | |
806e4c12 | 3091 | else |
deff5ffd | 3092 | { |
3093 | var = return_slot; | |
3094 | gcc_assert (TREE_CODE (var) != SSA_NAME); | |
dfbb5324 | 3095 | TREE_ADDRESSABLE (var) |= TREE_ADDRESSABLE (result); |
deff5ffd | 3096 | } |
8ea8de24 | 3097 | if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE |
3098 | || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE) | |
3099 | && !DECL_GIMPLE_REG_P (result) | |
cd276752 | 3100 | && DECL_P (var)) |
8ea8de24 | 3101 | DECL_GIMPLE_REG_P (var) = 0; |
8e7912a5 | 3102 | use = NULL; |
3103 | goto done; | |
3104 | } | |
3105 | ||
3106 | /* All types requiring non-trivial constructors should have been handled. */ | |
8c0963c4 | 3107 | gcc_assert (!TREE_ADDRESSABLE (callee_type)); |
8e7912a5 | 3108 | |
3109 | /* Attempt to avoid creating a new temporary variable. */ | |
deff5ffd | 3110 | if (modify_dest |
3111 | && TREE_CODE (modify_dest) != SSA_NAME) | |
8e7912a5 | 3112 | { |
3113 | bool use_it = false; | |
3114 | ||
3115 | /* We can't use MODIFY_DEST if there's type promotion involved. */ | |
c8ca3ee7 | 3116 | if (!useless_type_conversion_p (callee_type, caller_type)) |
8e7912a5 | 3117 | use_it = false; |
3118 | ||
3119 | /* ??? If we're assigning to a variable sized type, then we must | |
3120 | reuse the destination variable, because we've no good way to | |
3121 | create variable sized temporaries at this point. */ | |
3122 | else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST) | |
3123 | use_it = true; | |
3124 | ||
3125 | /* If the callee cannot possibly modify MODIFY_DEST, then we can | |
3126 | reuse it as the result of the call directly. Don't do this if | |
3127 | it would promote MODIFY_DEST to addressable. */ | |
560613ae | 3128 | else if (TREE_ADDRESSABLE (result)) |
3129 | use_it = false; | |
3130 | else | |
3131 | { | |
3132 | tree base_m = get_base_address (modify_dest); | |
3133 | ||
3134 | /* If the base isn't a decl, then it's a pointer, and we don't | |
3135 | know where that's going to go. */ | |
3136 | if (!DECL_P (base_m)) | |
3137 | use_it = false; | |
3138 | else if (is_global_var (base_m)) | |
3139 | use_it = false; | |
8ea8de24 | 3140 | else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE |
3141 | || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE) | |
3142 | && !DECL_GIMPLE_REG_P (result) | |
3143 | && DECL_GIMPLE_REG_P (base_m)) | |
3808a9ff | 3144 | use_it = false; |
560613ae | 3145 | else if (!TREE_ADDRESSABLE (base_m)) |
3146 | use_it = true; | |
3147 | } | |
8e7912a5 | 3148 | |
3149 | if (use_it) | |
3150 | { | |
3151 | var = modify_dest; | |
3152 | use = NULL; | |
3153 | goto done; | |
3154 | } | |
3155 | } | |
3156 | ||
8c0963c4 | 3157 | gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST); |
8e7912a5 | 3158 | |
25b3017b | 3159 | var = copy_result_decl_to_var (result, id); |
8e7912a5 | 3160 | DECL_SEEN_IN_BIND_EXPR_P (var) = 1; |
8e7912a5 | 3161 | |
4ee9c684 | 3162 | /* Do not have the rest of GCC warn about this variable as it should |
dac49aa5 | 3163 | not be visible to the user. */ |
4ee9c684 | 3164 | TREE_NO_WARNING (var) = 1; |
e343483a | 3165 | |
25b3017b | 3166 | declare_inline_vars (id->block, var); |
3167 | ||
8e7912a5 | 3168 | /* Build the use expr. If the return type of the function was |
3169 | promoted, convert it back to the expected type. */ | |
3170 | use = var; | |
c8ca3ee7 | 3171 | if (!useless_type_conversion_p (caller_type, TREE_TYPE (var))) |
6e383d62 | 3172 | { |
3173 | /* If we can match up types by promotion/demotion do so. */ | |
3174 | if (fold_convertible_p (caller_type, var)) | |
3175 | use = fold_convert (caller_type, var); | |
3176 | else | |
3177 | { | |
3178 | /* ??? For valid programs we should not end up here. | |
3179 | Still if we end up with truly mismatched types here, fall back | |
3180 | to using a MEM_REF to not leak invalid GIMPLE to the following | |
3181 | passes. */ | |
3182 | /* Prevent var from being written into SSA form. */ | |
3183 | if (TREE_CODE (TREE_TYPE (var)) == VECTOR_TYPE | |
3184 | || TREE_CODE (TREE_TYPE (var)) == COMPLEX_TYPE) | |
3185 | DECL_GIMPLE_REG_P (var) = false; | |
3186 | else if (is_gimple_reg_type (TREE_TYPE (var))) | |
3187 | TREE_ADDRESSABLE (var) = true; | |
3188 | use = fold_build2 (MEM_REF, caller_type, | |
3189 | build_fold_addr_expr (var), | |
3190 | build_int_cst (ptr_type_node, 0)); | |
3191 | } | |
3192 | } | |
48e1416a | 3193 | |
aee8cc15 | 3194 | STRIP_USELESS_TYPE_CONVERSION (use); |
8e7912a5 | 3195 | |
25b3017b | 3196 | if (DECL_BY_REFERENCE (result)) |
8ad54c54 | 3197 | { |
3198 | TREE_ADDRESSABLE (var) = 1; | |
3199 | var = build_fold_addr_expr (var); | |
3200 | } | |
25b3017b | 3201 | |
8e7912a5 | 3202 | done: |
e343483a | 3203 | /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that |
3204 | way, when the RESULT_DECL is encountered, it will be | |
524a0531 | 3205 | automatically replaced by the VAR_DECL. |
3206 | ||
3207 | When returning by reference, ensure that RESULT_DECL remaps to | |
3208 | gimple_val. */ | |
3209 | if (DECL_BY_REFERENCE (result) | |
3210 | && !is_gimple_val (var)) | |
3211 | { | |
3212 | tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr"); | |
3213 | insert_decl_map (id, result, temp); | |
cbbd431d | 3214 | /* When RESULT_DECL is in SSA form, we need to remap and initialize |
3215 | it's default_def SSA_NAME. */ | |
3216 | if (gimple_in_ssa_p (id->src_cfun) | |
3217 | && is_gimple_reg (result)) | |
3218 | { | |
3219 | temp = make_ssa_name (temp, NULL); | |
c6dfe037 | 3220 | insert_decl_map (id, ssa_default_def (id->src_cfun, result), temp); |
cbbd431d | 3221 | } |
524a0531 | 3222 | insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var)); |
3223 | } | |
3224 | else | |
3225 | insert_decl_map (id, result, var); | |
e343483a | 3226 | |
4ee9c684 | 3227 | /* Remember this so we can ignore it in remap_decls. */ |
3228 | id->retvar = var; | |
3229 | ||
f018d957 | 3230 | return use; |
e343483a | 3231 | } |
3232 | ||
d747fdfb | 3233 | /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference |
3234 | to a local label. */ | |
e619d7b1 | 3235 | |
d747fdfb | 3236 | static tree |
3237 | has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp) | |
e619d7b1 | 3238 | { |
d747fdfb | 3239 | tree node = *nodep; |
3240 | tree fn = (tree) fnp; | |
75a70cf9 | 3241 | |
d747fdfb | 3242 | if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn) |
3243 | return node; | |
3244 | ||
3245 | if (TYPE_P (node)) | |
3246 | *walk_subtrees = 0; | |
3247 | ||
3248 | return NULL_TREE; | |
3249 | } | |
75a70cf9 | 3250 | |
d747fdfb | 3251 | /* Determine if the function can be copied. If so return NULL. If |
3252 | not return a string describng the reason for failure. */ | |
3253 | ||
3254 | static const char * | |
3255 | copy_forbidden (struct function *fun, tree fndecl) | |
3256 | { | |
3257 | const char *reason = fun->cannot_be_copied_reason; | |
2ab2ce89 | 3258 | tree decl; |
3259 | unsigned ix; | |
d747fdfb | 3260 | |
3261 | /* Only examine the function once. */ | |
3262 | if (fun->cannot_be_copied_set) | |
3263 | return reason; | |
3264 | ||
3265 | /* We cannot copy a function that receives a non-local goto | |
3266 | because we cannot remap the destination label used in the | |
3267 | function that is performing the non-local goto. */ | |
3268 | /* ??? Actually, this should be possible, if we work at it. | |
3269 | No doubt there's just a handful of places that simply | |
3270 | assume it doesn't happen and don't substitute properly. */ | |
3271 | if (fun->has_nonlocal_label) | |
3272 | { | |
3273 | reason = G_("function %q+F can never be copied " | |
3274 | "because it receives a non-local goto"); | |
3275 | goto fail; | |
3276 | } | |
3277 | ||
2ab2ce89 | 3278 | FOR_EACH_LOCAL_DECL (fun, ix, decl) |
3279 | if (TREE_CODE (decl) == VAR_DECL | |
3280 | && TREE_STATIC (decl) | |
3281 | && !DECL_EXTERNAL (decl) | |
3282 | && DECL_INITIAL (decl) | |
3283 | && walk_tree_without_duplicates (&DECL_INITIAL (decl), | |
3284 | has_label_address_in_static_1, | |
3285 | fndecl)) | |
3286 | { | |
3287 | reason = G_("function %q+F can never be copied because it saves " | |
3288 | "address of local label in a static variable"); | |
3289 | goto fail; | |
3290 | } | |
d747fdfb | 3291 | |
3292 | fail: | |
3293 | fun->cannot_be_copied_reason = reason; | |
3294 | fun->cannot_be_copied_set = true; | |
3295 | return reason; | |
3296 | } | |
3297 | ||
3298 | ||
3299 | static const char *inline_forbidden_reason; | |
3300 | ||
3301 | /* A callback for walk_gimple_seq to handle statements. Returns non-null | |
3302 | iff a function can not be inlined. Also sets the reason why. */ | |
9a7ecb49 | 3303 | |
9a7ecb49 | 3304 | static tree |
75a70cf9 | 3305 | inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p, |
3306 | struct walk_stmt_info *wip) | |
9a7ecb49 | 3307 | { |
75a70cf9 | 3308 | tree fn = (tree) wip->info; |
bc597501 | 3309 | tree t; |
75a70cf9 | 3310 | gimple stmt = gsi_stmt (*gsi); |
9a7ecb49 | 3311 | |
75a70cf9 | 3312 | switch (gimple_code (stmt)) |
bc597501 | 3313 | { |
75a70cf9 | 3314 | case GIMPLE_CALL: |
1f2706b2 | 3315 | /* Refuse to inline alloca call unless user explicitly forced so as |
3316 | this may change program's memory overhead drastically when the | |
3317 | function using alloca is called in loop. In GCC present in | |
3318 | SPEC2000 inlining into schedule_block cause it to require 2GB of | |
a882d754 | 3319 | RAM instead of 256MB. Don't do so for alloca calls emitted for |
3320 | VLA objects as those can't cause unbounded growth (they're always | |
3321 | wrapped inside stack_save/stack_restore regions. */ | |
75a70cf9 | 3322 | if (gimple_alloca_call_p (stmt) |
a882d754 | 3323 | && !gimple_call_alloca_for_var_p (stmt) |
bc597501 | 3324 | && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))) |
3325 | { | |
9bc3739f | 3326 | inline_forbidden_reason |
3cf8b391 | 3327 | = G_("function %q+F can never be inlined because it uses " |
9bc3739f | 3328 | "alloca (override using the always_inline attribute)"); |
75a70cf9 | 3329 | *handled_ops_p = true; |
3330 | return fn; | |
bc597501 | 3331 | } |
75a70cf9 | 3332 | |
3333 | t = gimple_call_fndecl (stmt); | |
3334 | if (t == NULL_TREE) | |
bc597501 | 3335 | break; |
cb9d4058 | 3336 | |
bc597501 | 3337 | /* We cannot inline functions that call setjmp. */ |
3338 | if (setjmp_call_p (t)) | |
3339 | { | |
9bc3739f | 3340 | inline_forbidden_reason |
3cf8b391 | 3341 | = G_("function %q+F can never be inlined because it uses setjmp"); |
75a70cf9 | 3342 | *handled_ops_p = true; |
3343 | return t; | |
bc597501 | 3344 | } |
3345 | ||
4ee9c684 | 3346 | if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL) |
1f2706b2 | 3347 | switch (DECL_FUNCTION_CODE (t)) |
bc597501 | 3348 | { |
1f2706b2 | 3349 | /* We cannot inline functions that take a variable number of |
3350 | arguments. */ | |
3351 | case BUILT_IN_VA_START: | |
1f2706b2 | 3352 | case BUILT_IN_NEXT_ARG: |
3353 | case BUILT_IN_VA_END: | |
4ee9c684 | 3354 | inline_forbidden_reason |
3cf8b391 | 3355 | = G_("function %q+F can never be inlined because it " |
4ee9c684 | 3356 | "uses variable argument lists"); |
75a70cf9 | 3357 | *handled_ops_p = true; |
3358 | return t; | |
4ee9c684 | 3359 | |
1f2706b2 | 3360 | case BUILT_IN_LONGJMP: |
4ee9c684 | 3361 | /* We can't inline functions that call __builtin_longjmp at |
3362 | all. The non-local goto machinery really requires the | |
3363 | destination be in a different function. If we allow the | |
3364 | function calling __builtin_longjmp to be inlined into the | |
3365 | function calling __builtin_setjmp, Things will Go Awry. */ | |
3366 | inline_forbidden_reason | |
3cf8b391 | 3367 | = G_("function %q+F can never be inlined because " |
4ee9c684 | 3368 | "it uses setjmp-longjmp exception handling"); |
75a70cf9 | 3369 | *handled_ops_p = true; |
3370 | return t; | |
4ee9c684 | 3371 | |
3372 | case BUILT_IN_NONLOCAL_GOTO: | |
3373 | /* Similarly. */ | |
3374 | inline_forbidden_reason | |
3cf8b391 | 3375 | = G_("function %q+F can never be inlined because " |
4ee9c684 | 3376 | "it uses non-local goto"); |
75a70cf9 | 3377 | *handled_ops_p = true; |
3378 | return t; | |
bc597501 | 3379 | |
65061660 | 3380 | case BUILT_IN_RETURN: |
3381 | case BUILT_IN_APPLY_ARGS: | |
3382 | /* If a __builtin_apply_args caller would be inlined, | |
3383 | it would be saving arguments of the function it has | |
3384 | been inlined into. Similarly __builtin_return would | |
3385 | return from the function the inline has been inlined into. */ | |
3386 | inline_forbidden_reason | |
3cf8b391 | 3387 | = G_("function %q+F can never be inlined because " |
65061660 | 3388 | "it uses __builtin_return or __builtin_apply_args"); |
75a70cf9 | 3389 | *handled_ops_p = true; |
3390 | return t; | |
65061660 | 3391 | |
1f2706b2 | 3392 | default: |
3393 | break; | |
3394 | } | |
bc597501 | 3395 | break; |
3396 | ||
75a70cf9 | 3397 | case GIMPLE_GOTO: |
3398 | t = gimple_goto_dest (stmt); | |
bc597501 | 3399 | |
3400 | /* We will not inline a function which uses computed goto. The | |
3401 | addresses of its local labels, which may be tucked into | |
3402 | global storage, are of course not constant across | |
3403 | instantiations, which causes unexpected behavior. */ | |
3404 | if (TREE_CODE (t) != LABEL_DECL) | |
3405 | { | |
9bc3739f | 3406 | inline_forbidden_reason |
3cf8b391 | 3407 | = G_("function %q+F can never be inlined " |
9bc3739f | 3408 | "because it contains a computed goto"); |
75a70cf9 | 3409 | *handled_ops_p = true; |
3410 | return t; | |
bc597501 | 3411 | } |
4ee9c684 | 3412 | break; |
bc597501 | 3413 | |
bc597501 | 3414 | default: |
3415 | break; | |
3416 | } | |
3417 | ||
75a70cf9 | 3418 | *handled_ops_p = false; |
bc597501 | 3419 | return NULL_TREE; |
cb9d4058 | 3420 | } |
3421 | ||
75a70cf9 | 3422 | /* Return true if FNDECL is a function that cannot be inlined into |
3423 | another one. */ | |
3424 | ||
3425 | static bool | |
bc597501 | 3426 | inline_forbidden_p (tree fndecl) |
cb9d4058 | 3427 | { |
361c9aad | 3428 | struct function *fun = DECL_STRUCT_FUNCTION (fndecl); |
75a70cf9 | 3429 | struct walk_stmt_info wi; |
3430 | struct pointer_set_t *visited_nodes; | |
3431 | basic_block bb; | |
3432 | bool forbidden_p = false; | |
3433 | ||
d747fdfb | 3434 | /* First check for shared reasons not to copy the code. */ |
3435 | inline_forbidden_reason = copy_forbidden (fun, fndecl); | |
3436 | if (inline_forbidden_reason != NULL) | |
3437 | return true; | |
3438 | ||
3439 | /* Next, walk the statements of the function looking for | |
3440 | constraucts we can't handle, or are non-optimal for inlining. */ | |
75a70cf9 | 3441 | visited_nodes = pointer_set_create (); |
3442 | memset (&wi, 0, sizeof (wi)); | |
3443 | wi.info = (void *) fndecl; | |
3444 | wi.pset = visited_nodes; | |
e27482aa | 3445 | |
361c9aad | 3446 | FOR_EACH_BB_FN (bb, fun) |
75a70cf9 | 3447 | { |
3448 | gimple ret; | |
3449 | gimple_seq seq = bb_seq (bb); | |
d747fdfb | 3450 | ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi); |
75a70cf9 | 3451 | forbidden_p = (ret != NULL); |
3452 | if (forbidden_p) | |
d747fdfb | 3453 | break; |
361c9aad | 3454 | } |
3455 | ||
75a70cf9 | 3456 | pointer_set_destroy (visited_nodes); |
75a70cf9 | 3457 | return forbidden_p; |
cb9d4058 | 3458 | } |
ea1760a3 | 3459 | \f |
3460 | /* Return false if the function FNDECL cannot be inlined on account of its | |
3461 | attributes, true otherwise. */ | |
3462 | static bool | |
3463 | function_attribute_inlinable_p (const_tree fndecl) | |
3464 | { | |
3465 | if (targetm.attribute_table) | |
3466 | { | |
3467 | const_tree a; | |
3468 | ||
3469 | for (a = DECL_ATTRIBUTES (fndecl); a; a = TREE_CHAIN (a)) | |
3470 | { | |
3471 | const_tree name = TREE_PURPOSE (a); | |
3472 | int i; | |
3473 | ||
3474 | for (i = 0; targetm.attribute_table[i].name != NULL; i++) | |
3475 | if (is_attribute_p (targetm.attribute_table[i].name, name)) | |
3476 | return targetm.function_attribute_inlinable_p (fndecl); | |
3477 | } | |
3478 | } | |
3479 | ||
3480 | return true; | |
3481 | } | |
cb9d4058 | 3482 | |
746149b7 | 3483 | /* Returns nonzero if FN is a function that does not have any |
3484 | fundamental inline blocking properties. */ | |
e343483a | 3485 | |
d747fdfb | 3486 | bool |
3487 | tree_inlinable_function_p (tree fn) | |
e343483a | 3488 | { |
746149b7 | 3489 | bool inlinable = true; |
7cc6d7a8 | 3490 | bool do_warning; |
3491 | tree always_inline; | |
e343483a | 3492 | |
3493 | /* If we've already decided this function shouldn't be inlined, | |
3494 | there's no need to check again. */ | |
3495 | if (DECL_UNINLINABLE (fn)) | |
746149b7 | 3496 | return false; |
e343483a | 3497 | |
7cc6d7a8 | 3498 | /* We only warn for functions declared `inline' by the user. */ |
3499 | do_warning = (warn_inline | |
7cc6d7a8 | 3500 | && DECL_DECLARED_INLINE_P (fn) |
73b5e722 | 3501 | && !DECL_NO_INLINE_WARNING_P (fn) |
7cc6d7a8 | 3502 | && !DECL_IN_SYSTEM_HEADER (fn)); |
3503 | ||
3504 | always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)); | |
3505 | ||
1c2f0012 | 3506 | if (flag_no_inline |
7cc6d7a8 | 3507 | && always_inline == NULL) |
3508 | { | |
3509 | if (do_warning) | |
3510 | warning (OPT_Winline, "function %q+F can never be inlined because it " | |
3511 | "is suppressed using -fno-inline", fn); | |
3512 | inlinable = false; | |
3513 | } | |
3514 | ||
7cc6d7a8 | 3515 | else if (!function_attribute_inlinable_p (fn)) |
3516 | { | |
3517 | if (do_warning) | |
3518 | warning (OPT_Winline, "function %q+F can never be inlined because it " | |
3519 | "uses attributes conflicting with inlining", fn); | |
3520 | inlinable = false; | |
3521 | } | |
60b8c5b3 | 3522 | |
bc597501 | 3523 | else if (inline_forbidden_p (fn)) |
746149b7 | 3524 | { |
3525 | /* See if we should warn about uninlinable functions. Previously, | |
3526 | some of these warnings would be issued while trying to expand | |
3527 | the function inline, but that would cause multiple warnings | |
3528 | about functions that would for example call alloca. But since | |
3529 | this a property of the function, just one warning is enough. | |
3530 | As a bonus we can now give more details about the reason why a | |
7cc6d7a8 | 3531 | function is not inlinable. */ |
3532 | if (always_inline) | |
a522e9eb | 3533 | error (inline_forbidden_reason, fn); |
d731003e | 3534 | else if (do_warning) |
b0ff69b1 | 3535 | warning (OPT_Winline, inline_forbidden_reason, fn); |
746149b7 | 3536 | |
3537 | inlinable = false; | |
3538 | } | |
e343483a | 3539 | |
3540 | /* Squirrel away the result so that we don't have to check again. */ | |
746149b7 | 3541 | DECL_UNINLINABLE (fn) = !inlinable; |
e343483a | 3542 | |
746149b7 | 3543 | return inlinable; |
3544 | } | |
3545 | ||
bc7a14a6 | 3546 | /* Estimate the cost of a memory move. Use machine dependent |
3547 | word size and take possible memcpy call into account. */ | |
3548 | ||
3549 | int | |
3550 | estimate_move_cost (tree type) | |
3551 | { | |
3552 | HOST_WIDE_INT size; | |
3553 | ||
31359ae8 | 3554 | gcc_assert (!VOID_TYPE_P (type)); |
3555 | ||
a97439f9 | 3556 | if (TREE_CODE (type) == VECTOR_TYPE) |
3557 | { | |
3558 | enum machine_mode inner = TYPE_MODE (TREE_TYPE (type)); | |
3559 | enum machine_mode simd | |
3560 | = targetm.vectorize.preferred_simd_mode (inner); | |
3561 | int simd_mode_size = GET_MODE_SIZE (simd); | |
3562 | return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1) | |
3563 | / simd_mode_size); | |
3564 | } | |
3565 | ||
bc7a14a6 | 3566 | size = int_size_in_bytes (type); |
3567 | ||
f5733e7c | 3568 | if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (!optimize_size)) |
bc7a14a6 | 3569 | /* Cost of a memcpy call, 3 arguments and the call. */ |
3570 | return 4; | |
3571 | else | |
3572 | return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES); | |
3573 | } | |
3574 | ||
75a70cf9 | 3575 | /* Returns cost of operation CODE, according to WEIGHTS */ |
bc8bb825 | 3576 | |
75a70cf9 | 3577 | static int |
94e6e359 | 3578 | estimate_operator_cost (enum tree_code code, eni_weights *weights, |
3579 | tree op1 ATTRIBUTE_UNUSED, tree op2) | |
4ee9c684 | 3580 | { |
75a70cf9 | 3581 | switch (code) |
4ee9c684 | 3582 | { |
75a70cf9 | 3583 | /* These are "free" conversions, or their presumed cost |
3584 | is folded into other operations. */ | |
51984d2b | 3585 | case RANGE_EXPR: |
d9659041 | 3586 | CASE_CONVERT: |
75a70cf9 | 3587 | case COMPLEX_EXPR: |
3588 | case PAREN_EXPR: | |
a790c42a | 3589 | case VIEW_CONVERT_EXPR: |
75a70cf9 | 3590 | return 0; |
4ee9c684 | 3591 | |
bc7a14a6 | 3592 | /* Assign cost of 1 to usual operations. |
3593 | ??? We may consider mapping RTL costs to this. */ | |
4ee9c684 | 3594 | case COND_EXPR: |
dcfca6f8 | 3595 | case VEC_COND_EXPR: |
f4803722 | 3596 | case VEC_PERM_EXPR: |
4ee9c684 | 3597 | |
3598 | case PLUS_EXPR: | |
0de36bdb | 3599 | case POINTER_PLUS_EXPR: |
4ee9c684 | 3600 | case MINUS_EXPR: |
3601 | case MULT_EXPR: | |
96504875 | 3602 | case MULT_HIGHPART_EXPR: |
b9be572e | 3603 | case FMA_EXPR: |
4ee9c684 | 3604 | |
bd1a81f7 | 3605 | case ADDR_SPACE_CONVERT_EXPR: |
06f0b99c | 3606 | case FIXED_CONVERT_EXPR: |
4ee9c684 | 3607 | case FIX_TRUNC_EXPR: |
4ee9c684 | 3608 | |
3609 | case NEGATE_EXPR: | |
3610 | case FLOAT_EXPR: | |
3611 | case MIN_EXPR: | |
3612 | case MAX_EXPR: | |
3613 | case ABS_EXPR: | |
3614 | ||
3615 | case LSHIFT_EXPR: | |
3616 | case RSHIFT_EXPR: | |
3617 | case LROTATE_EXPR: | |
3618 | case RROTATE_EXPR: | |
925c62d4 | 3619 | case VEC_LSHIFT_EXPR: |
3620 | case VEC_RSHIFT_EXPR: | |
4ee9c684 | 3621 | |
3622 | case BIT_IOR_EXPR: | |
3623 | case BIT_XOR_EXPR: | |
3624 | case BIT_AND_EXPR: | |
3625 | case BIT_NOT_EXPR: | |
3626 | ||
3627 | case TRUTH_ANDIF_EXPR: | |
3628 | case TRUTH_ORIF_EXPR: | |
3629 | case TRUTH_AND_EXPR: | |
3630 | case TRUTH_OR_EXPR: | |
3631 | case TRUTH_XOR_EXPR: | |
3632 | case TRUTH_NOT_EXPR: | |
3633 | ||
3634 | case LT_EXPR: | |
3635 | case LE_EXPR: | |
3636 | case GT_EXPR: | |
3637 | case GE_EXPR: | |
3638 | case EQ_EXPR: | |
3639 | case NE_EXPR: | |
3640 | case ORDERED_EXPR: | |
3641 | case UNORDERED_EXPR: | |
3642 | ||
3643 | case UNLT_EXPR: | |
3644 | case UNLE_EXPR: | |
3645 | case UNGT_EXPR: | |
3646 | case UNGE_EXPR: | |
3647 | case UNEQ_EXPR: | |
318a728f | 3648 | case LTGT_EXPR: |
4ee9c684 | 3649 | |
4ee9c684 | 3650 | case CONJ_EXPR: |
3651 | ||
3652 | case PREDECREMENT_EXPR: | |
3653 | case PREINCREMENT_EXPR: | |
3654 | case POSTDECREMENT_EXPR: | |
3655 | case POSTINCREMENT_EXPR: | |
3656 | ||
a0e79db9 | 3657 | case REALIGN_LOAD_EXPR: |
3658 | ||
ea8f3370 | 3659 | case REDUC_MAX_EXPR: |
3660 | case REDUC_MIN_EXPR: | |
3661 | case REDUC_PLUS_EXPR: | |
4a61a337 | 3662 | case WIDEN_SUM_EXPR: |
75a70cf9 | 3663 | case WIDEN_MULT_EXPR: |
3664 | case DOT_PROD_EXPR: | |
00f4f705 | 3665 | case WIDEN_MULT_PLUS_EXPR: |
3666 | case WIDEN_MULT_MINUS_EXPR: | |
6083c152 | 3667 | case WIDEN_LSHIFT_EXPR: |
75a70cf9 | 3668 | |
c6c91d61 | 3669 | case VEC_WIDEN_MULT_HI_EXPR: |
3670 | case VEC_WIDEN_MULT_LO_EXPR: | |
79a78f7f | 3671 | case VEC_WIDEN_MULT_EVEN_EXPR: |
3672 | case VEC_WIDEN_MULT_ODD_EXPR: | |
c6c91d61 | 3673 | case VEC_UNPACK_HI_EXPR: |
3674 | case VEC_UNPACK_LO_EXPR: | |
8aa4e142 | 3675 | case VEC_UNPACK_FLOAT_HI_EXPR: |
3676 | case VEC_UNPACK_FLOAT_LO_EXPR: | |
bb8107e7 | 3677 | case VEC_PACK_TRUNC_EXPR: |
c6c91d61 | 3678 | case VEC_PACK_SAT_EXPR: |
8aa4e142 | 3679 | case VEC_PACK_FIX_TRUNC_EXPR: |
6083c152 | 3680 | case VEC_WIDEN_LSHIFT_HI_EXPR: |
3681 | case VEC_WIDEN_LSHIFT_LO_EXPR: | |
6b8dbb53 | 3682 | |
75a70cf9 | 3683 | return 1; |
4ee9c684 | 3684 | |
365db11e | 3685 | /* Few special cases of expensive operations. This is useful |
4ee9c684 | 3686 | to avoid inlining on functions having too many of these. */ |
3687 | case TRUNC_DIV_EXPR: | |
3688 | case CEIL_DIV_EXPR: | |
3689 | case FLOOR_DIV_EXPR: | |
3690 | case ROUND_DIV_EXPR: | |
3691 | case EXACT_DIV_EXPR: | |
3692 | case TRUNC_MOD_EXPR: | |
3693 | case CEIL_MOD_EXPR: | |
3694 | case FLOOR_MOD_EXPR: | |
3695 | case ROUND_MOD_EXPR: | |
3696 | case RDIV_EXPR: | |
94e6e359 | 3697 | if (TREE_CODE (op2) != INTEGER_CST) |
3698 | return weights->div_mod_cost; | |
3699 | return 1; | |
75a70cf9 | 3700 | |
3701 | default: | |
3702 | /* We expect a copy assignment with no operator. */ | |
3703 | gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS); | |
3704 | return 0; | |
3705 | } | |
3706 | } | |
3707 | ||
3708 | ||
3709 | /* Estimate number of instructions that will be created by expanding | |
3710 | the statements in the statement sequence STMTS. | |
3711 | WEIGHTS contains weights attributed to various constructs. */ | |
3712 | ||
3713 | static | |
3714 | int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights) | |
3715 | { | |
3716 | int cost; | |
3717 | gimple_stmt_iterator gsi; | |
3718 | ||
3719 | cost = 0; | |
3720 | for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi)) | |
3721 | cost += estimate_num_insns (gsi_stmt (gsi), weights); | |
3722 | ||
3723 | return cost; | |
3724 | } | |
3725 | ||
3726 | ||
3727 | /* Estimate number of instructions that will be created by expanding STMT. | |
3728 | WEIGHTS contains weights attributed to various constructs. */ | |
3729 | ||
3730 | int | |
3731 | estimate_num_insns (gimple stmt, eni_weights *weights) | |
3732 | { | |
3733 | unsigned cost, i; | |
3734 | enum gimple_code code = gimple_code (stmt); | |
3735 | tree lhs; | |
94e6e359 | 3736 | tree rhs; |
75a70cf9 | 3737 | |
3738 | switch (code) | |
3739 | { | |
3740 | case GIMPLE_ASSIGN: | |
3741 | /* Try to estimate the cost of assignments. We have three cases to | |
3742 | deal with: | |
3743 | 1) Simple assignments to registers; | |
3744 | 2) Stores to things that must live in memory. This includes | |
3745 | "normal" stores to scalars, but also assignments of large | |
3746 | structures, or constructors of big arrays; | |
3747 | ||
3748 | Let us look at the first two cases, assuming we have "a = b + C": | |
3749 | <GIMPLE_ASSIGN <var_decl "a"> | |
3750 | <plus_expr <var_decl "b"> <constant C>> | |
3751 | If "a" is a GIMPLE register, the assignment to it is free on almost | |
3752 | any target, because "a" usually ends up in a real register. Hence | |
3753 | the only cost of this expression comes from the PLUS_EXPR, and we | |
3754 | can ignore the GIMPLE_ASSIGN. | |
3755 | If "a" is not a GIMPLE register, the assignment to "a" will most | |
3756 | likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost | |
3757 | of moving something into "a", which we compute using the function | |
3758 | estimate_move_cost. */ | |
83480f35 | 3759 | if (gimple_clobber_p (stmt)) |
3760 | return 0; /* ={v} {CLOBBER} stmt expands to nothing. */ | |
3761 | ||
75a70cf9 | 3762 | lhs = gimple_assign_lhs (stmt); |
94e6e359 | 3763 | rhs = gimple_assign_rhs1 (stmt); |
3764 | ||
58b83435 | 3765 | cost = 0; |
75a70cf9 | 3766 | |
58b83435 | 3767 | /* Account for the cost of moving to / from memory. */ |
3768 | if (gimple_store_p (stmt)) | |
3769 | cost += estimate_move_cost (TREE_TYPE (lhs)); | |
3770 | if (gimple_assign_load_p (stmt)) | |
94e6e359 | 3771 | cost += estimate_move_cost (TREE_TYPE (rhs)); |
3772 | ||
3773 | cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights, | |
3774 | gimple_assign_rhs1 (stmt), | |
3775 | get_gimple_rhs_class (gimple_assign_rhs_code (stmt)) | |
3776 | == GIMPLE_BINARY_RHS | |
3777 | ? gimple_assign_rhs2 (stmt) : NULL); | |
75a70cf9 | 3778 | break; |
3779 | ||
3780 | case GIMPLE_COND: | |
94e6e359 | 3781 | cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights, |
3782 | gimple_op (stmt, 0), | |
3783 | gimple_op (stmt, 1)); | |
75a70cf9 | 3784 | break; |
3785 | ||
3786 | case GIMPLE_SWITCH: | |
3787 | /* Take into account cost of the switch + guess 2 conditional jumps for | |
48e1416a | 3788 | each case label. |
75a70cf9 | 3789 | |
3790 | TODO: once the switch expansion logic is sufficiently separated, we can | |
3791 | do better job on estimating cost of the switch. */ | |
94e6e359 | 3792 | if (weights->time_based) |
3793 | cost = floor_log2 (gimple_switch_num_labels (stmt)) * 2; | |
3794 | else | |
3795 | cost = gimple_switch_num_labels (stmt) * 2; | |
4ee9c684 | 3796 | break; |
75a70cf9 | 3797 | |
3798 | case GIMPLE_CALL: | |
4ee9c684 | 3799 | { |
75a70cf9 | 3800 | tree decl = gimple_call_fndecl (stmt); |
20da2013 | 3801 | struct cgraph_node *node = NULL; |
4ee9c684 | 3802 | |
958b3c8a | 3803 | /* Do not special case builtins where we see the body. |
3804 | This just confuse inliner. */ | |
02774f2d | 3805 | if (!decl || !(node = cgraph_get_node (decl)) || node->definition) |
5ccf5ee5 | 3806 | ; |
958b3c8a | 3807 | /* For buitins that are likely expanded to nothing or |
3808 | inlined do not account operand costs. */ | |
3809 | else if (is_simple_builtin (decl)) | |
a6b74a67 | 3810 | return 0; |
3811 | else if (is_inexpensive_builtin (decl)) | |
958b3c8a | 3812 | return weights->target_builtin_call_cost; |
5ccf5ee5 | 3813 | else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL) |
3814 | { | |
3815 | /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so | |
3816 | specialize the cheap expansion we do here. | |
3817 | ??? This asks for a more general solution. */ | |
3818 | switch (DECL_FUNCTION_CODE (decl)) | |
3819 | { | |
3820 | case BUILT_IN_POW: | |
3821 | case BUILT_IN_POWF: | |
3822 | case BUILT_IN_POWL: | |
3823 | if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST | |
3824 | && REAL_VALUES_EQUAL | |
3825 | (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2)) | |
3826 | return estimate_operator_cost (MULT_EXPR, weights, | |
3827 | gimple_call_arg (stmt, 0), | |
3828 | gimple_call_arg (stmt, 0)); | |
3829 | break; | |
3830 | ||
3831 | default: | |
3832 | break; | |
3833 | } | |
3834 | } | |
48e1416a | 3835 | |
20da2013 | 3836 | cost = node ? weights->call_cost : weights->indirect_call_cost; |
1c89c7a8 | 3837 | if (gimple_call_lhs (stmt)) |
3838 | cost += estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt))); | |
3839 | for (i = 0; i < gimple_call_num_args (stmt); i++) | |
e0645921 | 3840 | { |
1c89c7a8 | 3841 | tree arg = gimple_call_arg (stmt, i); |
3842 | cost += estimate_move_cost (TREE_TYPE (arg)); | |
e0645921 | 3843 | } |
4ee9c684 | 3844 | break; |
3845 | } | |
ee68bf10 | 3846 | |
958b3c8a | 3847 | case GIMPLE_RETURN: |
3848 | return weights->return_cost; | |
3849 | ||
75a70cf9 | 3850 | case GIMPLE_GOTO: |
3851 | case GIMPLE_LABEL: | |
3852 | case GIMPLE_NOP: | |
3853 | case GIMPLE_PHI: | |
75a70cf9 | 3854 | case GIMPLE_PREDICT: |
9845d120 | 3855 | case GIMPLE_DEBUG: |
75a70cf9 | 3856 | return 0; |
3857 | ||
3858 | case GIMPLE_ASM: | |
5a5c1f81 | 3859 | { |
3860 | int count = asm_str_count (gimple_asm_string (stmt)); | |
3861 | /* 1000 means infinity. This avoids overflows later | |
3862 | with very long asm statements. */ | |
3863 | if (count > 1000) | |
3864 | count = 1000; | |
3865 | return count; | |
3866 | } | |
75a70cf9 | 3867 | |
e38def9c | 3868 | case GIMPLE_RESX: |
3869 | /* This is either going to be an external function call with one | |
3870 | argument, or two register copy statements plus a goto. */ | |
3871 | return 2; | |
3872 | ||
3873 | case GIMPLE_EH_DISPATCH: | |
3874 | /* ??? This is going to turn into a switch statement. Ideally | |
3875 | we'd have a look at the eh region and estimate the number of | |
3876 | edges involved. */ | |
3877 | return 10; | |
3878 | ||
75a70cf9 | 3879 | case GIMPLE_BIND: |
3880 | return estimate_num_insns_seq (gimple_bind_body (stmt), weights); | |
3881 | ||
3882 | case GIMPLE_EH_FILTER: | |
3883 | return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights); | |
3884 | ||
3885 | case GIMPLE_CATCH: | |
3886 | return estimate_num_insns_seq (gimple_catch_handler (stmt), weights); | |
3887 | ||
3888 | case GIMPLE_TRY: | |
3889 | return (estimate_num_insns_seq (gimple_try_eval (stmt), weights) | |
3890 | + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights)); | |
3891 | ||
3892 | /* OpenMP directives are generally very expensive. */ | |
3893 | ||
3894 | case GIMPLE_OMP_RETURN: | |
3895 | case GIMPLE_OMP_SECTIONS_SWITCH: | |
3896 | case GIMPLE_OMP_ATOMIC_STORE: | |
3897 | case GIMPLE_OMP_CONTINUE: | |
3898 | /* ...except these, which are cheap. */ | |
3899 | return 0; | |
3900 | ||
3901 | case GIMPLE_OMP_ATOMIC_LOAD: | |
3902 | return weights->omp_cost; | |
3903 | ||
3904 | case GIMPLE_OMP_FOR: | |
3905 | return (weights->omp_cost | |
3906 | + estimate_num_insns_seq (gimple_omp_body (stmt), weights) | |
3907 | + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights)); | |
3908 | ||
3909 | case GIMPLE_OMP_PARALLEL: | |
3910 | case GIMPLE_OMP_TASK: | |
3911 | case GIMPLE_OMP_CRITICAL: | |
3912 | case GIMPLE_OMP_MASTER: | |
bc7bff74 | 3913 | case GIMPLE_OMP_TASKGROUP: |
75a70cf9 | 3914 | case GIMPLE_OMP_ORDERED: |
3915 | case GIMPLE_OMP_SECTION: | |
3916 | case GIMPLE_OMP_SECTIONS: | |
3917 | case GIMPLE_OMP_SINGLE: | |
bc7bff74 | 3918 | case GIMPLE_OMP_TARGET: |
3919 | case GIMPLE_OMP_TEAMS: | |
75a70cf9 | 3920 | return (weights->omp_cost |
3921 | + estimate_num_insns_seq (gimple_omp_body (stmt), weights)); | |
ee68bf10 | 3922 | |
4c0315d0 | 3923 | case GIMPLE_TRANSACTION: |
3924 | return (weights->tm_cost | |
3925 | + estimate_num_insns_seq (gimple_transaction_body (stmt), | |
3926 | weights)); | |
3927 | ||
4ee9c684 | 3928 | default: |
8c0963c4 | 3929 | gcc_unreachable (); |
4ee9c684 | 3930 | } |
75a70cf9 | 3931 | |
3932 | return cost; | |
4ee9c684 | 3933 | } |
3934 | ||
75a70cf9 | 3935 | /* Estimate number of instructions that will be created by expanding |
3936 | function FNDECL. WEIGHTS contains weights attributed to various | |
3937 | constructs. */ | |
5ff0afa2 | 3938 | |
4ee9c684 | 3939 | int |
75a70cf9 | 3940 | estimate_num_insns_fn (tree fndecl, eni_weights *weights) |
4ee9c684 | 3941 | { |
75a70cf9 | 3942 | struct function *my_function = DECL_STRUCT_FUNCTION (fndecl); |
3943 | gimple_stmt_iterator bsi; | |
e27482aa | 3944 | basic_block bb; |
75a70cf9 | 3945 | int n = 0; |
e27482aa | 3946 | |
75a70cf9 | 3947 | gcc_assert (my_function && my_function->cfg); |
3948 | FOR_EACH_BB_FN (bb, my_function) | |
e27482aa | 3949 | { |
75a70cf9 | 3950 | for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi)) |
3951 | n += estimate_num_insns (gsi_stmt (bsi), weights); | |
e27482aa | 3952 | } |
e27482aa | 3953 | |
75a70cf9 | 3954 | return n; |
bc8bb825 | 3955 | } |
3956 | ||
75a70cf9 | 3957 | |
bc8bb825 | 3958 | /* Initializes weights used by estimate_num_insns. */ |
3959 | ||
3960 | void | |
3961 | init_inline_once (void) | |
3962 | { | |
bc8bb825 | 3963 | eni_size_weights.call_cost = 1; |
20da2013 | 3964 | eni_size_weights.indirect_call_cost = 3; |
4a5b1b7c | 3965 | eni_size_weights.target_builtin_call_cost = 1; |
bc8bb825 | 3966 | eni_size_weights.div_mod_cost = 1; |
bc8bb825 | 3967 | eni_size_weights.omp_cost = 40; |
4c0315d0 | 3968 | eni_size_weights.tm_cost = 10; |
94e6e359 | 3969 | eni_size_weights.time_based = false; |
958b3c8a | 3970 | eni_size_weights.return_cost = 1; |
bc8bb825 | 3971 | |
3972 | /* Estimating time for call is difficult, since we have no idea what the | |
3973 | called function does. In the current uses of eni_time_weights, | |
3974 | underestimating the cost does less harm than overestimating it, so | |
85694bac | 3975 | we choose a rather small value here. */ |
bc8bb825 | 3976 | eni_time_weights.call_cost = 10; |
20da2013 | 3977 | eni_time_weights.indirect_call_cost = 15; |
958b3c8a | 3978 | eni_time_weights.target_builtin_call_cost = 1; |
bc8bb825 | 3979 | eni_time_weights.div_mod_cost = 10; |
bc8bb825 | 3980 | eni_time_weights.omp_cost = 40; |
4c0315d0 | 3981 | eni_time_weights.tm_cost = 40; |
94e6e359 | 3982 | eni_time_weights.time_based = true; |
958b3c8a | 3983 | eni_time_weights.return_cost = 2; |
4ee9c684 | 3984 | } |
3985 | ||
75a70cf9 | 3986 | /* Estimate the number of instructions in a gimple_seq. */ |
3987 | ||
3988 | int | |
3989 | count_insns_seq (gimple_seq seq, eni_weights *weights) | |
3990 | { | |
3991 | gimple_stmt_iterator gsi; | |
3992 | int n = 0; | |
3993 | for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi)) | |
3994 | n += estimate_num_insns (gsi_stmt (gsi), weights); | |
3995 | ||
3996 | return n; | |
3997 | } | |
3998 | ||
3999 | ||
e27482aa | 4000 | /* Install new lexical TREE_BLOCK underneath 'current_block'. */ |
75a70cf9 | 4001 | |
e27482aa | 4002 | static void |
cb302f29 | 4003 | prepend_lexical_block (tree current_block, tree new_block) |
e27482aa | 4004 | { |
cb302f29 | 4005 | BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block); |
4006 | BLOCK_SUBBLOCKS (current_block) = new_block; | |
e27482aa | 4007 | BLOCK_SUPERCONTEXT (new_block) = current_block; |
e27482aa | 4008 | } |
4009 | ||
2ab2ce89 | 4010 | /* Add local variables from CALLEE to CALLER. */ |
4011 | ||
4012 | static inline void | |
4013 | add_local_variables (struct function *callee, struct function *caller, | |
6a1933ed | 4014 | copy_body_data *id) |
2ab2ce89 | 4015 | { |
4016 | tree var; | |
4017 | unsigned ix; | |
4018 | ||
4019 | FOR_EACH_LOCAL_DECL (callee, ix, var) | |
6a1933ed | 4020 | if (!can_be_nonlocal (var, id)) |
2e4223e3 | 4021 | { |
4022 | tree new_var = remap_decl (var, id); | |
4023 | ||
4024 | /* Remap debug-expressions. */ | |
4025 | if (TREE_CODE (new_var) == VAR_DECL | |
8e966116 | 4026 | && DECL_HAS_DEBUG_EXPR_P (var) |
2e4223e3 | 4027 | && new_var != var) |
4028 | { | |
4029 | tree tem = DECL_DEBUG_EXPR (var); | |
4030 | bool old_regimplify = id->regimplify; | |
4031 | id->remapping_type_depth++; | |
4032 | walk_tree (&tem, copy_tree_body_r, id, NULL); | |
4033 | id->remapping_type_depth--; | |
4034 | id->regimplify = old_regimplify; | |
4035 | SET_DECL_DEBUG_EXPR (new_var, tem); | |
8e966116 | 4036 | DECL_HAS_DEBUG_EXPR_P (new_var) = 1; |
2e4223e3 | 4037 | } |
4038 | add_local_decl (caller, new_var); | |
4039 | } | |
2ab2ce89 | 4040 | } |
4041 | ||
/* If STMT is a GIMPLE_CALL, replace it with its inline expansion.

   BB is the basic block that holds STMT and ID is the copy-body state of
   the function being inlined into (id->dst_node is used to look up the
   call graph edge of STMT).

   Return true when the callee body was copied in place of the call.
   Return false, leaving STMT untouched, when STMT is not a call, when the
   edge has an unknown indirect callee, or when the edge is marked
   inline_failed (in which case an always_inline error or a -Winline
   warning may be emitted first).

   input_location is set to the location of STMT for the duration of the
   function and restored before returning.  */

static bool
expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
{
  tree use_retvar;
  tree fn;
  /* Saved values of id->decl_map and id->debug_map respectively.  */
  struct pointer_map_t *st, *dst;
  tree return_slot;
  tree modify_dest;
  location_t saved_location;
  struct cgraph_edge *cg_edge;
  cgraph_inline_failed_t reason;
  basic_block return_block;
  edge e;
  gimple_stmt_iterator gsi, stmt_gsi;
  bool successfully_inlined = FALSE;
  bool purge_dead_abnormal_edges;

  /* Set input_location here so we get the right instantiation context
     if we call instantiate_decl from inlinable_function_p.  */
  /* FIXME: instantiate_decl isn't called by inlinable_function_p.  */
  saved_location = input_location;
  input_location = gimple_location (stmt);

  /* From here on, we're only interested in CALL_EXPRs.  */
  if (gimple_code (stmt) != GIMPLE_CALL)
    goto egress;

  cg_edge = cgraph_edge (id->dst_node, stmt);
  gcc_checking_assert (cg_edge);
  /* First, see if we can figure out what function is being called.
     If we cannot, then there is no hope of inlining the function.  */
  if (cg_edge->indirect_unknown_callee)
    goto egress;
  fn = cg_edge->callee->decl;
  gcc_checking_assert (fn);

  /* If FN is a declaration of a function in a nested scope that was
     globally declared inline, we don't set its DECL_INITIAL.
     However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
     C++ front-end uses it for cdtors to refer to their internal
     declarations, that are not real functions.  Fortunately those
     don't have trees to be saved, so we can tell by checking their
     gimple_body.  */
  if (!DECL_INITIAL (fn)
      && DECL_ABSTRACT_ORIGIN (fn)
      && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
    fn = DECL_ABSTRACT_ORIGIN (fn);

  /* Don't try to inline functions that are not well-suited to inlining.
     Every path through this branch ends at EGRESS without inlining; the
     only question is whether a diagnostic is issued first.  */
  if (cg_edge->inline_failed)
    {
      reason = cg_edge->inline_failed;
      /* If this call was originally indirect, we do not want to emit any
         inlining related warnings or sorry messages because there are no
         guarantees regarding those.  */
      if (cg_edge->indirect_inlining_edge)
        goto egress;

      if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
          /* For extern inline functions that get redefined we always
             silently ignored always_inline flag.  Better behaviour would
             be to be able to keep both bodies and use extern inline body
             for inlining, but we can't do that because frontends overwrite
             the body.  */
          && !cg_edge->callee->local.redefined_extern_inline
          /* During early inline pass, report only when optimization is
             not turned on.  */
          && (cgraph_global_info_ready
              || !optimize)
          /* PR 20090218-1_0.c.  Body can be provided by another module.  */
          && (reason != CIF_BODY_NOT_AVAILABLE || !flag_generate_lto))
        {
          error ("inlining failed in call to always_inline %q+F: %s", fn,
                 cgraph_inline_failed_string (reason));
          error ("called from here");
        }
      else if (warn_inline
               && DECL_DECLARED_INLINE_P (fn)
               && !DECL_NO_INLINE_WARNING_P (fn)
               && !DECL_IN_SYSTEM_HEADER (fn)
               && reason != CIF_UNSPECIFIED
               && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
               /* Do not warn about not inlined recursive calls.  */
               && !cgraph_edge_recursive_p (cg_edge)
               /* Avoid warnings during early inline pass.  */
               && cgraph_global_info_ready)
        {
          warning (OPT_Winline, "inlining failed in call to %q+F: %s",
                   fn, _(cgraph_inline_failed_string (reason)));
          warning (OPT_Winline, "called from here");
        }
      goto egress;
    }
  /* From here on FN is the callee's own decl again; any substitution of
     DECL_ABSTRACT_ORIGIN made above is discarded.  */
  fn = cg_edge->callee->decl;
  cgraph_get_body (cg_edge->callee);

#ifdef ENABLE_CHECKING
  /* The callee node is verified only when it is not the function we are
     inlining into.  */
  if (cg_edge->callee->decl != id->dst_node->decl)
    verify_cgraph_node (cg_edge->callee);
#endif

  /* We will be inlining this callee.  */
  id->eh_lp_nr = lookup_stmt_eh_lp (stmt);

  /* Update the callers EH personality.  */
  if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
    DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
      = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);

  /* Split the block holding the GIMPLE_CALL.  After this BB is the part
     that ends with the call and RETURN_BLOCK is the part that follows
     it; the edge between the two is removed.  */
  e = split_block (bb, stmt);
  bb = e->src;
  return_block = e->dest;
  remove_edge (e);

  /* split_block splits after the statement; work around this by
     moving the call into the second block manually.  Not pretty,
     but seems easier than doing the CFG manipulation by hand
     when the GIMPLE_CALL is in the last statement of BB.  */
  stmt_gsi = gsi_last_bb (bb);
  gsi_remove (&stmt_gsi, false);

  /* If the GIMPLE_CALL was in the last statement of BB, it may have
     been the source of abnormal edges.  In this case, schedule
     the removal of dead abnormal edges.  */
  gsi = gsi_start_bb (return_block);
  if (gsi_end_p (gsi))
    {
      gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
      purge_dead_abnormal_edges = true;
    }
  else
    {
      gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
      purge_dead_abnormal_edges = false;
    }

  /* STMT_GSI now designates the first statement of RETURN_BLOCK.  It is
     the iterator used further down to replace or remove the call.  */
  stmt_gsi = gsi_start_bb (return_block);

  /* Build a block containing code to initialize the arguments, the
     actual inline expansion of the body, and a label for the return
     statements within the function to jump to.  The type of the
     statement expression is the return type of the function call.
     ???  If the call does not have an associated block then we will
     remap all callee blocks to NULL, effectively dropping most of
     its debug information.  This should only happen for calls to
     artificial decls inserted by the compiler itself.  We need to
     either link the inlined blocks into the caller block tree or
     not refer to them in any way to not break GC for locations.  */
  if (gimple_block (stmt))
    {
      id->block = make_node (BLOCK);
      BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
      BLOCK_SOURCE_LOCATION (id->block) = LOCATION_LOCUS (input_location);
      prepend_lexical_block (gimple_block (stmt), id->block);
    }

  /* Local declarations will be replaced by their equivalents in this
     map.  The previous maps are kept in ST and DST and put back during
     the clean-up below.  */
  st = id->decl_map;
  id->decl_map = pointer_map_create ();
  dst = id->debug_map;
  id->debug_map = NULL;

  /* Record the function we are about to inline.  */
  id->src_fn = fn;
  id->src_node = cg_edge->callee;
  id->src_cfun = DECL_STRUCT_FUNCTION (fn);
  id->gimple_call = stmt;

  gcc_assert (!id->src_cfun->after_inlining);

  id->entry_bb = bb;
  /* For a callee carrying the "cold" attribute, append a
     PRED_COLD_FUNCTION / NOT_TAKEN predictor at the end of BB.  */
  if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
    {
      gimple_stmt_iterator si = gsi_last_bb (bb);
      gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
                                                   NOT_TAKEN),
                        GSI_NEW_STMT);
    }
  initialize_inlined_parameters (id, stmt, fn, bb);

  if (DECL_INITIAL (fn))
    {
      if (gimple_block (stmt))
        {
          tree *var;

          prepend_lexical_block (id->block,
                                 remap_blocks (DECL_INITIAL (fn), id));
          gcc_checking_assert (BLOCK_SUBBLOCKS (id->block)
                               && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id->block))
                                   == NULL_TREE));
          /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
             otherwise for DWARF DW_TAG_formal_parameter will not be children of
             DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
             under it.  The parameters can be then evaluated in the debugger,
             but don't show in backtraces.  */
          /* VAR points at the link being examined, so an entry can be
             unlinked in place; it only advances when nothing was moved.  */
          for (var = &BLOCK_VARS (BLOCK_SUBBLOCKS (id->block)); *var; )
            if (TREE_CODE (DECL_ORIGIN (*var)) == PARM_DECL)
              {
                tree v = *var;
                *var = TREE_CHAIN (v);
                TREE_CHAIN (v) = BLOCK_VARS (id->block);
                BLOCK_VARS (id->block) = v;
              }
            else
              var = &TREE_CHAIN (*var);
        }
      else
        remap_blocks_to_null (DECL_INITIAL (fn), id);
    }

  /* Return statements in the function body will be replaced by jumps
     to the RET_LABEL.  */
  gcc_assert (DECL_INITIAL (fn));
  gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);

  /* Find the LHS to which the result of this call is assigned.  */
  return_slot = NULL;
  if (gimple_call_lhs (stmt))
    {
      modify_dest = gimple_call_lhs (stmt);

      /* The function which we are inlining might not return a value,
         in which case we should issue a warning that the function
         does not return a value.  In that case the optimizers will
         see that the variable to which the value is assigned was not
         initialized.  We do not want to issue a warning about that
         uninitialized variable.  */
      if (DECL_P (modify_dest))
        TREE_NO_WARNING (modify_dest) = 1;

      /* With the return-slot optimization the LHS is passed on as the
         return slot rather than as the destination of a store.  */
      if (gimple_call_return_slot_opt_p (stmt))
        {
          return_slot = modify_dest;
          modify_dest = NULL;
        }
    }
  else
    modify_dest = NULL;

  /* If we are inlining a call to the C++ operator new, we don't want
     to use type based alias analysis on the return value.  Otherwise
     we may get confused if the compiler sees that the inlined new
     function returns a pointer which was just deleted.  See bug
     33407.  */
  if (DECL_IS_OPERATOR_NEW (fn))
    {
      return_slot = NULL;
      modify_dest = NULL;
    }

  /* Declare the return variable for the function.  */
  use_retvar = declare_return_variable (id, return_slot, modify_dest, bb);

  /* Add local vars in this inlined callee to caller.  */
  add_local_variables (id->src_cfun, cfun, id);

  if (dump_file && (dump_flags & TDF_DETAILS))
    {
      fprintf (dump_file, "Inlining ");
      print_generic_expr (dump_file, id->src_fn, 0);
      fprintf (dump_file, " to ");
      print_generic_expr (dump_file, id->dst_fn, 0);
      fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
    }

  /* This is it.  Duplicate the callee body.  Assume callee is
     pre-gimplified.  Note that we must not alter the caller
     function in any way before this point, as this CALL_EXPR may be
     a self-referential call; if we're calling ourselves, we need to
     duplicate our body before altering anything.  */
  copy_body (id, bb->count,
             GCOV_COMPUTE_SCALE (cg_edge->frequency, CGRAPH_FREQ_BASE),
             bb, return_block, NULL);

  /* Reset the escaped solution.  */
  if (cfun->gimple_df)
    pt_solution_reset (&cfun->gimple_df->escaped);

  /* Clean up.  */
  /* NOTE(review): DST is put back only when a debug map exists at this
     point; otherwise id->debug_map keeps the NULL stored above.
     Presumably DST is always NULL on entry - confirm against callers.  */
  if (id->debug_map)
    {
      pointer_map_destroy (id->debug_map);
      id->debug_map = dst;
    }
  pointer_map_destroy (id->decl_map);
  id->decl_map = st;

  /* Unlink the calls virtual operands before replacing it.  */
  unlink_stmt_vdef (stmt);

  /* If the inlined function returns a result that we care about,
     substitute the GIMPLE_CALL with an assignment of the return
     variable to the LHS of the call.  That is, if STMT was
     'a = foo (...)', substitute the call with 'a = USE_RETVAR'.  */
  if (use_retvar && gimple_call_lhs (stmt))
    {
      gimple old_stmt = stmt;
      stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
      gsi_replace (&stmt_gsi, stmt, false);
      maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
    }
  else
    {
      /* Handle the case of inlining a function with no return
         statement, which causes the return value to become undefined.  */
      if (gimple_call_lhs (stmt)
          && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
        {
          tree name = gimple_call_lhs (stmt);
          tree var = SSA_NAME_VAR (name);
          tree def = ssa_default_def (cfun, var);

          if (def)
            {
              /* If the variable is used undefined, make this name
                 undefined via a move.  */
              stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
              gsi_replace (&stmt_gsi, stmt, true);
            }
          else
            {
              /* Otherwise make this variable undefined.  */
              gsi_remove (&stmt_gsi, true);
              set_ssa_default_def (cfun, var, name);
              SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
            }
        }
      else
        gsi_remove (&stmt_gsi, true);
    }

  /* Set above when the call had nothing after it in its original
     block.  */
  if (purge_dead_abnormal_edges)
    {
      gimple_purge_dead_eh_edges (return_block);
      gimple_purge_dead_abnormal_call_edges (return_block);
    }

  /* If the value of the new expression is ignored, that's OK.  We
     don't warn about this for CALL_EXPRs, so we shouldn't warn about
     the equivalent inlined version either.  */
  if (is_gimple_assign (stmt))
    {
      gcc_assert (gimple_assign_single_p (stmt)
                  || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
      TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
    }

  /* Output the inlining info for this abstract function, since it has been
     inlined.  If we don't do this now, we can lose the information about the
     variables in the function when the blocks get blown away as soon as we
     remove the cgraph node.  */
  if (gimple_block (stmt))
    (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);

  /* Update callgraph if needed.  */
  cgraph_remove_node (cg_edge->callee);

  id->block = NULL_TREE;
  successfully_inlined = TRUE;

  /* Common exit: every path, successful or not, restores
     input_location.  */
 egress:
  input_location = saved_location;
  return successfully_inlined;
}
4ee9c684 | 4411 | |
e27482aa | 4412 | /* Expand call statements reachable from STMT_P. |
4413 | We can only have CALL_EXPRs as the "toplevel" tree code or nested | |
4c0315d0 | 4414 | in a MODIFY_EXPR. */ |
e27482aa | 4415 | |
4416 | static bool | |
51a48c27 | 4417 | gimple_expand_calls_inline (basic_block bb, copy_body_data *id) |
4ee9c684 | 4418 | { |
75a70cf9 | 4419 | gimple_stmt_iterator gsi; |
4ee9c684 | 4420 | |
75a70cf9 | 4421 | for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi)) |
4ee9c684 | 4422 | { |
75a70cf9 | 4423 | gimple stmt = gsi_stmt (gsi); |
e27482aa | 4424 | |
75a70cf9 | 4425 | if (is_gimple_call (stmt) |
4426 | && expand_call_inline (bb, stmt, id)) | |
4427 | return true; | |
4ee9c684 | 4428 | } |
75a70cf9 | 4429 | |
e27482aa | 4430 | return false; |
4ee9c684 | 4431 | } |
4432 | ||
75a70cf9 | 4433 | |
/* Walk the basic blocks of cfun with index FIRST and above (up to, but
   not including, n_basic_blocks_for_fn) and try to fold every statement
   that is a member of the STATEMENTS pointer set.  Indices with no
   basic block are skipped.

   After a successful fold the new statement(s) are passed to
   update_stmt, the call graph edges are updated through
   cgraph_update_edges_for_call_stmt, and dead EH edges are purged when
   maybe_clean_or_replace_eh_stmt reports a change.  */

static void
fold_marked_statements (int first, struct pointer_set_t *statements)
{
  for (; first < n_basic_blocks_for_fn (cfun); first++)
    if (BASIC_BLOCK (first))
      {
        gimple_stmt_iterator gsi;

        for (gsi = gsi_start_bb (BASIC_BLOCK (first));
             !gsi_end_p (gsi);
             gsi_next (&gsi))
          if (pointer_set_contains (statements, gsi_stmt (gsi)))
            {
              gimple old_stmt = gsi_stmt (gsi);
              /* Called decl of OLD_STMT, or 0 when OLD_STMT is not a
                 call.  */
              tree old_decl = is_gimple_call (old_stmt)
                              ? gimple_call_fndecl (old_stmt) : 0;

              if (old_decl && DECL_BUILT_IN (old_decl))
                {
                  /* Folding builtins can create multiple instructions,
                     we need to look at all of them.  I2 remembers the
                     statement before the one being folded so that the
                     first statement produced by folding can be found
                     again afterwards.  */
                  gimple_stmt_iterator i2 = gsi;
                  gsi_prev (&i2);
                  if (fold_stmt (&gsi))
                    {
                      gimple new_stmt;
                      /* If a builtin at the end of a bb folded into nothing,
                         the following loop won't work.  This BREAK leaves
                         the statement loop of the current block.  */
                      if (gsi_end_p (gsi))
                        {
                          cgraph_update_edges_for_call_stmt (old_stmt,
                                                             old_decl, NULL);
                          break;
                        }
                      /* Position I2 on the first statement produced by
                         the fold: the start of the block when the folded
                         statement had no predecessor, otherwise the
                         statement after the remembered one.  */
                      if (gsi_end_p (i2))
                        i2 = gsi_start_bb (BASIC_BLOCK (first));
                      else
                        gsi_next (&i2);
                      /* Process every statement from I2 up to and
                         including the one GSI designates.  */
                      while (1)
                        {
                          new_stmt = gsi_stmt (i2);
                          update_stmt (new_stmt);
                          cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
                                                             new_stmt);

                          if (new_stmt == gsi_stmt (gsi))
                            {
                              /* It is okay to check only for the very last
                                 of these statements.  If it is a throwing
                                 statement nothing will change.  If it isn't
                                 this can remove EH edges.  If that weren't
                                 correct then because some intermediate stmts
                                 throw, but not the last one.  That would mean
                                 we'd have to split the block, which we can't
                                 here and we'd lose anyway.  And as builtins
                                 probably never throw, this all
                                 is moot anyway.  */
                              if (maybe_clean_or_replace_eh_stmt (old_stmt,
                                                                  new_stmt))
                                gimple_purge_dead_eh_edges (BASIC_BLOCK (first));
                              break;
                            }
                          gsi_next (&i2);
                        }
                    }
                }
              else if (fold_stmt (&gsi))
                {
                  /* Re-read the statement from GSI as fold_stmt() may
                     have changed it.  */
                  gimple new_stmt = gsi_stmt (gsi);
                  update_stmt (new_stmt);

                  /* The call graph is only touched when a call is
                     involved on either side of the fold.  */
                  if (is_gimple_call (old_stmt)
                      || is_gimple_call (new_stmt))
                    cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
                                                       new_stmt);

                  if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
                    gimple_purge_dead_eh_edges (BASIC_BLOCK (first));
                }
            }
      }
}
4520 | ||
e343483a | 4521 | /* Expand calls to inline functions in the body of FN. */ |
4522 | ||
09a2e412 | 4523 | unsigned int |
60b8c5b3 | 4524 | optimize_inline_calls (tree fn) |
e343483a | 4525 | { |
51a48c27 | 4526 | copy_body_data id; |
e27482aa | 4527 | basic_block bb; |
a28770e1 | 4528 | int last = n_basic_blocks_for_fn (cfun); |
d1ead98b | 4529 | bool inlined_p = false; |
dac18d1a | 4530 | |
e343483a | 4531 | /* Clear out ID. */ |
4532 | memset (&id, 0, sizeof (id)); | |
4533 | ||
fd6a3c41 | 4534 | id.src_node = id.dst_node = cgraph_get_node (fn); |
02774f2d | 4535 | gcc_assert (id.dst_node->definition); |
51a48c27 | 4536 | id.dst_fn = fn; |
e343483a | 4537 | /* Or any functions that aren't finished yet. */ |
e343483a | 4538 | if (current_function_decl) |
f018d957 | 4539 | id.dst_fn = current_function_decl; |
51a48c27 | 4540 | |
4541 | id.copy_decl = copy_decl_maybe_to_var; | |
4542 | id.transform_call_graph_edges = CB_CGE_DUPLICATE; | |
4543 | id.transform_new_cfg = false; | |
4544 | id.transform_return_to_modify = true; | |
6b99cb5e | 4545 | id.transform_parameter = true; |
32020b10 | 4546 | id.transform_lang_insert_block = NULL; |
3e9045dd | 4547 | id.statements_to_fold = pointer_set_create (); |
51a48c27 | 4548 | |
8a4a28a8 | 4549 | push_gimplify_context (); |
e343483a | 4550 | |
31a8456e | 4551 | /* We make no attempts to keep dominance info up-to-date. */ |
4552 | free_dominance_info (CDI_DOMINATORS); | |
4553 | free_dominance_info (CDI_POST_DOMINATORS); | |
4554 | ||
75a70cf9 | 4555 | /* Register specific gimple functions. */ |
4556 | gimple_register_cfg_hooks (); | |
4557 | ||
e27482aa | 4558 | /* Reach the trees by walking over the CFG, and note the |
4559 | enclosing basic-blocks in the call edges. */ | |
4560 | /* We walk the blocks going forward, because inlined function bodies | |
4561 | will split id->current_basic_block, and the new blocks will | |
4562 | follow it; we'll trudge through them, processing their CALL_EXPRs | |
4563 | along the way. */ | |
4564 | FOR_EACH_BB (bb) | |
d1ead98b | 4565 | inlined_p |= gimple_expand_calls_inline (bb, &id); |
e343483a | 4566 | |
e27482aa | 4567 | pop_gimplify_context (NULL); |
4ee9c684 | 4568 | |
b0cdf642 | 4569 | #ifdef ENABLE_CHECKING |
4570 | { | |
4571 | struct cgraph_edge *e; | |
4572 | ||
51a48c27 | 4573 | verify_cgraph_node (id.dst_node); |
b0cdf642 | 4574 | |
4575 | /* Double check that we inlined everything we are supposed to inline. */ | |
51a48c27 | 4576 | for (e = id.dst_node->callees; e; e = e->next_callee) |
8c0963c4 | 4577 | gcc_assert (e->inline_failed); |
b0cdf642 | 4578 | } |
4579 | #endif | |
48e1416a | 4580 | |
d1ead98b | 4581 | /* Fold queued statements. */ |
184e9f8f | 4582 | fold_marked_statements (last, id.statements_to_fold); |
4583 | pointer_set_destroy (id.statements_to_fold); | |
48e1416a | 4584 | |
f1f41a6c | 4585 | gcc_assert (!id.debug_stmts.exists ()); |
9845d120 | 4586 | |
d1ead98b | 4587 | /* If we didn't inline into the function there is nothing to do. */ |
4588 | if (!inlined_p) | |
4589 | return 0; | |
4590 | ||
184e9f8f | 4591 | /* Renumber the lexical scoping (non-code) blocks consecutively. */ |
4592 | number_blocks (fn); | |
3e9045dd | 4593 | |
31359ae8 | 4594 | delete_unreachable_blocks_update_callgraph (&id); |
4595 | #ifdef ENABLE_CHECKING | |
4596 | verify_cgraph_node (id.dst_node); | |
4597 | #endif | |
75a70cf9 | 4598 | |
deff5ffd | 4599 | /* It would be nice to check SSA/CFG/statement consistency here, but it is |
4600 | not possible yet - the IPA passes might make various functions to not | |
4601 | throw and they don't care to proactively update local EH info. This is | |
4602 | done later in fixup_cfg pass that also execute the verification. */ | |
75a70cf9 | 4603 | return (TODO_update_ssa |
4604 | | TODO_cleanup_cfg | |
4ae20857 | 4605 | | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0) |
d1ead98b | 4606 | | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0) |
4ae20857 | 4607 | | (profile_status != PROFILE_ABSENT ? TODO_rebuild_frequencies : 0)); |
e343483a | 4608 | } |
4609 | ||
e343483a | 4610 | /* Passed to walk_tree. Copies the node pointed to, if appropriate. */ |
4611 | ||
4612 | tree | |
60b8c5b3 | 4613 | copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED) |
e343483a | 4614 | { |
4615 | enum tree_code code = TREE_CODE (*tp); | |
35cc02b5 | 4616 | enum tree_code_class cl = TREE_CODE_CLASS (code); |
e343483a | 4617 | |
4618 | /* We make copies of most nodes. */ | |
35cc02b5 | 4619 | if (IS_EXPR_CODE_CLASS (cl) |
e343483a | 4620 | || code == TREE_LIST |
4621 | || code == TREE_VEC | |
55d97af6 | 4622 | || code == TYPE_DECL |
4623 | || code == OMP_CLAUSE) | |
e343483a | 4624 | { |
4625 | /* Because the chain gets clobbered when we make a copy, we save it | |
4626 | here. */ | |
f4e36c33 | 4627 | tree chain = NULL_TREE, new_tree; |
35cc02b5 | 4628 | |
9b88d08d | 4629 | if (CODE_CONTAINS_STRUCT (code, TS_COMMON)) |
4630 | chain = TREE_CHAIN (*tp); | |
e343483a | 4631 | |
4632 | /* Copy the node. */ | |
f4e36c33 | 4633 | new_tree = copy_node (*tp); |
4ee9c684 | 4634 | |
f4e36c33 | 4635 | *tp = new_tree; |
e343483a | 4636 | |
4637 | /* Now, restore the chain, if appropriate. That will cause | |
4638 | walk_tree to walk into the chain as well. */ | |
773c5ba7 | 4639 | if (code == PARM_DECL |
4640 | || code == TREE_LIST | |
55d6e7cd | 4641 | || code == OMP_CLAUSE) |
e343483a | 4642 | TREE_CHAIN (*tp) = chain; |
4643 | ||
4644 | /* For now, we don't update BLOCKs when we make copies. So, we | |
4ee9c684 | 4645 | have to nullify all BIND_EXPRs. */ |
4646 | if (TREE_CODE (*tp) == BIND_EXPR) | |
4647 | BIND_EXPR_BLOCK (*tp) = NULL_TREE; | |
e343483a | 4648 | } |
c75b4594 | 4649 | else if (code == CONSTRUCTOR) |
4650 | { | |
4651 | /* CONSTRUCTOR nodes need special handling because | |
4652 | we need to duplicate the vector of elements. */ | |
f4e36c33 | 4653 | tree new_tree; |
c75b4594 | 4654 | |
f4e36c33 | 4655 | new_tree = copy_node (*tp); |
f1f41a6c | 4656 | CONSTRUCTOR_ELTS (new_tree) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp)); |
f4e36c33 | 4657 | *tp = new_tree; |
c75b4594 | 4658 | } |
d55ebb6a | 4659 | else if (code == STATEMENT_LIST) |
17476aac | 4660 | /* We used to just abort on STATEMENT_LIST, but we can run into them |
4661 | with statement-expressions (c++/40975). */ | |
4662 | copy_statement_list (tp); | |
ce45a448 | 4663 | else if (TREE_CODE_CLASS (code) == tcc_type) |
e343483a | 4664 | *walk_subtrees = 0; |
ce45a448 | 4665 | else if (TREE_CODE_CLASS (code) == tcc_declaration) |
4ee9c684 | 4666 | *walk_subtrees = 0; |
d5406300 | 4667 | else if (TREE_CODE_CLASS (code) == tcc_constant) |
4668 | *walk_subtrees = 0; | |
e343483a | 4669 | return NULL_TREE; |
4670 | } | |
4671 | ||
4672 | /* The SAVE_EXPR pointed to by TP is being copied. If ST contains | |
5ff0afa2 | 4673 | information indicating to what new SAVE_EXPR this one should be mapped, |
e27482aa | 4674 | use that one. Otherwise, create a new node and enter it in ST. FN is |
4675 | the function into which the copy will be placed. */ | |
e343483a | 4676 | |
8c143e71 | 4677 | static void |
67c155cb | 4678 | remap_save_expr (tree *tp, void *st_, int *walk_subtrees) |
e343483a | 4679 | { |
e3022db7 | 4680 | struct pointer_map_t *st = (struct pointer_map_t *) st_; |
4681 | tree *n; | |
fcc73461 | 4682 | tree t; |
e343483a | 4683 | |
4684 | /* See if we already encountered this SAVE_EXPR. */ | |
e3022db7 | 4685 | n = (tree *) pointer_map_contains (st, *tp); |
40570cc2 | 4686 | |
e343483a | 4687 | /* If we didn't already remap this SAVE_EXPR, do so now. */ |
4688 | if (!n) | |
4689 | { | |
fcc73461 | 4690 | t = copy_node (*tp); |
e343483a | 4691 | |
e343483a | 4692 | /* Remember this SAVE_EXPR. */ |
e3022db7 | 4693 | *pointer_map_insert (st, *tp) = t; |
da3bde1a | 4694 | /* Make sure we don't remap an already-remapped SAVE_EXPR. */ |
e3022db7 | 4695 | *pointer_map_insert (st, t) = t; |
e343483a | 4696 | } |
4697 | else | |
fcc73461 | 4698 | { |
4699 | /* We've already walked into this SAVE_EXPR; don't do it again. */ | |
4700 | *walk_subtrees = 0; | |
e3022db7 | 4701 | t = *n; |
fcc73461 | 4702 | } |
e343483a | 4703 | |
4704 | /* Replace this SAVE_EXPR with the copy. */ | |
fcc73461 | 4705 | *tp = t; |
e343483a | 4706 | } |
d57cd35f | 4707 | |
75a70cf9 | 4708 | /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local |
4709 | label, copies the declaration and enters it in the splay_tree in DATA (which | |
4710 | is really a 'copy_body_data *'. */ | |
4711 | ||
4712 | static tree | |
4713 | mark_local_labels_stmt (gimple_stmt_iterator *gsip, | |
4714 | bool *handled_ops_p ATTRIBUTE_UNUSED, | |
4715 | struct walk_stmt_info *wi) | |
4716 | { | |
4717 | copy_body_data *id = (copy_body_data *) wi->info; | |
4718 | gimple stmt = gsi_stmt (*gsip); | |
4719 | ||
4720 | if (gimple_code (stmt) == GIMPLE_LABEL) | |
4721 | { | |
4722 | tree decl = gimple_label_label (stmt); | |
4723 | ||
4724 | /* Copy the decl and remember the copy. */ | |
4725 | insert_decl_map (id, decl, id->copy_decl (decl, id)); | |
4726 | } | |
4727 | ||
4728 | return NULL_TREE; | |
4729 | } | |
4730 | ||
4731 | ||
4732 | /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local. | |
4733 | Using the splay_tree pointed to by ST (which is really a `splay_tree'), | |
4734 | remaps all local declarations to appropriate replacements in gimple | |
4735 | operands. */ | |
4736 | ||
4737 | static tree | |
4738 | replace_locals_op (tree *tp, int *walk_subtrees, void *data) | |
4739 | { | |
4740 | struct walk_stmt_info *wi = (struct walk_stmt_info*) data; | |
4741 | copy_body_data *id = (copy_body_data *) wi->info; | |
4742 | struct pointer_map_t *st = id->decl_map; | |
4743 | tree *n; | |
4744 | tree expr = *tp; | |
4745 | ||
4746 | /* Only a local declaration (variable or label). */ | |
4747 | if ((TREE_CODE (expr) == VAR_DECL | |
4748 | && !TREE_STATIC (expr)) | |
4749 | || TREE_CODE (expr) == LABEL_DECL) | |
4750 | { | |
4751 | /* Lookup the declaration. */ | |
4752 | n = (tree *) pointer_map_contains (st, expr); | |
4753 | ||
4754 | /* If it's there, remap it. */ | |
4755 | if (n) | |
4756 | *tp = *n; | |
4757 | *walk_subtrees = 0; | |
4758 | } | |
4759 | else if (TREE_CODE (expr) == STATEMENT_LIST | |
4760 | || TREE_CODE (expr) == BIND_EXPR | |
4761 | || TREE_CODE (expr) == SAVE_EXPR) | |
4762 | gcc_unreachable (); | |
4763 | else if (TREE_CODE (expr) == TARGET_EXPR) | |
4764 | { | |
4765 | /* Don't mess with a TARGET_EXPR that hasn't been expanded. | |
4766 | It's OK for this to happen if it was part of a subtree that | |
4767 | isn't immediately expanded, such as operand 2 of another | |
4768 | TARGET_EXPR. */ | |
4769 | if (!TREE_OPERAND (expr, 1)) | |
4770 | { | |
4771 | TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3); | |
4772 | TREE_OPERAND (expr, 3) = NULL_TREE; | |
4773 | } | |
4774 | } | |
4775 | ||
4776 | /* Keep iterating. */ | |
4777 | return NULL_TREE; | |
4778 | } | |
4779 | ||
4780 | ||
4781 | /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local. | |
4782 | Using the splay_tree pointed to by ST (which is really a `splay_tree'), | |
4783 | remaps all local declarations to appropriate replacements in gimple | |
4784 | statements. */ | |
4785 | ||
4786 | static tree | |
4787 | replace_locals_stmt (gimple_stmt_iterator *gsip, | |
4788 | bool *handled_ops_p ATTRIBUTE_UNUSED, | |
4789 | struct walk_stmt_info *wi) | |
4790 | { | |
4791 | copy_body_data *id = (copy_body_data *) wi->info; | |
4792 | gimple stmt = gsi_stmt (*gsip); | |
4793 | ||
4794 | if (gimple_code (stmt) == GIMPLE_BIND) | |
4795 | { | |
4796 | tree block = gimple_bind_block (stmt); | |
4797 | ||
4798 | if (block) | |
4799 | { | |
4800 | remap_block (&block, id); | |
4801 | gimple_bind_set_block (stmt, block); | |
4802 | } | |
4803 | ||
4804 | /* This will remap a lot of the same decls again, but this should be | |
4805 | harmless. */ | |
4806 | if (gimple_bind_vars (stmt)) | |
f1f41a6c | 4807 | gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt), |
4808 | NULL, id)); | |
75a70cf9 | 4809 | } |
4810 | ||
4811 | /* Keep iterating. */ | |
4812 | return NULL_TREE; | |
4813 | } | |
4814 | ||
4815 | ||
4816 | /* Copies everything in SEQ and replaces variables and labels local to | |
4817 | current_function_decl. */ | |
4818 | ||
4819 | gimple_seq | |
4820 | copy_gimple_seq_and_replace_locals (gimple_seq seq) | |
4821 | { | |
4822 | copy_body_data id; | |
4823 | struct walk_stmt_info wi; | |
4824 | struct pointer_set_t *visited; | |
4825 | gimple_seq copy; | |
4826 | ||
4827 | /* There's nothing to do for NULL_TREE. */ | |
4828 | if (seq == NULL) | |
4829 | return seq; | |
4830 | ||
4831 | /* Set up ID. */ | |
4832 | memset (&id, 0, sizeof (id)); | |
4833 | id.src_fn = current_function_decl; | |
4834 | id.dst_fn = current_function_decl; | |
4835 | id.decl_map = pointer_map_create (); | |
9845d120 | 4836 | id.debug_map = NULL; |
75a70cf9 | 4837 | |
4838 | id.copy_decl = copy_decl_no_change; | |
4839 | id.transform_call_graph_edges = CB_CGE_DUPLICATE; | |
4840 | id.transform_new_cfg = false; | |
4841 | id.transform_return_to_modify = false; | |
6b99cb5e | 4842 | id.transform_parameter = false; |
75a70cf9 | 4843 | id.transform_lang_insert_block = NULL; |
4844 | ||
4845 | /* Walk the tree once to find local labels. */ | |
4846 | memset (&wi, 0, sizeof (wi)); | |
4847 | visited = pointer_set_create (); | |
4848 | wi.info = &id; | |
4849 | wi.pset = visited; | |
4850 | walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi); | |
4851 | pointer_set_destroy (visited); | |
4852 | ||
4853 | copy = gimple_seq_copy (seq); | |
4854 | ||
4855 | /* Walk the copy, remapping decls. */ | |
4856 | memset (&wi, 0, sizeof (wi)); | |
4857 | wi.info = &id; | |
4858 | walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi); | |
4859 | ||
4860 | /* Clean up. */ | |
4861 | pointer_map_destroy (id.decl_map); | |
9845d120 | 4862 | if (id.debug_map) |
4863 | pointer_map_destroy (id.debug_map); | |
75a70cf9 | 4864 | |
4865 | return copy; | |
4866 | } | |
4867 | ||
4868 | ||
4ee9c684 | 4869 | /* Allow someone to determine if SEARCH is a child of TOP from gdb. */ |
5ff0afa2 | 4870 | |
4ee9c684 | 4871 | static tree |
4872 | debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data) | |
4873 | { | |
4874 | if (*tp == data) | |
4875 | return (tree) data; | |
4876 | else | |
4877 | return NULL; | |
4878 | } | |
4879 | ||
4b987fac | 4880 | DEBUG_FUNCTION bool |
4ee9c684 | 4881 | debug_find_tree (tree top, tree search) |
4882 | { | |
4883 | return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0; | |
4884 | } | |
4885 | ||
e27482aa | 4886 | |
4ee9c684 | 4887 | /* Declare the variables created by the inliner. Add all the variables in |
4888 | VARS to BIND_EXPR. */ | |
4889 | ||
4890 | static void | |
e27482aa | 4891 | declare_inline_vars (tree block, tree vars) |
4ee9c684 | 4892 | { |
11fe6c8b | 4893 | tree t; |
1767a056 | 4894 | for (t = vars; t; t = DECL_CHAIN (t)) |
8e224d28 | 4895 | { |
4896 | DECL_SEEN_IN_BIND_EXPR_P (t) = 1; | |
4897 | gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t)); | |
2ab2ce89 | 4898 | add_local_decl (cfun, t); |
8e224d28 | 4899 | } |
4ee9c684 | 4900 | |
e27482aa | 4901 | if (block) |
4902 | BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars); | |
4903 | } | |
4904 | ||
c5235c0b | 4905 | /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN, |
51a48c27 | 4906 | but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to |
4907 | VAR_DECL translation. */ | |
c5235c0b | 4908 | |
51a48c27 | 4909 | static tree |
4910 | copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy) | |
c5235c0b | 4911 | { |
c5235c0b | 4912 | /* Don't generate debug information for the copy if we wouldn't have |
4913 | generated it for the copy either. */ | |
4914 | DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl); | |
4915 | DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl); | |
4916 | ||
4917 | /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what | |
48e1416a | 4918 | declaration inspired this copy. */ |
c5235c0b | 4919 | DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl); |
4920 | ||
4921 | /* The new variable/label has no RTL, yet. */ | |
68331616 | 4922 | if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL) |
4923 | && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy)) | |
8e3cb73b | 4924 | SET_DECL_RTL (copy, 0); |
48e1416a | 4925 | |
c5235c0b | 4926 | /* These args would always appear unused, if not for this. */ |
4927 | TREE_USED (copy) = 1; | |
4928 | ||
4929 | /* Set the context for the new declaration. */ | |
4930 | if (!DECL_CONTEXT (decl)) | |
4931 | /* Globals stay global. */ | |
4932 | ; | |
51a48c27 | 4933 | else if (DECL_CONTEXT (decl) != id->src_fn) |
c5235c0b | 4934 | /* Things that weren't in the scope of the function we're inlining |
4935 | from aren't in the scope we're inlining to, either. */ | |
4936 | ; | |
4937 | else if (TREE_STATIC (decl)) | |
4938 | /* Function-scoped static variables should stay in the original | |
4939 | function. */ | |
4940 | ; | |
4941 | else | |
4942 | /* Ordinary automatic local variables are now in the scope of the | |
4943 | new function. */ | |
51a48c27 | 4944 | DECL_CONTEXT (copy) = id->dst_fn; |
c5235c0b | 4945 | |
4946 | return copy; | |
4947 | } | |
4948 | ||
51a48c27 | 4949 | static tree |
4950 | copy_decl_to_var (tree decl, copy_body_data *id) | |
4951 | { | |
4952 | tree copy, type; | |
4953 | ||
4954 | gcc_assert (TREE_CODE (decl) == PARM_DECL | |
4955 | || TREE_CODE (decl) == RESULT_DECL); | |
4956 | ||
4957 | type = TREE_TYPE (decl); | |
4958 | ||
e60a6f7b | 4959 | copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn), |
4960 | VAR_DECL, DECL_NAME (decl), type); | |
1a981e1a | 4961 | if (DECL_PT_UID_SET_P (decl)) |
4962 | SET_DECL_PT_UID (copy, DECL_PT_UID (decl)); | |
51a48c27 | 4963 | TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl); |
4964 | TREE_READONLY (copy) = TREE_READONLY (decl); | |
4965 | TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl); | |
8ea8de24 | 4966 | DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl); |
51a48c27 | 4967 | |
4968 | return copy_decl_for_dup_finish (id, decl, copy); | |
4969 | } | |
4970 | ||
25b3017b | 4971 | /* Like copy_decl_to_var, but create a return slot object instead of a |
4972 | pointer variable for return by invisible reference. */ | |
4973 | ||
4974 | static tree | |
4975 | copy_result_decl_to_var (tree decl, copy_body_data *id) | |
4976 | { | |
4977 | tree copy, type; | |
4978 | ||
4979 | gcc_assert (TREE_CODE (decl) == PARM_DECL | |
4980 | || TREE_CODE (decl) == RESULT_DECL); | |
4981 | ||
4982 | type = TREE_TYPE (decl); | |
4983 | if (DECL_BY_REFERENCE (decl)) | |
4984 | type = TREE_TYPE (type); | |
4985 | ||
e60a6f7b | 4986 | copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn), |
4987 | VAR_DECL, DECL_NAME (decl), type); | |
1a981e1a | 4988 | if (DECL_PT_UID_SET_P (decl)) |
4989 | SET_DECL_PT_UID (copy, DECL_PT_UID (decl)); | |
25b3017b | 4990 | TREE_READONLY (copy) = TREE_READONLY (decl); |
4991 | TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl); | |
4992 | if (!DECL_BY_REFERENCE (decl)) | |
4993 | { | |
4994 | TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl); | |
8ea8de24 | 4995 | DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl); |
25b3017b | 4996 | } |
4997 | ||
4998 | return copy_decl_for_dup_finish (id, decl, copy); | |
4999 | } | |
5000 | ||
32020b10 | 5001 | tree |
51a48c27 | 5002 | copy_decl_no_change (tree decl, copy_body_data *id) |
5003 | { | |
5004 | tree copy; | |
5005 | ||
5006 | copy = copy_node (decl); | |
5007 | ||
5008 | /* The COPY is not abstract; it will be generated in DST_FN. */ | |
5009 | DECL_ABSTRACT (copy) = 0; | |
5010 | lang_hooks.dup_lang_specific_decl (copy); | |
5011 | ||
5012 | /* TREE_ADDRESSABLE isn't used to indicate that a label's address has | |
5013 | been taken; it's for internal bookkeeping in expand_goto_internal. */ | |
5014 | if (TREE_CODE (copy) == LABEL_DECL) | |
5015 | { | |
5016 | TREE_ADDRESSABLE (copy) = 0; | |
5017 | LABEL_DECL_UID (copy) = -1; | |
5018 | } | |
5019 | ||
5020 | return copy_decl_for_dup_finish (id, decl, copy); | |
5021 | } | |
5022 | ||
5023 | static tree | |
5024 | copy_decl_maybe_to_var (tree decl, copy_body_data *id) | |
5025 | { | |
5026 | if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL) | |
5027 | return copy_decl_to_var (decl, id); | |
5028 | else | |
5029 | return copy_decl_no_change (decl, id); | |
5030 | } | |
5031 | ||
c5235c0b | 5032 | /* Return a copy of the function's argument tree. */ |
5033 | static tree | |
5afe38fe | 5034 | copy_arguments_for_versioning (tree orig_parm, copy_body_data * id, |
5035 | bitmap args_to_skip, tree *vars) | |
c5235c0b | 5036 | { |
5afe38fe | 5037 | tree arg, *parg; |
5038 | tree new_parm = NULL; | |
5039 | int i = 0; | |
c5235c0b | 5040 | |
5afe38fe | 5041 | parg = &new_parm; |
5042 | ||
1767a056 | 5043 | for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++) |
5afe38fe | 5044 | if (!args_to_skip || !bitmap_bit_p (args_to_skip, i)) |
5045 | { | |
5046 | tree new_tree = remap_decl (arg, id); | |
03f99d3c | 5047 | if (TREE_CODE (new_tree) != PARM_DECL) |
5048 | new_tree = id->copy_decl (arg, id); | |
5afe38fe | 5049 | lang_hooks.dup_lang_specific_decl (new_tree); |
5050 | *parg = new_tree; | |
1767a056 | 5051 | parg = &DECL_CHAIN (new_tree); |
5afe38fe | 5052 | } |
a8305131 | 5053 | else if (!pointer_map_contains (id->decl_map, arg)) |
5afe38fe | 5054 | { |
5055 | /* Make an equivalent VAR_DECL. If the argument was used | |
5056 | as temporary variable later in function, the uses will be | |
5057 | replaced by local variable. */ | |
5058 | tree var = copy_decl_to_var (arg, id); | |
5afe38fe | 5059 | insert_decl_map (id, arg, var); |
5060 | /* Declare this new variable. */ | |
1767a056 | 5061 | DECL_CHAIN (var) = *vars; |
5afe38fe | 5062 | *vars = var; |
5063 | } | |
5064 | return new_parm; | |
c5235c0b | 5065 | } |
5066 | ||
5067 | /* Return a copy of the function's static chain. */ | |
5068 | static tree | |
51a48c27 | 5069 | copy_static_chain (tree static_chain, copy_body_data * id) |
c5235c0b | 5070 | { |
5071 | tree *chain_copy, *pvar; | |
5072 | ||
5073 | chain_copy = &static_chain; | |
1767a056 | 5074 | for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar)) |
c5235c0b | 5075 | { |
f4e36c33 | 5076 | tree new_tree = remap_decl (*pvar, id); |
5077 | lang_hooks.dup_lang_specific_decl (new_tree); | |
1767a056 | 5078 | DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar); |
f4e36c33 | 5079 | *pvar = new_tree; |
c5235c0b | 5080 | } |
5081 | return static_chain; | |
5082 | } | |
5083 | ||
5084 | /* Return true if the function is allowed to be versioned. | |
5085 | This is a guard for the versioning functionality. */ | |
d747fdfb | 5086 | |
c5235c0b | 5087 | bool |
5088 | tree_versionable_function_p (tree fndecl) | |
5089 | { | |
bdb1f0d1 | 5090 | return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl)) |
5091 | && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL); | |
c5235c0b | 5092 | } |
5093 | ||
ccf4ab6b | 5094 | /* Delete all unreachable basic blocks and update callgraph. |
5095 | Doing so is somewhat nontrivial because we need to update all clones and | |
5096 | remove inline function that become unreachable. */ | |
38150ede | 5097 | |
ccf4ab6b | 5098 | static bool |
5099 | delete_unreachable_blocks_update_callgraph (copy_body_data *id) | |
38150ede | 5100 | { |
ccf4ab6b | 5101 | bool changed = false; |
5102 | basic_block b, next_bb; | |
5103 | ||
5104 | find_unreachable_blocks (); | |
5105 | ||
5106 | /* Delete all unreachable basic blocks. */ | |
5107 | ||
34154e27 | 5108 | for (b = ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb; b |
5109 | != EXIT_BLOCK_PTR_FOR_FN (cfun); b = next_bb) | |
ccf4ab6b | 5110 | { |
5111 | next_bb = b->next_bb; | |
5112 | ||
5113 | if (!(b->flags & BB_REACHABLE)) | |
5114 | { | |
5115 | gimple_stmt_iterator bsi; | |
5116 | ||
5117 | for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi)) | |
4d044066 | 5118 | { |
5119 | struct cgraph_edge *e; | |
5120 | struct cgraph_node *node; | |
ccf4ab6b | 5121 | |
02774f2d | 5122 | ipa_remove_stmt_references (id->dst_node, gsi_stmt (bsi)); |
4d044066 | 5123 | |
5124 | if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL | |
5125 | &&(e = cgraph_edge (id->dst_node, gsi_stmt (bsi))) != NULL) | |
5126 | { | |
5127 | if (!e->inline_failed) | |
5128 | cgraph_remove_node_and_inline_clones (e->callee, id->dst_node); | |
5129 | else | |
5130 | cgraph_remove_edge (e); | |
5131 | } | |
5132 | if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES | |
5133 | && id->dst_node->clones) | |
5134 | for (node = id->dst_node->clones; node != id->dst_node;) | |
ccf4ab6b | 5135 | { |
02774f2d | 5136 | ipa_remove_stmt_references (node, gsi_stmt (bsi)); |
4d044066 | 5137 | if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL |
5138 | && (e = cgraph_edge (node, gsi_stmt (bsi))) != NULL) | |
5139 | { | |
5140 | if (!e->inline_failed) | |
5141 | cgraph_remove_node_and_inline_clones (e->callee, id->dst_node); | |
5142 | else | |
5143 | cgraph_remove_edge (e); | |
5144 | } | |
5145 | ||
5146 | if (node->clones) | |
5147 | node = node->clones; | |
5148 | else if (node->next_sibling_clone) | |
5149 | node = node->next_sibling_clone; | |
ccf4ab6b | 5150 | else |
4d044066 | 5151 | { |
5152 | while (node != id->dst_node && !node->next_sibling_clone) | |
5153 | node = node->clone_of; | |
5154 | if (node != id->dst_node) | |
5155 | node = node->next_sibling_clone; | |
5156 | } | |
ccf4ab6b | 5157 | } |
4d044066 | 5158 | } |
ccf4ab6b | 5159 | delete_basic_block (b); |
5160 | changed = true; | |
5161 | } | |
5162 | } | |
5163 | ||
ccf4ab6b | 5164 | return changed; |
38150ede | 5165 | } |
5166 | ||
e20422ea | 5167 | /* Update clone info after duplication. */ |
5168 | ||
5169 | static void | |
5170 | update_clone_info (copy_body_data * id) | |
5171 | { | |
5172 | struct cgraph_node *node; | |
5173 | if (!id->dst_node->clones) | |
5174 | return; | |
5175 | for (node = id->dst_node->clones; node != id->dst_node;) | |
5176 | { | |
5177 | /* First update replace maps to match the new body. */ | |
5178 | if (node->clone.tree_map) | |
5179 | { | |
5180 | unsigned int i; | |
f1f41a6c | 5181 | for (i = 0; i < vec_safe_length (node->clone.tree_map); i++) |
e20422ea | 5182 | { |
5183 | struct ipa_replace_map *replace_info; | |
f1f41a6c | 5184 | replace_info = (*node->clone.tree_map)[i]; |
e20422ea | 5185 | walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL); |
5186 | walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL); | |
5187 | } | |
5188 | } | |
5189 | if (node->clones) | |
5190 | node = node->clones; | |
5191 | else if (node->next_sibling_clone) | |
5192 | node = node->next_sibling_clone; | |
5193 | else | |
5194 | { | |
5195 | while (node != id->dst_node && !node->next_sibling_clone) | |
5196 | node = node->clone_of; | |
5197 | if (node != id->dst_node) | |
5198 | node = node->next_sibling_clone; | |
5199 | } | |
5200 | } | |
5201 | } | |
5202 | ||
c5235c0b | 5203 | /* Create a copy of a function's tree. |
5204 | OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes | |
5205 | of the original function and the new copied function | |
48e1416a | 5206 | respectively. In case we want to replace a DECL |
5207 | tree with another tree while duplicating the function's | |
5208 | body, TREE_MAP represents the mapping between these | |
469679ab | 5209 | trees. If UPDATE_CLONES is set, the call_stmt fields |
b06ab5fa | 5210 | of edges of clones of the function will be updated. |
5211 | ||
5212 | If non-NULL ARGS_TO_SKIP determine function parameters to remove | |
5213 | from new version. | |
7a3ec978 | 5214 | If SKIP_RETURN is true, the new version will return void. |
b06ab5fa | 5215 | If non-NULL BLOCK_TO_COPY determine what basic blocks to copy. |
5216 | If non_NULL NEW_ENTRY determine new entry BB of the clone. | |
5217 | */ | |
c5235c0b | 5218 | void |
d747fdfb | 5219 | tree_function_versioning (tree old_decl, tree new_decl, |
f1f41a6c | 5220 | vec<ipa_replace_map_p, va_gc> *tree_map, |
b06ab5fa | 5221 | bool update_clones, bitmap args_to_skip, |
7a3ec978 | 5222 | bool skip_return, bitmap blocks_to_copy, |
5223 | basic_block new_entry) | |
c5235c0b | 5224 | { |
5225 | struct cgraph_node *old_version_node; | |
5226 | struct cgraph_node *new_version_node; | |
51a48c27 | 5227 | copy_body_data id; |
deff5ffd | 5228 | tree p; |
c5235c0b | 5229 | unsigned i; |
5230 | struct ipa_replace_map *replace_info; | |
9845d120 | 5231 | basic_block old_entry_block, bb; |
e85cf4e5 | 5232 | stack_vec<gimple, 10> init_stmts; |
13e50f08 | 5233 | tree vars = NULL_TREE; |
c5235c0b | 5234 | |
5235 | gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL | |
5236 | && TREE_CODE (new_decl) == FUNCTION_DECL); | |
5237 | DECL_POSSIBLY_INLINED (old_decl) = 1; | |
5238 | ||
53f79206 | 5239 | old_version_node = cgraph_get_node (old_decl); |
5240 | gcc_checking_assert (old_version_node); | |
5241 | new_version_node = cgraph_get_node (new_decl); | |
5242 | gcc_checking_assert (new_version_node); | |
c5235c0b | 5243 | |
841424cc | 5244 | /* Copy over debug args. */ |
5245 | if (DECL_HAS_DEBUG_ARGS_P (old_decl)) | |
5246 | { | |
f1f41a6c | 5247 | vec<tree, va_gc> **new_debug_args, **old_debug_args; |
841424cc | 5248 | gcc_checking_assert (decl_debug_args_lookup (new_decl) == NULL); |
5249 | DECL_HAS_DEBUG_ARGS_P (new_decl) = 0; | |
5250 | old_debug_args = decl_debug_args_lookup (old_decl); | |
5251 | if (old_debug_args) | |
5252 | { | |
5253 | new_debug_args = decl_debug_args_insert (new_decl); | |
f1f41a6c | 5254 | *new_debug_args = vec_safe_copy (*old_debug_args); |
841424cc | 5255 | } |
5256 | } | |
5257 | ||
3d280f42 | 5258 | /* Output the inlining info for this abstract function, since it has been |
5259 | inlined. If we don't do this now, we can lose the information about the | |
5260 | variables in the function when the blocks get blown away as soon as we | |
5261 | remove the cgraph node. */ | |
5262 | (*debug_hooks->outlining_inline_function) (old_decl); | |
5263 | ||
c5235c0b | 5264 | DECL_ARTIFICIAL (new_decl) = 1; |
5265 | DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl); | |
abb1a237 | 5266 | if (DECL_ORIGIN (old_decl) == old_decl) |
5267 | old_version_node->used_as_abstract_origin = true; | |
58d82cd0 | 5268 | DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl); |
c5235c0b | 5269 | |
b2f42a98 | 5270 | /* Prepare the data structures for the tree copy. */ |
5271 | memset (&id, 0, sizeof (id)); | |
5272 | ||
c5235c0b | 5273 | /* Generate a new name for the new version. */ |
ccf4ab6b | 5274 | id.statements_to_fold = pointer_set_create (); |
9845d120 | 5275 | |
e3022db7 | 5276 | id.decl_map = pointer_map_create (); |
9845d120 | 5277 | id.debug_map = NULL; |
51a48c27 | 5278 | id.src_fn = old_decl; |
5279 | id.dst_fn = new_decl; | |
5280 | id.src_node = old_version_node; | |
5281 | id.dst_node = new_version_node; | |
5282 | id.src_cfun = DECL_STRUCT_FUNCTION (old_decl); | |
da51794e | 5283 | id.blocks_to_copy = blocks_to_copy; |
f1f41a6c | 5284 | if (id.src_node->ipa_transforms_to_apply.exists ()) |
6d1cc52c | 5285 | { |
f1f41a6c | 5286 | vec<ipa_opt_pass> old_transforms_to_apply |
5287 | = id.dst_node->ipa_transforms_to_apply; | |
6d1cc52c | 5288 | unsigned int i; |
5289 | ||
f1f41a6c | 5290 | id.dst_node->ipa_transforms_to_apply |
5291 | = id.src_node->ipa_transforms_to_apply.copy (); | |
5292 | for (i = 0; i < old_transforms_to_apply.length (); i++) | |
5293 | id.dst_node->ipa_transforms_to_apply.safe_push (old_transforms_to_apply[i]); | |
5294 | old_transforms_to_apply.release (); | |
6d1cc52c | 5295 | } |
48e1416a | 5296 | |
51a48c27 | 5297 | id.copy_decl = copy_decl_no_change; |
5298 | id.transform_call_graph_edges | |
5299 | = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE; | |
5300 | id.transform_new_cfg = true; | |
5301 | id.transform_return_to_modify = false; | |
6b99cb5e | 5302 | id.transform_parameter = false; |
32020b10 | 5303 | id.transform_lang_insert_block = NULL; |
51a48c27 | 5304 | |
34154e27 | 5305 | old_entry_block = ENTRY_BLOCK_PTR_FOR_FN |
deff5ffd | 5306 | (DECL_STRUCT_FUNCTION (old_decl)); |
abb1a237 | 5307 | DECL_RESULT (new_decl) = DECL_RESULT (old_decl); |
5308 | DECL_ARGUMENTS (new_decl) = DECL_ARGUMENTS (old_decl); | |
deff5ffd | 5309 | initialize_cfun (new_decl, old_decl, |
e2d3f422 | 5310 | old_entry_block->count); |
3912327b | 5311 | DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta |
5312 | = id.src_cfun->gimple_df->ipa_pta; | |
48e1416a | 5313 | |
c5235c0b | 5314 | /* Copy the function's static chain. */ |
5315 | p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl; | |
5316 | if (p) | |
5317 | DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl = | |
5318 | copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl, | |
5319 | &id); | |
48e1416a | 5320 | |
c5235c0b | 5321 | /* If there's a tree_map, prepare for substitution. */ |
5322 | if (tree_map) | |
f1f41a6c | 5323 | for (i = 0; i < tree_map->length (); i++) |
c5235c0b | 5324 | { |
13e50f08 | 5325 | gimple init; |
f1f41a6c | 5326 | replace_info = (*tree_map)[i]; |
51a48c27 | 5327 | if (replace_info->replace_p) |
b9c94ed7 | 5328 | { |
1bf41320 | 5329 | if (!replace_info->old_tree) |
5330 | { | |
5331 | int i = replace_info->parm_num; | |
5332 | tree parm; | |
09ab6335 | 5333 | tree req_type; |
5334 | ||
1767a056 | 5335 | for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm)) |
1bf41320 | 5336 | i --; |
5337 | replace_info->old_tree = parm; | |
09ab6335 | 5338 | req_type = TREE_TYPE (parm); |
5339 | if (!useless_type_conversion_p (req_type, TREE_TYPE (replace_info->new_tree))) | |
5340 | { | |
5341 | if (fold_convertible_p (req_type, replace_info->new_tree)) | |
5342 | replace_info->new_tree = fold_build1 (NOP_EXPR, req_type, replace_info->new_tree); | |
5343 | else if (TYPE_SIZE (req_type) == TYPE_SIZE (TREE_TYPE (replace_info->new_tree))) | |
5344 | replace_info->new_tree = fold_build1 (VIEW_CONVERT_EXPR, req_type, replace_info->new_tree); | |
5345 | else | |
5346 | { | |
5347 | if (dump_file) | |
5348 | { | |
5349 | fprintf (dump_file, " const "); | |
5350 | print_generic_expr (dump_file, replace_info->new_tree, 0); | |
5351 | fprintf (dump_file, " can't be converted to param "); | |
5352 | print_generic_expr (dump_file, parm, 0); | |
5353 | fprintf (dump_file, "\n"); | |
5354 | } | |
5355 | replace_info->old_tree = NULL; | |
5356 | } | |
5357 | } | |
5358 | } | |
5359 | else | |
5360 | gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL); | |
5361 | if (replace_info->old_tree) | |
5362 | { | |
5363 | init = setup_one_parameter (&id, replace_info->old_tree, | |
5364 | replace_info->new_tree, id.src_fn, | |
5365 | NULL, | |
5366 | &vars); | |
5367 | if (init) | |
5368 | init_stmts.safe_push (init); | |
1bf41320 | 5369 | } |
b9c94ed7 | 5370 | } |
c5235c0b | 5371 | } |
a8305131 | 5372 | /* Copy the function's arguments. */ |
5373 | if (DECL_ARGUMENTS (old_decl) != NULL_TREE) | |
5374 | DECL_ARGUMENTS (new_decl) = | |
5375 | copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id, | |
5376 | args_to_skip, &vars); | |
48e1416a | 5377 | |
a8305131 | 5378 | DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id); |
a6519462 | 5379 | BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl; |
48e1416a | 5380 | |
13e50f08 | 5381 | declare_inline_vars (DECL_INITIAL (new_decl), vars); |
ccf4ab6b | 5382 | |
f1f41a6c | 5383 | if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl)->local_decls)) |
c5235c0b | 5384 | /* Add local vars. */ |
6a1933ed | 5385 | add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id); |
48e1416a | 5386 | |
0c41699c | 5387 | if (DECL_RESULT (old_decl) == NULL_TREE) |
7a3ec978 | 5388 | ; |
0c41699c | 5389 | else if (skip_return && !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl)))) |
7a3ec978 | 5390 | { |
5391 | DECL_RESULT (new_decl) | |
5392 | = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl)), | |
5393 | RESULT_DECL, NULL_TREE, void_type_node); | |
5394 | DECL_CONTEXT (DECL_RESULT (new_decl)) = new_decl; | |
5395 | cfun->returns_struct = 0; | |
5396 | cfun->returns_pcc_struct = 0; | |
5397 | } | |
5398 | else | |
c5235c0b | 5399 | { |
c6ba6fb8 | 5400 | tree old_name; |
5401 | DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id); | |
c5235c0b | 5402 | lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl)); |
c6ba6fb8 | 5403 | if (gimple_in_ssa_p (id.src_cfun) |
5404 | && DECL_BY_REFERENCE (DECL_RESULT (old_decl)) | |
c6dfe037 | 5405 | && (old_name = ssa_default_def (id.src_cfun, DECL_RESULT (old_decl)))) |
c6ba6fb8 | 5406 | { |
5407 | tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL); | |
5408 | insert_decl_map (&id, old_name, new_name); | |
5409 | SSA_NAME_DEF_STMT (new_name) = gimple_build_nop (); | |
c6dfe037 | 5410 | set_ssa_default_def (cfun, DECL_RESULT (new_decl), new_name); |
c6ba6fb8 | 5411 | } |
c5235c0b | 5412 | } |
48e1416a | 5413 | |
f6568ea4 | 5414 | /* Set up the destination function's loop tree. */ |
41f75a99 | 5415 | if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl)) != NULL) |
f6568ea4 | 5416 | { |
5417 | cfun->curr_properties &= ~PROP_loops; | |
5418 | loop_optimizer_init (AVOID_CFG_MODIFICATIONS); | |
5419 | cfun->curr_properties |= PROP_loops; | |
5420 | } | |
5421 | ||
c6ba6fb8 | 5422 | /* Copy the function's body. */ |
5423 | copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE, | |
34154e27 | 5424 | ENTRY_BLOCK_PTR_FOR_FN (cfun), EXIT_BLOCK_PTR_FOR_FN (cfun), |
5425 | new_entry); | |
c6ba6fb8 | 5426 | |
c5235c0b | 5427 | /* Renumber the lexical scoping (non-code) blocks consecutively. */ |
5428 | number_blocks (new_decl); | |
5429 | ||
9845d120 | 5430 | /* We want to create the BB unconditionally, so that the addition of |
5431 | debug stmts doesn't affect BB count, which may in the end cause | |
5432 | codegen differences. */ | |
34154e27 | 5433 | bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun))); |
f1f41a6c | 5434 | while (init_stmts.length ()) |
5435 | insert_init_stmt (&id, bb, init_stmts.pop ()); | |
e20422ea | 5436 | update_clone_info (&id); |
13e50f08 | 5437 | |
d747fdfb | 5438 | /* Remap the nonlocal_goto_save_area, if any. */ |
5439 | if (cfun->nonlocal_goto_save_area) | |
5440 | { | |
5441 | struct walk_stmt_info wi; | |
5442 | ||
5443 | memset (&wi, 0, sizeof (wi)); | |
5444 | wi.info = &id; | |
5445 | walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL); | |
5446 | } | |
5447 | ||
c5235c0b | 5448 | /* Clean up. */ |
e3022db7 | 5449 | pointer_map_destroy (id.decl_map); |
9845d120 | 5450 | if (id.debug_map) |
5451 | pointer_map_destroy (id.debug_map); | |
dd277d48 | 5452 | free_dominance_info (CDI_DOMINATORS); |
5453 | free_dominance_info (CDI_POST_DOMINATORS); | |
ccf4ab6b | 5454 | |
5455 | fold_marked_statements (0, id.statements_to_fold); | |
5456 | pointer_set_destroy (id.statements_to_fold); | |
5457 | fold_cond_expr_cond (); | |
5458 | delete_unreachable_blocks_update_callgraph (&id); | |
02774f2d | 5459 | if (id.dst_node->definition) |
ea7e866e | 5460 | cgraph_rebuild_references (); |
ccf4ab6b | 5461 | update_ssa (TODO_update_ssa); |
555e8b05 | 5462 | |
5463 | /* After partial cloning we need to rescale frequencies, so they are | |
5464 | within proper range in the cloned function. */ | |
5465 | if (new_entry) | |
5466 | { | |
5467 | struct cgraph_edge *e; | |
5468 | rebuild_frequencies (); | |
5469 | ||
34154e27 | 5470 | new_version_node->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count; |
555e8b05 | 5471 | for (e = new_version_node->callees; e; e = e->next_callee) |
5472 | { | |
5473 | basic_block bb = gimple_bb (e->call_stmt); | |
1a036a3b | 5474 | e->frequency = compute_call_stmt_bb_frequency (current_function_decl, |
5475 | bb); | |
5476 | e->count = bb->count; | |
5477 | } | |
5478 | for (e = new_version_node->indirect_calls; e; e = e->next_callee) | |
5479 | { | |
5480 | basic_block bb = gimple_bb (e->call_stmt); | |
5481 | e->frequency = compute_call_stmt_bb_frequency (current_function_decl, | |
5482 | bb); | |
555e8b05 | 5483 | e->count = bb->count; |
5484 | } | |
5485 | } | |
5486 | ||
ccf4ab6b | 5487 | free_dominance_info (CDI_DOMINATORS); |
5488 | free_dominance_info (CDI_POST_DOMINATORS); | |
5489 | ||
f1f41a6c | 5490 | gcc_assert (!id.debug_stmts.exists ()); |
deff5ffd | 5491 | pop_cfun (); |
c5235c0b | 5492 | return; |
5493 | } | |
5494 | ||
4189e677 | 5495 | /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate |
5496 | the callee and return the inlined body on success. */ | |
5497 | ||
5498 | tree | |
5499 | maybe_inline_call_in_expr (tree exp) | |
5500 | { | |
5501 | tree fn = get_callee_fndecl (exp); | |
5502 | ||
5503 | /* We can only try to inline "const" functions. */ | |
5504 | if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn)) | |
5505 | { | |
5506 | struct pointer_map_t *decl_map = pointer_map_create (); | |
5507 | call_expr_arg_iterator iter; | |
5508 | copy_body_data id; | |
5509 | tree param, arg, t; | |
5510 | ||
5511 | /* Remap the parameters. */ | |
5512 | for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter); | |
5513 | param; | |
1767a056 | 5514 | param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter)) |
4189e677 | 5515 | *pointer_map_insert (decl_map, param) = arg; |
5516 | ||
5517 | memset (&id, 0, sizeof (id)); | |
5518 | id.src_fn = fn; | |
5519 | id.dst_fn = current_function_decl; | |
5520 | id.src_cfun = DECL_STRUCT_FUNCTION (fn); | |
5521 | id.decl_map = decl_map; | |
5522 | ||
5523 | id.copy_decl = copy_decl_no_change; | |
5524 | id.transform_call_graph_edges = CB_CGE_DUPLICATE; | |
5525 | id.transform_new_cfg = false; | |
5526 | id.transform_return_to_modify = true; | |
6b99cb5e | 5527 | id.transform_parameter = true; |
839c5aac | 5528 | id.transform_lang_insert_block = NULL; |
4189e677 | 5529 | |
5530 | /* Make sure not to unshare trees behind the front-end's back | |
5531 | since front-end specific mechanisms may rely on sharing. */ | |
5532 | id.regimplify = false; | |
5533 | id.do_not_unshare = true; | |
5534 | ||
5535 | /* We're not inside any EH region. */ | |
e38def9c | 5536 | id.eh_lp_nr = 0; |
4189e677 | 5537 | |
5538 | t = copy_tree_body (&id); | |
5539 | pointer_map_destroy (decl_map); | |
5540 | ||
5541 | /* We can only return something suitable for use in a GENERIC | |
5542 | expression tree. */ | |
5543 | if (TREE_CODE (t) == MODIFY_EXPR) | |
5544 | return TREE_OPERAND (t, 1); | |
5545 | } | |
5546 | ||
5547 | return NULL_TREE; | |
5548 | } | |
5549 | ||
03908818 | 5550 | /* Duplicate a type, fields and all. */ |
5551 | ||
5552 | tree | |
5553 | build_duplicate_type (tree type) | |
5554 | { | |
51a48c27 | 5555 | struct copy_body_data id; |
03908818 | 5556 | |
5557 | memset (&id, 0, sizeof (id)); | |
51a48c27 | 5558 | id.src_fn = current_function_decl; |
5559 | id.dst_fn = current_function_decl; | |
5560 | id.src_cfun = cfun; | |
e3022db7 | 5561 | id.decl_map = pointer_map_create (); |
9845d120 | 5562 | id.debug_map = NULL; |
881eb642 | 5563 | id.copy_decl = copy_decl_no_change; |
03908818 | 5564 | |
5565 | type = remap_type_1 (type, &id); | |
5566 | ||
e3022db7 | 5567 | pointer_map_destroy (id.decl_map); |
9845d120 | 5568 | if (id.debug_map) |
5569 | pointer_map_destroy (id.debug_map); | |
03908818 | 5570 | |
e8e0078c | 5571 | TYPE_CANONICAL (type) = type; |
5572 | ||
03908818 | 5573 | return type; |
5574 | } |