IPA ICF, part 4/5
[official-gcc.git] / gcc / tree-nrv.c
blob02a4af9e6818cb8483c51ddfa6fc372d7b3a908e
1 /* Language independent return value optimizations
2 Copyright (C) 2004-2014 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "tree.h"
25 #include "function.h"
26 #include "basic-block.h"
27 #include "tree-pretty-print.h"
28 #include "tree-ssa-alias.h"
29 #include "internal-fn.h"
30 #include "gimple-expr.h"
31 #include "is-a.h"
32 #include "gimple.h"
33 #include "gimple-iterator.h"
34 #include "gimple-walk.h"
35 #include "gimple-ssa.h"
36 #include "stringpool.h"
37 #include "tree-ssanames.h"
38 #include "tree-pass.h"
39 #include "langhooks.h"
#include "flags.h" /* For "optimize" in pass_nrv::gate.
                      FIXME: That should be up to the pass manager,
                      but pass_nrv is not in pass_all_optimizations. */
44 /* This file implements return value optimizations for functions which
45 return aggregate types.
47 Basically this pass searches the function for return statements which
48 return a local aggregate. When converted to RTL such statements will
49 generate a copy from the local aggregate to final return value destination
50 mandated by the target's ABI.
52 That copy can often be avoided by directly constructing the return value
53 into the final destination mandated by the target's ABI.
55 This is basically a generic equivalent to the C++ front-end's
56 Named Return Value optimization. */
58 struct nrv_data_t
60 /* This is the temporary (a VAR_DECL) which appears in all of
61 this function's RETURN_EXPR statements. */
62 tree var;
64 /* This is the function's RESULT_DECL. We will replace all occurrences
65 of VAR with RESULT_DECL when we apply this optimization. */
66 tree result;
67 int modified;
70 static tree finalize_nrv_r (tree *, int *, void *);
72 /* Callback for the tree walker.
74 If TP refers to a RETURN_EXPR, then set the expression being returned
75 to nrv_data->result.
77 If TP refers to nrv_data->var, then replace nrv_data->var with
78 nrv_data->result.
80 If we reach a node where we know all the subtrees are uninteresting,
81 then set *WALK_SUBTREES to zero. */
83 static tree
84 finalize_nrv_r (tree *tp, int *walk_subtrees, void *data)
86 struct walk_stmt_info *wi = (struct walk_stmt_info *) data;
87 struct nrv_data_t *dp = (struct nrv_data_t *) wi->info;
89 /* No need to walk into types. */
90 if (TYPE_P (*tp))
91 *walk_subtrees = 0;
93 /* Otherwise replace all occurrences of VAR with RESULT. */
94 else if (*tp == dp->var)
96 *tp = dp->result;
97 dp->modified = 1;
100 /* Keep iterating. */
101 return NULL_TREE;
104 /* Main entry point for return value optimizations.
106 If this function always returns the same local variable, and that
107 local variable is an aggregate type, then replace the variable with
108 the function's DECL_RESULT.
110 This is the equivalent of the C++ named return value optimization
111 applied to optimized trees in a language independent form. If we
112 ever encounter languages which prevent this kind of optimization,
113 then we could either have the languages register the optimization or
114 we could change the gating function to check the current language. */
116 namespace {
118 const pass_data pass_data_nrv =
120 GIMPLE_PASS, /* type */
121 "nrv", /* name */
122 OPTGROUP_NONE, /* optinfo_flags */
123 TV_TREE_NRV, /* tv_id */
124 ( PROP_ssa | PROP_cfg ), /* properties_required */
125 0, /* properties_provided */
126 0, /* properties_destroyed */
127 0, /* todo_flags_start */
128 0, /* todo_flags_finish */
131 class pass_nrv : public gimple_opt_pass
133 public:
134 pass_nrv (gcc::context *ctxt)
135 : gimple_opt_pass (pass_data_nrv, ctxt)
138 /* opt_pass methods: */
139 virtual bool gate (function *) { return optimize > 0; }
141 virtual unsigned int execute (function *);
143 }; // class pass_nrv
145 unsigned int
146 pass_nrv::execute (function *fun)
148 tree result = DECL_RESULT (current_function_decl);
149 tree result_type = TREE_TYPE (result);
150 tree found = NULL;
151 basic_block bb;
152 gimple_stmt_iterator gsi;
153 struct nrv_data_t data;
155 /* If this function does not return an aggregate type in memory, then
156 there is nothing to do. */
157 if (!aggregate_value_p (result, current_function_decl))
158 return 0;
160 /* If a GIMPLE type is returned in memory, finalize_nrv_r might create
161 non-GIMPLE. */
162 if (is_gimple_reg_type (result_type))
163 return 0;
165 /* If the front end already did something like this, don't do it here. */
166 if (DECL_NAME (result))
167 return 0;
169 /* If the result has its address taken then it might be modified
170 by means not detected in the following loop. Bail out in this
171 case. */
172 if (TREE_ADDRESSABLE (result))
173 return 0;
175 /* Look through each block for assignments to the RESULT_DECL. */
176 FOR_EACH_BB_FN (bb, fun)
178 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
180 gimple stmt = gsi_stmt (gsi);
181 tree ret_val;
183 if (gimple_code (stmt) == GIMPLE_RETURN)
185 /* In a function with an aggregate return value, the
186 gimplifier has changed all non-empty RETURN_EXPRs to
187 return the RESULT_DECL. */
188 ret_val = gimple_return_retval (stmt);
189 if (ret_val)
190 gcc_assert (ret_val == result);
192 else if (gimple_has_lhs (stmt)
193 && gimple_get_lhs (stmt) == result)
195 tree rhs;
197 if (!gimple_assign_copy_p (stmt))
198 return 0;
200 rhs = gimple_assign_rhs1 (stmt);
202 /* Now verify that this return statement uses the same value
203 as any previously encountered return statement. */
204 if (found != NULL)
206 /* If we found a return statement using a different variable
207 than previous return statements, then we can not perform
208 NRV optimizations. */
209 if (found != rhs)
210 return 0;
212 else
213 found = rhs;
215 /* The returned value must be a local automatic variable of the
216 same type and alignment as the function's result. */
217 if (TREE_CODE (found) != VAR_DECL
218 || TREE_THIS_VOLATILE (found)
219 || !auto_var_in_fn_p (found, current_function_decl)
220 || TREE_ADDRESSABLE (found)
221 || DECL_ALIGN (found) > DECL_ALIGN (result)
222 || !useless_type_conversion_p (result_type,
223 TREE_TYPE (found)))
224 return 0;
226 else if (gimple_has_lhs (stmt))
228 tree addr = get_base_address (gimple_get_lhs (stmt));
229 /* If there's any MODIFY of component of RESULT,
230 then bail out. */
231 if (addr && addr == result)
232 return 0;
237 if (!found)
238 return 0;
240 /* If dumping details, then note once and only the NRV replacement. */
241 if (dump_file && (dump_flags & TDF_DETAILS))
243 fprintf (dump_file, "NRV Replaced: ");
244 print_generic_expr (dump_file, found, dump_flags);
245 fprintf (dump_file, " with: ");
246 print_generic_expr (dump_file, result, dump_flags);
247 fprintf (dump_file, "\n");
250 /* At this point we know that all the return statements return the
251 same local which has suitable attributes for NRV. Copy debugging
252 information from FOUND to RESULT if it will be useful. But don't set
253 DECL_ABSTRACT_ORIGIN to point at another function. */
254 if (!DECL_IGNORED_P (found)
255 && !(DECL_ABSTRACT_ORIGIN (found)
256 && DECL_CONTEXT (DECL_ABSTRACT_ORIGIN (found)) != current_function_decl))
258 DECL_NAME (result) = DECL_NAME (found);
259 DECL_SOURCE_LOCATION (result) = DECL_SOURCE_LOCATION (found);
260 DECL_ABSTRACT_ORIGIN (result) = DECL_ABSTRACT_ORIGIN (found);
263 TREE_ADDRESSABLE (result) |= TREE_ADDRESSABLE (found);
265 /* Now walk through the function changing all references to VAR to be
266 RESULT. */
267 data.var = found;
268 data.result = result;
269 FOR_EACH_BB_FN (bb, fun)
271 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
273 gimple stmt = gsi_stmt (gsi);
274 /* If this is a copy from VAR to RESULT, remove it. */
275 if (gimple_assign_copy_p (stmt)
276 && gimple_assign_lhs (stmt) == result
277 && gimple_assign_rhs1 (stmt) == found)
279 unlink_stmt_vdef (stmt);
280 gsi_remove (&gsi, true);
281 release_defs (stmt);
283 else
285 struct walk_stmt_info wi;
286 memset (&wi, 0, sizeof (wi));
287 wi.info = &data;
288 data.modified = 0;
289 walk_gimple_op (stmt, finalize_nrv_r, &wi);
290 if (data.modified)
291 update_stmt (stmt);
292 gsi_next (&gsi);
297 SET_DECL_VALUE_EXPR (found, result);
298 DECL_HAS_VALUE_EXPR_P (found) = 1;
300 return 0;
303 } // anon namespace
305 gimple_opt_pass *
306 make_pass_nrv (gcc::context *ctxt)
308 return new pass_nrv (ctxt);
311 /* Determine (pessimistically) whether DEST is available for NRV
312 optimization, where DEST is expected to be the LHS of a modify
313 expression where the RHS is a function returning an aggregate.
315 DEST is available if it is not clobbered or used by the call. */
317 static bool
318 dest_safe_for_nrv_p (gimple call)
320 tree dest = gimple_call_lhs (call);
322 dest = get_base_address (dest);
323 if (! dest)
324 return false;
326 if (TREE_CODE (dest) == SSA_NAME)
327 return true;
329 if (call_may_clobber_ref_p (call, dest)
330 || ref_maybe_used_by_stmt_p (call, dest))
331 return false;
333 return true;
336 /* Walk through the function looking for GIMPLE_ASSIGNs with calls that
337 return in memory on the RHS. For each of these, determine whether it is
338 safe to pass the address of the LHS as the return slot, and mark the
339 call appropriately if so.
341 The NRV shares the return slot with a local variable in the callee; this
342 optimization shares the return slot with the target of the call within
343 the caller. If the NRV is performed (which we can't know in general),
344 this optimization is safe if the address of the target has not
345 escaped prior to the call. If it has, modifications to the local
346 variable will produce visible changes elsewhere, as in PR c++/19317. */
348 namespace {
350 const pass_data pass_data_return_slot =
352 GIMPLE_PASS, /* type */
353 "retslot", /* name */
354 OPTGROUP_NONE, /* optinfo_flags */
355 TV_NONE, /* tv_id */
356 PROP_ssa, /* properties_required */
357 0, /* properties_provided */
358 0, /* properties_destroyed */
359 0, /* todo_flags_start */
360 0, /* todo_flags_finish */
363 class pass_return_slot : public gimple_opt_pass
365 public:
366 pass_return_slot (gcc::context *ctxt)
367 : gimple_opt_pass (pass_data_return_slot, ctxt)
370 /* opt_pass methods: */
371 virtual unsigned int execute (function *);
373 }; // class pass_return_slot
375 unsigned int
376 pass_return_slot::execute (function *fun)
378 basic_block bb;
380 FOR_EACH_BB_FN (bb, fun)
382 gimple_stmt_iterator gsi;
383 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
385 gimple stmt = gsi_stmt (gsi);
386 bool slot_opt_p;
388 if (is_gimple_call (stmt)
389 && gimple_call_lhs (stmt)
390 && !gimple_call_return_slot_opt_p (stmt)
391 && aggregate_value_p (TREE_TYPE (gimple_call_lhs (stmt)),
392 gimple_call_fndecl (stmt)))
394 /* Check if the location being assigned to is
395 clobbered by the call. */
396 slot_opt_p = dest_safe_for_nrv_p (stmt);
397 gimple_call_set_return_slot_opt (stmt, slot_opt_p);
401 return 0;
404 } // anon namespace
406 gimple_opt_pass *
407 make_pass_return_slot (gcc::context *ctxt)
409 return new pass_return_slot (ctxt);