Branch data Line data Source code
1 : : /* Language independent return value optimizations
2 : : Copyright (C) 2004-2024 Free Software Foundation, Inc.
3 : :
4 : : This file is part of GCC.
5 : :
6 : : GCC is free software; you can redistribute it and/or modify
7 : : it under the terms of the GNU General Public License as published by
8 : : the Free Software Foundation; either version 3, or (at your option)
9 : : any later version.
10 : :
11 : : GCC is distributed in the hope that it will be useful,
12 : : but WITHOUT ANY WARRANTY; without even the implied warranty of
13 : : MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 : : GNU General Public License for more details.
15 : :
16 : : You should have received a copy of the GNU General Public License
17 : : along with GCC; see the file COPYING3. If not see
18 : : <http://www.gnu.org/licenses/>. */
19 : :
20 : : #include "config.h"
21 : : #include "system.h"
22 : : #include "coretypes.h"
23 : : #include "backend.h"
24 : : #include "tree.h"
25 : : #include "gimple.h"
26 : : #include "tree-pass.h"
27 : : #include "ssa.h"
28 : : #include "tree-pretty-print.h"
29 : : #include "gimple-iterator.h"
30 : : #include "gimple-walk.h"
31 : : #include "internal-fn.h"
32 : :
33 : : /* This file implements return value optimizations for functions which
34 : : return aggregate types.
35 : :
36 : : Basically this pass searches the function for return statements which
37 : : return a local aggregate. When converted to RTL such statements will
38 : : generate a copy from the local aggregate to final return value destination
39 : : mandated by the target's ABI.
40 : :
41 : : That copy can often be avoided by directly constructing the return value
42 : : into the final destination mandated by the target's ABI.
43 : :
44 : : This is basically a generic equivalent to the C++ front-end's
45 : : Named Return Value optimization. */
46 : :
/* State shared between pass_nrv::execute and the finalize_nrv_r walker
   callback while references to VAR are rewritten to RESULT.  */
struct nrv_data_t
{
  /* This is the temporary (a VAR_DECL) which appears in all of
     this function's RETURN_EXPR statements.  */
  tree var;

  /* This is the function's RESULT_DECL.  We will replace all occurrences
     of VAR with RESULT_DECL when we apply this optimization.  */
  tree result;

  /* Set to 1 by finalize_nrv_r whenever it replaces an occurrence of VAR.
     pass_nrv::execute clears it before walking each statement and tests
     it afterwards to learn whether that statement was changed.  */
  int modified;
};
58 : :
59 : : static tree finalize_nrv_r (tree *, int *, void *);
60 : :
61 : : /* Callback for the tree walker.
62 : :
63 : : If TP refers to a RETURN_EXPR, then set the expression being returned
64 : : to nrv_data->result.
65 : :
66 : : If TP refers to nrv_data->var, then replace nrv_data->var with
67 : : nrv_data->result.
68 : :
69 : : If we reach a node where we know all the subtrees are uninteresting,
70 : : then set *WALK_SUBTREES to zero. */
71 : :
72 : : static tree
73 : 142178 : finalize_nrv_r (tree *tp, int *walk_subtrees, void *data)
74 : : {
75 : 142178 : struct walk_stmt_info *wi = (struct walk_stmt_info *) data;
76 : 142178 : struct nrv_data_t *dp = (struct nrv_data_t *) wi->info;
77 : :
78 : : /* No need to walk into types. */
79 : 142178 : if (TYPE_P (*tp))
80 : 0 : *walk_subtrees = 0;
81 : :
82 : : /* Otherwise replace all occurrences of VAR with RESULT. */
83 : 142178 : else if (*tp == dp->var)
84 : : {
85 : 1746 : *tp = dp->result;
86 : 1746 : dp->modified = 1;
87 : : }
88 : :
89 : : /* Keep iterating. */
90 : 142178 : return NULL_TREE;
91 : : }
92 : :
93 : : /* Main entry point for return value optimizations.
94 : :
95 : : If this function always returns the same local variable, and that
96 : : local variable is an aggregate type, then replace the variable with
97 : : the function's DECL_RESULT.
98 : :
99 : : This is the equivalent of the C++ named return value optimization
100 : : applied to optimized trees in a language independent form. If we
101 : : ever encounter languages which prevent this kind of optimization,
102 : : then we could either have the languages register the optimization or
103 : : we could change the gating function to check the current language. */
104 : :
105 : : namespace {
106 : :
107 : : const pass_data pass_data_nrv =
108 : : {
109 : : GIMPLE_PASS, /* type */
110 : : "nrv", /* name */
111 : : OPTGROUP_NONE, /* optinfo_flags */
112 : : TV_TREE_NRV, /* tv_id */
113 : : ( PROP_ssa | PROP_cfg ), /* properties_required */
114 : : 0, /* properties_provided */
115 : : 0, /* properties_destroyed */
116 : : 0, /* todo_flags_start */
117 : : 0, /* todo_flags_finish */
118 : : };
119 : :
120 : : class pass_nrv : public gimple_opt_pass
121 : : {
122 : : public:
123 : 280114 : pass_nrv (gcc::context *ctxt)
124 : 560228 : : gimple_opt_pass (pass_data_nrv, ctxt)
125 : : {}
126 : :
127 : : /* opt_pass methods: */
128 : 1416251 : bool gate (function *) final override { return optimize > 0; }
129 : :
130 : : unsigned int execute (function *) final override;
131 : :
132 : : }; // class pass_nrv
133 : :
134 : : unsigned int
135 : 998662 : pass_nrv::execute (function *fun)
136 : : {
137 : 998662 : tree result = DECL_RESULT (current_function_decl);
138 : 998662 : tree result_type = TREE_TYPE (result);
139 : 998662 : tree found = NULL;
140 : 998662 : basic_block bb;
141 : 998662 : gimple_stmt_iterator gsi;
142 : 998662 : struct nrv_data_t data;
143 : :
144 : : /* If this function does not return an aggregate type in memory, then
145 : : there is nothing to do. */
146 : 998662 : if (!aggregate_value_p (result, current_function_decl))
147 : : return 0;
148 : :
149 : : /* If a GIMPLE type is returned in memory, finalize_nrv_r might create
150 : : non-GIMPLE. */
151 : 52987 : if (is_gimple_reg_type (result_type))
152 : : return 0;
153 : :
154 : : /* If the front end already did something like this, don't do it here. */
155 : 43336 : if (DECL_NAME (result))
156 : : return 0;
157 : :
158 : : /* If the result has its address taken then it might be modified
159 : : by means not detected in the following loop. Bail out in this
160 : : case. */
161 : 42599 : if (TREE_ADDRESSABLE (result))
162 : : return 0;
163 : :
164 : : /* Look through each block for assignments to the RESULT_DECL. */
165 : 592928 : FOR_EACH_BB_FN (bb, fun)
166 : : {
167 : 3918768 : for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
168 : : {
169 : 2775285 : gimple *stmt = gsi_stmt (gsi);
170 : 2775285 : tree ret_val;
171 : :
172 : 2775285 : if (greturn *return_stmt = dyn_cast <greturn *> (stmt))
173 : : {
174 : : /* In a function with an aggregate return value, the
175 : : gimplifier has changed all non-empty RETURN_EXPRs to
176 : : return the RESULT_DECL. */
177 : 902 : ret_val = gimple_return_retval (return_stmt);
178 : 902 : if (ret_val)
179 : 902 : gcc_assert (ret_val == result);
180 : : }
181 : 2774383 : else if (gimple_has_lhs (stmt)
182 : 1309851 : && gimple_get_lhs (stmt) == result)
183 : : {
184 : 3396 : tree rhs;
185 : :
186 : 3396 : if (!gimple_assign_copy_p (stmt))
187 : : return 0;
188 : :
189 : 2859 : rhs = gimple_assign_rhs1 (stmt);
190 : :
191 : : /* Now verify that this return statement uses the same value
192 : : as any previously encountered return statement. */
193 : 2859 : if (found != NULL)
194 : : {
195 : : /* If we found a return statement using a different variable
196 : : than previous return statements, then we cannot perform
197 : : NRV optimizations. */
198 : 56 : if (found != rhs)
199 : : return 0;
200 : : }
201 : : else
202 : : found = rhs;
203 : :
204 : : /* The returned value must be a local automatic variable of the
205 : : same type and alignment as the function's result. */
206 : 2815 : if (!VAR_P (found)
207 : 2815 : || TREE_THIS_VOLATILE (found)
208 : 2534 : || !auto_var_in_fn_p (found, current_function_decl)
209 : 1658 : || TREE_ADDRESSABLE (found)
210 : 1526 : || DECL_ALIGN (found) > DECL_ALIGN (result)
211 : 3566 : || !useless_type_conversion_p (result_type,
212 : 751 : TREE_TYPE (found)))
213 : 2064 : return 0;
214 : : }
215 : 5742439 : else if (gimple_has_lhs (stmt))
216 : : {
217 : 1206926 : tree addr = get_base_address (gimple_get_lhs (stmt));
218 : : /* If there's any MODIFY of component of RESULT,
219 : : then bail out. */
220 : 1206926 : if (addr && addr == result)
221 : : return 0;
222 : : }
223 : : }
224 : : }
225 : :
226 : 802 : if (!found)
227 : : return 0;
228 : :
229 : : /* If dumping details, then note once and only the NRV replacement. */
230 : 691 : if (dump_file && (dump_flags & TDF_DETAILS))
231 : : {
232 : 0 : fprintf (dump_file, "NRV Replaced: ");
233 : 0 : print_generic_expr (dump_file, found, dump_flags);
234 : 0 : fprintf (dump_file, " with: ");
235 : 0 : print_generic_expr (dump_file, result, dump_flags);
236 : 0 : fprintf (dump_file, "\n");
237 : : }
238 : :
239 : 691 : TREE_ADDRESSABLE (result) |= TREE_ADDRESSABLE (found);
240 : :
241 : : /* Now walk through the function changing all references to VAR to be
242 : : RESULT. */
243 : 691 : data.var = found;
244 : 691 : data.result = result;
245 : 9277 : FOR_EACH_BB_FN (bb, fun)
246 : : {
247 : 57021 : for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
248 : : {
249 : 39849 : gimple *stmt = gsi_stmt (gsi);
250 : : /* If this is a copy from VAR to RESULT, remove it. */
251 : 39849 : if (gimple_assign_copy_p (stmt)
252 : 8813 : && gimple_assign_lhs (stmt) == result
253 : 40552 : && gimple_assign_rhs1 (stmt) == found)
254 : : {
255 : 703 : unlink_stmt_vdef (stmt);
256 : 703 : gsi_remove (&gsi, true);
257 : 703 : release_defs (stmt);
258 : : }
259 : : else
260 : : {
261 : 39146 : struct walk_stmt_info wi;
262 : 39146 : memset (&wi, 0, sizeof (wi));
263 : 39146 : wi.info = &data;
264 : 39146 : data.modified = 0;
265 : 39146 : walk_gimple_op (stmt, finalize_nrv_r, &wi);
266 : 39146 : if (data.modified)
267 : : {
268 : : /* If this is a CLOBBER of VAR, remove it. */
269 : 1746 : if (gimple_clobber_p (stmt))
270 : : {
271 : 688 : unlink_stmt_vdef (stmt);
272 : 688 : gsi_remove (&gsi, true);
273 : 688 : release_defs (stmt);
274 : 688 : continue;
275 : : }
276 : 1058 : update_stmt (stmt);
277 : : }
278 : 38458 : gsi_next (&gsi);
279 : : }
280 : : }
281 : : }
282 : :
283 : 691 : SET_DECL_VALUE_EXPR (found, result);
284 : 691 : DECL_HAS_VALUE_EXPR_P (found) = 1;
285 : :
286 : 691 : return 0;
287 : : }
288 : :
289 : : } // anon namespace
290 : :
291 : : gimple_opt_pass *
292 : 280114 : make_pass_nrv (gcc::context *ctxt)
293 : : {
294 : 280114 : return new pass_nrv (ctxt);
295 : : }
296 : :
297 : : /* Determine (pessimistically) whether DEST is available for NRV
298 : : optimization, where DEST is expected to be the LHS of a modify
299 : : expression where the RHS is a function returning an aggregate.
300 : :
301 : : DEST is available if it is not clobbered or used by the call. */
302 : :
303 : : static bool
304 : 7271 : dest_safe_for_nrv_p (gcall *call)
305 : : {
306 : 7271 : tree dest = gimple_call_lhs (call);
307 : :
308 : 7271 : dest = get_base_address (dest);
309 : 7271 : if (! dest)
310 : : return false;
311 : :
312 : 7271 : if (TREE_CODE (dest) == SSA_NAME)
313 : : return true;
314 : :
315 : 3488 : if (call_may_clobber_ref_p (call, dest, false)
316 : 3488 : || ref_maybe_used_by_stmt_p (call, dest, false))
317 : 722 : return false;
318 : :
319 : : return true;
320 : : }
321 : :
322 : : /* Walk through the function looking for GIMPLE_ASSIGNs with calls that
323 : : return in memory on the RHS. For each of these, determine whether it is
324 : : safe to pass the address of the LHS as the return slot, and mark the
325 : : call appropriately if so.
326 : :
327 : : The NRV shares the return slot with a local variable in the callee; this
328 : : optimization shares the return slot with the target of the call within
329 : : the caller. If the NRV is performed (which we can't know in general),
330 : : this optimization is safe if the address of the target has not
331 : : escaped prior to the call. If it has, modifications to the local
332 : : variable will produce visible changes elsewhere, as in PR c++/19317. */
333 : :
334 : : namespace {
335 : :
336 : : const pass_data pass_data_return_slot =
337 : : {
338 : : GIMPLE_PASS, /* type */
339 : : "retslot", /* name */
340 : : OPTGROUP_NONE, /* optinfo_flags */
341 : : TV_NONE, /* tv_id */
342 : : PROP_ssa, /* properties_required */
343 : : 0, /* properties_provided */
344 : : 0, /* properties_destroyed */
345 : : 0, /* todo_flags_start */
346 : : 0, /* todo_flags_finish */
347 : : };
348 : :
349 : : class pass_return_slot : public gimple_opt_pass
350 : : {
351 : : public:
352 : 280114 : pass_return_slot (gcc::context *ctxt)
353 : 560228 : : gimple_opt_pass (pass_data_return_slot, ctxt)
354 : : {}
355 : :
356 : : /* opt_pass methods: */
357 : : unsigned int execute (function *) final override;
358 : :
359 : : }; // class pass_return_slot
360 : :
361 : : unsigned int
362 : 996079 : pass_return_slot::execute (function *fun)
363 : : {
364 : 996079 : basic_block bb;
365 : :
366 : 11455994 : FOR_EACH_BB_FN (bb, fun)
367 : : {
368 : 10459915 : gimple_stmt_iterator gsi;
369 : 94263789 : for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
370 : : {
371 : 73343959 : gcall *stmt;
372 : 73343959 : bool slot_opt_p;
373 : :
374 : 73343959 : stmt = dyn_cast <gcall *> (gsi_stmt (gsi));
375 : 5364344 : if (stmt
376 : 5364344 : && gimple_call_lhs (stmt)
377 : 1941057 : && !gimple_call_return_slot_opt_p (stmt)
378 : : /* Ignore internal functions, those are expanded specially
379 : : and aggregate_value_p on their result might result in
380 : : undesirable warnings with some backends. */
381 : 1756991 : && !gimple_call_internal_p (stmt)
382 : 1686740 : && aggregate_value_p (TREE_TYPE (gimple_call_lhs (stmt)),
383 : 1686740 : gimple_call_fndecl (stmt)))
384 : : {
385 : : /* Check if the location being assigned to is
386 : : clobbered by the call. */
387 : 7271 : slot_opt_p = dest_safe_for_nrv_p (stmt);
388 : 73351230 : gimple_call_set_return_slot_opt (stmt, slot_opt_p);
389 : : }
390 : : }
391 : : }
392 : 996079 : return 0;
393 : : }
394 : :
395 : : } // anon namespace
396 : :
397 : : gimple_opt_pass *
398 : 280114 : make_pass_return_slot (gcc::context *ctxt)
399 : : {
400 : 280114 : return new pass_return_slot (ctxt);
401 : : }
|