diff options
author | Richard Sandiford <richard.sandiford@arm.com> | 2016-11-21 15:52:09 +0000 |
---|---|---|
committer | Richard Sandiford <rsandifo@gcc.gnu.org> | 2016-11-21 15:52:09 +0000 |
commit | 9713daa015b807a9ffd349f3698cee7acbbaed23 (patch) | |
tree | e99ef73d3ba4d9ddf7188f90a7bc54817d66c427 /gcc/tree-tailcall.c | |
parent | 67b5d0b2fe8cdb72dfc56644e42c28f453cb2f76 (diff) |
Handle sibcalls with aggregate returns
We treated this g as a sibling call to f:
int f (int);
int g (void) { return f (1); }
but not this one:
struct s { int i; };
struct s f (int);
struct s g (void) { return f (1); }
We treated them both as sibcalls on x86 before the first patch for PR36326,
so I suppose this is a regression of sorts from 4.3.
The patch allows function returns to be local aggregate variables as well
as gimple registers.
gcc/
* tree-tailcall.c (process_assignment): Simplify the check for
a valid copy, allowing the source to be a local variable as
well as an SSA name.
(find_tail_calls): Allow copies between local variables to follow
the call. Allow the result to be stored in any local variable,
even if it's an aggregate.
(eliminate_tail_call): Check whether the result is an SSA name
before updating its SSA_NAME_DEF_STMT.
gcc/testsuite/
* gcc.dg/tree-ssa/tailcall-7.c: New test.
From-SVN: r242668
Diffstat (limited to 'gcc/tree-tailcall.c')
-rw-r--r-- | gcc/tree-tailcall.c | 28 |
1 files changed, 17 insertions, 11 deletions
diff --git a/gcc/tree-tailcall.c b/gcc/tree-tailcall.c index 0436f0f04a6..f97541d35a5 100644 --- a/gcc/tree-tailcall.c +++ b/gcc/tree-tailcall.c @@ -269,7 +269,7 @@ process_assignment (gassign *stmt, gimple_stmt_iterator call, tree *m, conversions that can never produce extra code between the function call and the function return. */ if ((rhs_class == GIMPLE_SINGLE_RHS || gimple_assign_cast_p (stmt)) - && (TREE_CODE (src_var) == SSA_NAME)) + && src_var == *ass_var) { /* Reject a tailcall if the type conversion might need additional code. */ @@ -287,9 +287,6 @@ process_assignment (gassign *stmt, gimple_stmt_iterator call, tree *m, return false; } - if (src_var != *ass_var) - return false; - *ass_var = dest; return true; } @@ -428,6 +425,13 @@ find_tail_calls (basic_block bb, struct tailcall **ret) break; } + /* Allow simple copies between local variables, even if they're + aggregates. */ + if (is_gimple_assign (stmt) + && auto_var_in_fn_p (gimple_assign_lhs (stmt), cfun->decl) + && auto_var_in_fn_p (gimple_assign_rhs1 (stmt), cfun->decl)) + continue; + /* If the statement references memory or volatile operands, fail. */ if (gimple_references_memory_p (stmt) || gimple_has_volatile_ops (stmt)) @@ -444,18 +448,20 @@ find_tail_calls (basic_block bb, struct tailcall **ret) return; } - /* If the LHS of our call is not just a simple register, we can't - transform this into a tail or sibling call. This situation happens, - in (e.g.) "*p = foo()" where foo returns a struct. In this case - we won't have a temporary here, but we need to carry out the side - effect anyway, so tailcall is impossible. + /* If the LHS of our call is not just a simple register or local + variable, we can't transform this into a tail or sibling call. + This situation happens, in (e.g.) "*p = foo()" where foo returns a + struct. In this case we won't have a temporary here, but we need + to carry out the side effect anyway, so tailcall is impossible. ??? In some situations (when the struct is returned in memory via invisible argument) we could deal with this, e.g. by passing 'p' itself as that argument to foo, but it's too early to do this here, and expand_call() will not handle it anyway. If it ever can, then we need to revisit this here, to allow that situation. */ - if (ass_var && !is_gimple_reg (ass_var)) + if (ass_var + && !is_gimple_reg (ass_var) + && !auto_var_in_fn_p (ass_var, cfun->decl)) return; /* We found the call, check whether it is suitable. */ @@ -888,7 +894,7 @@ eliminate_tail_call (struct tailcall *t) call = gsi_stmt (t->call_gsi); rslt = gimple_call_lhs (call); - if (rslt != NULL_TREE) + if (rslt != NULL_TREE && TREE_CODE (rslt) == SSA_NAME) { /* Result of the call will no longer be defined. So adjust the SSA_NAME_DEF_STMT accordingly. */ |