7ee2468b92
gcc/ * system.h (dump_file): Do not define. * tree-pass.h: Include dumpfile.h, which is a new file containing... (enum tree_dump_index, TDF_*, get_dump_file_name, dump_enabled_p, dump_initialized_p, dump_begin, dump_end, dump_node, dump_switch_p, dump_flag_name, dump_file, dump_flags, dump_file_name, get_dump_file_info, struct dump_file_info): all of this, moved to... * dumpfile.h: Here, new file. * tree-dump.h: Include dumpfile.h, but not tree-pass.h. (dump_stmt): Remove prototype for C++ specific function. (dump_enumerated_decls): Move prototype from here... * tree-flow.h (dump_enumerated_decls): ... to here. (get_ref_base_and_extent) Move prototype from here ... * tree.h (get_ref_base_and_extent) ... to here. * tree-ssa-live.c: Do not inclde tree-pretty-print.h, because gimple-pretty-print.h is enough. Do not include tree-dump.h, include timevar.h and dumpfile.h instead. (struct numbered_tree_d, compare_decls_by_uid, dump_enumerated_decls_push, dump_enumerated_decls): Move from here ... * tree-dfa.c:(struct numbered_tree_d, compare_decls_by_uid, dump_enumerated_decls_push, dump_enumerated_decls):... to here. Do not include timevar.h. * tree.c: Do not include timevar.h. * tree-cfg.c: Do not include langhooks.h, tree-pretty-print.h, and timevar.h. (dump_cfg_stats): Use current_function_name. (gimple_cfg2vcg): Likewise. (dump_function_to_file): Likewise. * df-scan.c: Do not include tree-pass.h and timevar.h. Include dumpfile.h. (df_entry_block_bitmap_verify, df_exit_block_bitmap_verify): Do not use print_current_pass. * df-problems.c: Include dumpfile.h. Always define REG_DEAD_DEBUGGING, avoid #ifdef code, because it leads to errors in the code not selected. (df_note_compute): Do not print_rtl_with_bb here. Fix compilation bug if REG_DEAD_DEBUGGING is not 0, get_insns is not available here. * lcm.c: Include dumpfile.h. Remove obsolete include of insn-attr.h. * dojump.c (do_compare_rtx_and_jump): Remove failure printing for missing probability notes. * stmt.c: Include dumpfile.h. (emit_case_decision_tree): Re-enable printing expand details only if TDF_DETAILS. * alias.c, auto-inc-dec.c, bb-reorder.c, caller-save.c, cfg.c, cfgcleanup.c, cfgexpand.c, cfgloop.c, cfgloopmanip.c, cgraph.c, cgraphclones.c, cgraphunit.c, combine.c, combine-stack-adj.c, coverage.c, cprop.c, cse.c, cselib.c, dbgcnt.c, dce.c, df-core.c, dse.c, dwarf2out.c, emit-rtl.c, except.c, expr.c, final.c, function.c, fwprop.c, gcse.c, gimple-fold.c, gimple-pretty-print.c, gimple-ssa-strength-reduction.c, gimplify.c, graphite-blocking.c, graphite-clast-to-gimple.c, graphite-dependences.c, graphite-interchange.c, graphite-optimize-isl.c, graphite-poly.c, graphite-sese-to-poly.c, haifa-sched.c, hw-doloop.c, ifcvt.c, ipa.c, ipa-cp.c, ipa-inline-analysis.c, ipa-inline.c, ipa-inline-transform.c, ipa-prop.c, ipa-pure-const.c, ipa-reference.c, ipa-split.c, ipa-utils.c, ira.c, ira-emit.c, jump.c, loop-doloop.c, loop-init.c, loop-invariant.c, loop-iv.c, loop-unroll.c, loop-unswitch.c, lower-subreg.c, lto-section-out.c, lto-streamer-in.c, matrix-reorg.c, mcf.c, mode-switching.c, modulo-sched.c, omega.c, omp-low.c, passes.c, plugin.c, postreload.c, postreload-gcse.c, predict.c, print-rtl.c, print-tree.c, profile.c, recog.c, ree.c, regcprop.c, reginfo.c, regmove.c, regrename.c, reg-stack.c, reload1.c, reorg.c, sched-rgn.c, sched-vis.c, sel-sched.c, sel-sched-ir.c, store-motion.c, tracer.c, trans-mem.c, tree-affine.c, tree-call-cdce.c, tree-cfgcleanup.c, tree-chrec.c, tree-data-ref.c, tree-diagnostic.c, tree-dump.c, tree-eh.c, tree-flow-inline.h, tree-if-conv.c, tree-into-ssa.c, tree-mudflap.c, tree-nrv.c, tree-object-size.c, tree-optimize.c, tree-outof-ssa.c, tree-predcom.c, tree-pretty-print.c, tree-profile.c, tree-scalar-evolution.c, tree-sra.c, tree-ssa-address.c, tree-ssa-alias.c, tree-ssa.c, tree-ssa-ccp.c, tree-ssa-coalesce.c, tree-ssa-copy.c, tree-ssa-copyrename.c,, tree-ssa-dce.c, tree-ssa-dom.c, tree-ssa-dse.c, tree-ssa-forwprop.c, tree-ssa-ifcombine.c, tree-ssa-loop.c, tree-ssa-loop-ch.c, tree-ssa-loop-im.c, tree-ssa-loop-ivcanon.c, tree-ssa-loop-ivopts.c, tree-ssa-loop-manip.c, tree-ssa-loop-niter.c, tree-ssa-loop-prefetch.c, tree-ssa-loop-unswitch.c, tree-ssa-math-opts.c, tree-ssa-operands.c, tree-ssa-phiopt.c, tree-ssa-phiprop.c, tree-ssa-pre.c, tree-ssa-propagate.c, tree-ssa-reassoc.c, tree-ssa-sccvn.c, tree-ssa-sink.c, tree-ssa-structalias.c, tree-ssa-tail-merge.c, tree-ssa-ter.c, tree-ssa-threadedge.c, tree-ssa-threadupdate.c, tree-ssa-uncprop.c, tree-ssa-uninit.c, tree-switch-conversion.c, tree-tailcall.c, tree-vect-data-refs.c, tree-vect-loop.c, tree-vect-loop-manip.c, tree-vectorizer.c, tree-vect-patterns.c, tree-vect-slp.c, tree-vect-stmts.c, tree-vrp.c, value-prof.c, var-tracking.c, web.c: Include tree-pass.h only if needed. If tree-pass.h is included, do not include timevar.h and dumpfile.h. If tree-pass.h is not included but dump_file, or dump_flags, or the TDF_* flags are used, include dumpfile.h. If gimple-pretty-print.h is included, don't include tree-pretty-print.h. Remove assorted unnecessary includes. * config/mn10300/mn10300.c, config/c6x/c6x.c, config/ia64/ia64.c, config/arm/arm.c, config/bfin/bfin.c, config/frv/frv.c, config/spu/spu.c, config/mep/mep.c, config/i386/i386.c: Include dumpfile.h. * config/rl78/rl78.c: Include dumpfile.h instead of tree-pass.h. * arm/t-arm, avr/t-avr, i386/t-i386, ia64/t-ia64, mep/t-mep, spu/t-spu-elf: Fix dependencies. c-family/ * c-gimplify.c: Include dumpfile.h instead of tree-dump.h. * c-ada-spec.c: Likewise. * c-dump.c (dump_stmt): Move to cp/dump.c, the only user. c/ * c-decl.c: Include dumpfile.h instead of tree-dump.h. * Make-lang.in: Fix dependencies. cp/ * dump.c (dump_stmt): Moved here from c-dump.c. * optimize.c: Include dumpfile.h instead of tree-dump.h. * class.c: Likewise. * decl2.c: Likewise. * Make-lang.in: Fix dependencies. fortran/ * f95-lang.c: Include dumpfile.h instead of tree-dump.h. * Make-lang.in: Fix dependencies. java/ * java-gimplify.c Include dumpfile.h instead of tree-dump.h * Make-lang.in: Fix dependencies. lto/ * lto.c: Do not include timevar.h. * Make-lang.in: Fix dependencies. ada/ * gcc-interface/utils.c: Include timevar.h. * Make-lang.in: Fix dependencies. From-SVN: r189519
871 lines
28 KiB
C
871 lines
28 KiB
C
/* Callgraph clones
|
|
Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010,
|
|
2011, 2012 Free Software Foundation, Inc.
|
|
Contributed by Jan Hubicka
|
|
|
|
This file is part of GCC.
|
|
|
|
GCC is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free
|
|
Software Foundation; either version 3, or (at your option) any later
|
|
version.
|
|
|
|
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GCC; see the file COPYING3. If not see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
/* This module provide facilities for clonning functions. I.e. creating
|
|
new functions based on existing functions with simple modifications,
|
|
such as replacement of parameters.
|
|
|
|
To allow whole program optimization without actual presence of function
|
|
bodies, an additional infrastructure is provided for so-called virtual
|
|
clones
|
|
|
|
A virtual clone in the callgraph is a function that has no
|
|
associated body, just a description of how to create its body based
|
|
on a different function (which itself may be a virtual clone).
|
|
|
|
The description of function modifications includes adjustments to
|
|
the function's signature (which allows, for example, removing or
|
|
adding function arguments), substitutions to perform on the
|
|
function body, and, for inlined functions, a pointer to the
|
|
function that it will be inlined into.
|
|
|
|
It is also possible to redirect any edge of the callgraph from a
|
|
function to its virtual clone. This implies updating of the call
|
|
site to adjust for the new function signature.
|
|
|
|
Most of the transformations performed by inter-procedural
|
|
optimizations can be represented via virtual clones. For
|
|
instance, a constant propagation pass can produce a virtual clone
|
|
of the function which replaces one of its arguments by a
|
|
constant. The inliner can represent its decisions by producing a
|
|
clone of a function whose body will be later integrated into
|
|
a given function.
|
|
|
|
Using virtual clones, the program can be easily updated
|
|
during the Execute stage, solving most of pass interactions
|
|
problems that would otherwise occur during Transform.
|
|
|
|
Virtual clones are later materialized in the LTRANS stage and
|
|
turned into real functions. Passes executed after the virtual
|
|
clone were introduced also perform their Transform stage
|
|
on new functions, so for a pass there is no significant
|
|
difference between operating on a real function or a virtual
|
|
clone introduced before its Execute stage.
|
|
|
|
Optimization passes then work on virtual clones introduced before
|
|
their Execute stage as if they were real functions. The
|
|
only difference is that clones are not visible during the
|
|
Generate Summary stage. */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "tm.h"
|
|
#include "tree.h"
|
|
#include "rtl.h"
|
|
#include "tree-flow.h"
|
|
#include "tree-inline.h"
|
|
#include "langhooks.h"
|
|
#include "pointer-set.h"
|
|
#include "toplev.h"
|
|
#include "flags.h"
|
|
#include "ggc.h"
|
|
#include "debug.h"
|
|
#include "target.h"
|
|
#include "cgraph.h"
|
|
#include "diagnostic.h"
|
|
#include "params.h"
|
|
#include "intl.h"
|
|
#include "function.h"
|
|
#include "ipa-prop.h"
|
|
#include "gimple.h"
|
|
#include "tree-iterator.h"
|
|
#include "tree-dump.h"
|
|
#include "gimple-pretty-print.h"
|
|
#include "coverage.h"
|
|
#include "ipa-inline.h"
|
|
#include "ipa-utils.h"
|
|
#include "lto-streamer.h"
|
|
#include "except.h"
|
|
|
|
/* Create clone of E in the node N represented by CALL_EXPR the callgraph. */
|
|
struct cgraph_edge *
|
|
cgraph_clone_edge (struct cgraph_edge *e, struct cgraph_node *n,
|
|
gimple call_stmt, unsigned stmt_uid, gcov_type count_scale,
|
|
int freq_scale, bool update_original)
|
|
{
|
|
struct cgraph_edge *new_edge;
|
|
gcov_type count = e->count * count_scale / REG_BR_PROB_BASE;
|
|
gcov_type freq;
|
|
|
|
/* We do not want to ignore loop nest after frequency drops to 0. */
|
|
if (!freq_scale)
|
|
freq_scale = 1;
|
|
freq = e->frequency * (gcov_type) freq_scale / CGRAPH_FREQ_BASE;
|
|
if (freq > CGRAPH_FREQ_MAX)
|
|
freq = CGRAPH_FREQ_MAX;
|
|
|
|
if (e->indirect_unknown_callee)
|
|
{
|
|
tree decl;
|
|
|
|
if (call_stmt && (decl = gimple_call_fndecl (call_stmt)))
|
|
{
|
|
struct cgraph_node *callee = cgraph_get_node (decl);
|
|
gcc_checking_assert (callee);
|
|
new_edge = cgraph_create_edge (n, callee, call_stmt, count, freq);
|
|
}
|
|
else
|
|
{
|
|
new_edge = cgraph_create_indirect_edge (n, call_stmt,
|
|
e->indirect_info->ecf_flags,
|
|
count, freq);
|
|
*new_edge->indirect_info = *e->indirect_info;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
new_edge = cgraph_create_edge (n, e->callee, call_stmt, count, freq);
|
|
if (e->indirect_info)
|
|
{
|
|
new_edge->indirect_info
|
|
= ggc_alloc_cleared_cgraph_indirect_call_info ();
|
|
*new_edge->indirect_info = *e->indirect_info;
|
|
}
|
|
}
|
|
|
|
new_edge->inline_failed = e->inline_failed;
|
|
new_edge->indirect_inlining_edge = e->indirect_inlining_edge;
|
|
new_edge->lto_stmt_uid = stmt_uid;
|
|
/* Clone flags that depend on call_stmt availability manually. */
|
|
new_edge->can_throw_external = e->can_throw_external;
|
|
new_edge->call_stmt_cannot_inline_p = e->call_stmt_cannot_inline_p;
|
|
if (update_original)
|
|
{
|
|
e->count -= new_edge->count;
|
|
if (e->count < 0)
|
|
e->count = 0;
|
|
}
|
|
cgraph_call_edge_duplication_hooks (e, new_edge);
|
|
return new_edge;
|
|
}
|
|
|
|
|
|
/* Create node representing clone of N executed COUNT times. Decrease
|
|
the execution counts from original node too.
|
|
The new clone will have decl set to DECL that may or may not be the same
|
|
as decl of N.
|
|
|
|
When UPDATE_ORIGINAL is true, the counts are subtracted from the original
|
|
function's profile to reflect the fact that part of execution is handled
|
|
by node.
|
|
When CALL_DUPLICATOIN_HOOK is true, the ipa passes are acknowledged about
|
|
the new clone. Otherwise the caller is responsible for doing so later. */
|
|
|
|
struct cgraph_node *
|
|
cgraph_clone_node (struct cgraph_node *n, tree decl, gcov_type count, int freq,
|
|
bool update_original,
|
|
VEC(cgraph_edge_p,heap) *redirect_callers,
|
|
bool call_duplication_hook)
|
|
{
|
|
struct cgraph_node *new_node = cgraph_create_empty_node ();
|
|
struct cgraph_edge *e;
|
|
gcov_type count_scale;
|
|
unsigned i;
|
|
|
|
new_node->symbol.decl = decl;
|
|
symtab_register_node ((symtab_node)new_node);
|
|
new_node->origin = n->origin;
|
|
if (new_node->origin)
|
|
{
|
|
new_node->next_nested = new_node->origin->nested;
|
|
new_node->origin->nested = new_node;
|
|
}
|
|
new_node->analyzed = n->analyzed;
|
|
new_node->local = n->local;
|
|
new_node->symbol.externally_visible = false;
|
|
new_node->local.local = true;
|
|
new_node->global = n->global;
|
|
new_node->rtl = n->rtl;
|
|
new_node->count = count;
|
|
new_node->frequency = n->frequency;
|
|
new_node->clone = n->clone;
|
|
new_node->clone.tree_map = 0;
|
|
if (n->count)
|
|
{
|
|
if (new_node->count > n->count)
|
|
count_scale = REG_BR_PROB_BASE;
|
|
else
|
|
count_scale = new_node->count * REG_BR_PROB_BASE / n->count;
|
|
}
|
|
else
|
|
count_scale = 0;
|
|
if (update_original)
|
|
{
|
|
n->count -= count;
|
|
if (n->count < 0)
|
|
n->count = 0;
|
|
}
|
|
|
|
FOR_EACH_VEC_ELT (cgraph_edge_p, redirect_callers, i, e)
|
|
{
|
|
/* Redirect calls to the old version node to point to its new
|
|
version. */
|
|
cgraph_redirect_edge_callee (e, new_node);
|
|
}
|
|
|
|
|
|
for (e = n->callees;e; e=e->next_callee)
|
|
cgraph_clone_edge (e, new_node, e->call_stmt, e->lto_stmt_uid,
|
|
count_scale, freq, update_original);
|
|
|
|
for (e = n->indirect_calls; e; e = e->next_callee)
|
|
cgraph_clone_edge (e, new_node, e->call_stmt, e->lto_stmt_uid,
|
|
count_scale, freq, update_original);
|
|
ipa_clone_references ((symtab_node)new_node, &n->symbol.ref_list);
|
|
|
|
new_node->next_sibling_clone = n->clones;
|
|
if (n->clones)
|
|
n->clones->prev_sibling_clone = new_node;
|
|
n->clones = new_node;
|
|
new_node->clone_of = n;
|
|
|
|
if (call_duplication_hook)
|
|
cgraph_call_node_duplication_hooks (n, new_node);
|
|
return new_node;
|
|
}
|
|
|
|
/* Create a new name for clone of DECL, add SUFFIX. Returns an identifier. */
|
|
|
|
static GTY(()) unsigned int clone_fn_id_num;
|
|
|
|
tree
|
|
clone_function_name (tree decl, const char *suffix)
|
|
{
|
|
tree name = DECL_ASSEMBLER_NAME (decl);
|
|
size_t len = IDENTIFIER_LENGTH (name);
|
|
char *tmp_name, *prefix;
|
|
|
|
prefix = XALLOCAVEC (char, len + strlen (suffix) + 2);
|
|
memcpy (prefix, IDENTIFIER_POINTER (name), len);
|
|
strcpy (prefix + len + 1, suffix);
|
|
#ifndef NO_DOT_IN_LABEL
|
|
prefix[len] = '.';
|
|
#elif !defined NO_DOLLAR_IN_LABEL
|
|
prefix[len] = '$';
|
|
#else
|
|
prefix[len] = '_';
|
|
#endif
|
|
ASM_FORMAT_PRIVATE_NAME (tmp_name, prefix, clone_fn_id_num++);
|
|
return get_identifier (tmp_name);
|
|
}
|
|
|
|
/* Create callgraph node clone with new declaration. The actual body will
|
|
be copied later at compilation stage.
|
|
|
|
TODO: after merging in ipa-sra use function call notes instead of args_to_skip
|
|
bitmap interface.
|
|
*/
|
|
struct cgraph_node *
|
|
cgraph_create_virtual_clone (struct cgraph_node *old_node,
|
|
VEC(cgraph_edge_p,heap) *redirect_callers,
|
|
VEC(ipa_replace_map_p,gc) *tree_map,
|
|
bitmap args_to_skip,
|
|
const char * suffix)
|
|
{
|
|
tree old_decl = old_node->symbol.decl;
|
|
struct cgraph_node *new_node = NULL;
|
|
tree new_decl;
|
|
size_t i;
|
|
struct ipa_replace_map *map;
|
|
|
|
if (!flag_wpa)
|
|
gcc_checking_assert (tree_versionable_function_p (old_decl));
|
|
|
|
gcc_assert (old_node->local.can_change_signature || !args_to_skip);
|
|
|
|
/* Make a new FUNCTION_DECL tree node */
|
|
if (!args_to_skip)
|
|
new_decl = copy_node (old_decl);
|
|
else
|
|
new_decl = build_function_decl_skip_args (old_decl, args_to_skip, false);
|
|
DECL_STRUCT_FUNCTION (new_decl) = NULL;
|
|
|
|
/* Generate a new name for the new version. */
|
|
DECL_NAME (new_decl) = clone_function_name (old_decl, suffix);
|
|
SET_DECL_ASSEMBLER_NAME (new_decl, DECL_NAME (new_decl));
|
|
SET_DECL_RTL (new_decl, NULL);
|
|
|
|
new_node = cgraph_clone_node (old_node, new_decl, old_node->count,
|
|
CGRAPH_FREQ_BASE, false,
|
|
redirect_callers, false);
|
|
/* Update the properties.
|
|
Make clone visible only within this translation unit. Make sure
|
|
that is not weak also.
|
|
??? We cannot use COMDAT linkage because there is no
|
|
ABI support for this. */
|
|
DECL_EXTERNAL (new_node->symbol.decl) = 0;
|
|
if (DECL_ONE_ONLY (old_decl))
|
|
DECL_SECTION_NAME (new_node->symbol.decl) = NULL;
|
|
DECL_COMDAT_GROUP (new_node->symbol.decl) = 0;
|
|
TREE_PUBLIC (new_node->symbol.decl) = 0;
|
|
DECL_COMDAT (new_node->symbol.decl) = 0;
|
|
DECL_WEAK (new_node->symbol.decl) = 0;
|
|
DECL_STATIC_CONSTRUCTOR (new_node->symbol.decl) = 0;
|
|
DECL_STATIC_DESTRUCTOR (new_node->symbol.decl) = 0;
|
|
new_node->clone.tree_map = tree_map;
|
|
new_node->clone.args_to_skip = args_to_skip;
|
|
FOR_EACH_VEC_ELT (ipa_replace_map_p, tree_map, i, map)
|
|
{
|
|
tree var = map->new_tree;
|
|
symtab_node ref_node;
|
|
|
|
STRIP_NOPS (var);
|
|
if (TREE_CODE (var) != ADDR_EXPR)
|
|
continue;
|
|
var = get_base_var (var);
|
|
if (!var)
|
|
continue;
|
|
if (TREE_CODE (var) != FUNCTION_DECL
|
|
&& TREE_CODE (var) != VAR_DECL)
|
|
continue;
|
|
|
|
/* Record references of the future statement initializing the constant
|
|
argument. */
|
|
ref_node = symtab_get_node (var);
|
|
gcc_checking_assert (ref_node);
|
|
ipa_record_reference ((symtab_node)new_node, (symtab_node)ref_node,
|
|
IPA_REF_ADDR, NULL);
|
|
}
|
|
if (!args_to_skip)
|
|
new_node->clone.combined_args_to_skip = old_node->clone.combined_args_to_skip;
|
|
else if (old_node->clone.combined_args_to_skip)
|
|
{
|
|
int newi = 0, oldi = 0;
|
|
tree arg;
|
|
bitmap new_args_to_skip = BITMAP_GGC_ALLOC ();
|
|
struct cgraph_node *orig_node;
|
|
for (orig_node = old_node; orig_node->clone_of; orig_node = orig_node->clone_of)
|
|
;
|
|
for (arg = DECL_ARGUMENTS (orig_node->symbol.decl);
|
|
arg; arg = DECL_CHAIN (arg), oldi++)
|
|
{
|
|
if (bitmap_bit_p (old_node->clone.combined_args_to_skip, oldi))
|
|
{
|
|
bitmap_set_bit (new_args_to_skip, oldi);
|
|
continue;
|
|
}
|
|
if (bitmap_bit_p (args_to_skip, newi))
|
|
bitmap_set_bit (new_args_to_skip, oldi);
|
|
newi++;
|
|
}
|
|
new_node->clone.combined_args_to_skip = new_args_to_skip;
|
|
}
|
|
else
|
|
new_node->clone.combined_args_to_skip = args_to_skip;
|
|
new_node->symbol.externally_visible = 0;
|
|
new_node->local.local = 1;
|
|
new_node->lowered = true;
|
|
|
|
cgraph_call_node_duplication_hooks (old_node, new_node);
|
|
|
|
|
|
return new_node;
|
|
}
|
|
|
|
/* NODE is being removed from symbol table; see if its entry can be replaced by
|
|
other inline clone. */
|
|
struct cgraph_node *
|
|
cgraph_find_replacement_node (struct cgraph_node *node)
|
|
{
|
|
struct cgraph_node *next_inline_clone, *replacement;
|
|
|
|
for (next_inline_clone = node->clones;
|
|
next_inline_clone
|
|
&& next_inline_clone->symbol.decl != node->symbol.decl;
|
|
next_inline_clone = next_inline_clone->next_sibling_clone)
|
|
;
|
|
|
|
/* If there is inline clone of the node being removed, we need
|
|
to put it into the position of removed node and reorganize all
|
|
other clones to be based on it. */
|
|
if (next_inline_clone)
|
|
{
|
|
struct cgraph_node *n;
|
|
struct cgraph_node *new_clones;
|
|
|
|
replacement = next_inline_clone;
|
|
|
|
/* Unlink inline clone from the list of clones of removed node. */
|
|
if (next_inline_clone->next_sibling_clone)
|
|
next_inline_clone->next_sibling_clone->prev_sibling_clone
|
|
= next_inline_clone->prev_sibling_clone;
|
|
if (next_inline_clone->prev_sibling_clone)
|
|
{
|
|
gcc_assert (node->clones != next_inline_clone);
|
|
next_inline_clone->prev_sibling_clone->next_sibling_clone
|
|
= next_inline_clone->next_sibling_clone;
|
|
}
|
|
else
|
|
{
|
|
gcc_assert (node->clones == next_inline_clone);
|
|
node->clones = next_inline_clone->next_sibling_clone;
|
|
}
|
|
|
|
new_clones = node->clones;
|
|
node->clones = NULL;
|
|
|
|
/* Copy clone info. */
|
|
next_inline_clone->clone = node->clone;
|
|
|
|
/* Now place it into clone tree at same level at NODE. */
|
|
next_inline_clone->clone_of = node->clone_of;
|
|
next_inline_clone->prev_sibling_clone = NULL;
|
|
next_inline_clone->next_sibling_clone = NULL;
|
|
if (node->clone_of)
|
|
{
|
|
if (node->clone_of->clones)
|
|
node->clone_of->clones->prev_sibling_clone = next_inline_clone;
|
|
next_inline_clone->next_sibling_clone = node->clone_of->clones;
|
|
node->clone_of->clones = next_inline_clone;
|
|
}
|
|
|
|
/* Merge the clone list. */
|
|
if (new_clones)
|
|
{
|
|
if (!next_inline_clone->clones)
|
|
next_inline_clone->clones = new_clones;
|
|
else
|
|
{
|
|
n = next_inline_clone->clones;
|
|
while (n->next_sibling_clone)
|
|
n = n->next_sibling_clone;
|
|
n->next_sibling_clone = new_clones;
|
|
new_clones->prev_sibling_clone = n;
|
|
}
|
|
}
|
|
|
|
/* Update clone_of pointers. */
|
|
n = new_clones;
|
|
while (n)
|
|
{
|
|
n->clone_of = next_inline_clone;
|
|
n = n->next_sibling_clone;
|
|
}
|
|
return replacement;
|
|
}
|
|
else
|
|
return NULL;
|
|
}
|
|
|
|
/* Like cgraph_set_call_stmt but walk the clone tree and update all
|
|
clones sharing the same function body. */
|
|
|
|
void
|
|
cgraph_set_call_stmt_including_clones (struct cgraph_node *orig,
|
|
gimple old_stmt, gimple new_stmt)
|
|
{
|
|
struct cgraph_node *node;
|
|
struct cgraph_edge *edge = cgraph_edge (orig, old_stmt);
|
|
|
|
if (edge)
|
|
cgraph_set_call_stmt (edge, new_stmt);
|
|
|
|
node = orig->clones;
|
|
if (node)
|
|
while (node != orig)
|
|
{
|
|
struct cgraph_edge *edge = cgraph_edge (node, old_stmt);
|
|
if (edge)
|
|
cgraph_set_call_stmt (edge, new_stmt);
|
|
if (node->clones)
|
|
node = node->clones;
|
|
else if (node->next_sibling_clone)
|
|
node = node->next_sibling_clone;
|
|
else
|
|
{
|
|
while (node != orig && !node->next_sibling_clone)
|
|
node = node->clone_of;
|
|
if (node != orig)
|
|
node = node->next_sibling_clone;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Like cgraph_create_edge walk the clone tree and update all clones sharing
|
|
same function body. If clones already have edge for OLD_STMT; only
|
|
update the edge same way as cgraph_set_call_stmt_including_clones does.
|
|
|
|
TODO: COUNT and LOOP_DEPTH should be properly distributed based on relative
|
|
frequencies of the clones. */
|
|
|
|
void
|
|
cgraph_create_edge_including_clones (struct cgraph_node *orig,
|
|
struct cgraph_node *callee,
|
|
gimple old_stmt,
|
|
gimple stmt, gcov_type count,
|
|
int freq,
|
|
cgraph_inline_failed_t reason)
|
|
{
|
|
struct cgraph_node *node;
|
|
struct cgraph_edge *edge;
|
|
|
|
if (!cgraph_edge (orig, stmt))
|
|
{
|
|
edge = cgraph_create_edge (orig, callee, stmt, count, freq);
|
|
edge->inline_failed = reason;
|
|
}
|
|
|
|
node = orig->clones;
|
|
if (node)
|
|
while (node != orig)
|
|
{
|
|
struct cgraph_edge *edge = cgraph_edge (node, old_stmt);
|
|
|
|
/* It is possible that clones already contain the edge while
|
|
master didn't. Either we promoted indirect call into direct
|
|
call in the clone or we are processing clones of unreachable
|
|
master where edges has been removed. */
|
|
if (edge)
|
|
cgraph_set_call_stmt (edge, stmt);
|
|
else if (!cgraph_edge (node, stmt))
|
|
{
|
|
edge = cgraph_create_edge (node, callee, stmt, count,
|
|
freq);
|
|
edge->inline_failed = reason;
|
|
}
|
|
|
|
if (node->clones)
|
|
node = node->clones;
|
|
else if (node->next_sibling_clone)
|
|
node = node->next_sibling_clone;
|
|
else
|
|
{
|
|
while (node != orig && !node->next_sibling_clone)
|
|
node = node->clone_of;
|
|
if (node != orig)
|
|
node = node->next_sibling_clone;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Remove the node from cgraph and all inline clones inlined into it.
|
|
Skip however removal of FORBIDDEN_NODE and return true if it needs to be
|
|
removed. This allows to call the function from outer loop walking clone
|
|
tree. */
|
|
|
|
bool
|
|
cgraph_remove_node_and_inline_clones (struct cgraph_node *node, struct cgraph_node *forbidden_node)
|
|
{
|
|
struct cgraph_edge *e, *next;
|
|
bool found = false;
|
|
|
|
if (node == forbidden_node)
|
|
return true;
|
|
for (e = node->callees; e; e = next)
|
|
{
|
|
next = e->next_callee;
|
|
if (!e->inline_failed)
|
|
found |= cgraph_remove_node_and_inline_clones (e->callee, forbidden_node);
|
|
}
|
|
cgraph_remove_node (node);
|
|
return found;
|
|
}
|
|
|
|
/* The edges representing the callers of the NEW_VERSION node were
|
|
fixed by cgraph_function_versioning (), now the call_expr in their
|
|
respective tree code should be updated to call the NEW_VERSION. */
|
|
|
|
static void
|
|
update_call_expr (struct cgraph_node *new_version)
|
|
{
|
|
struct cgraph_edge *e;
|
|
|
|
gcc_assert (new_version);
|
|
|
|
/* Update the call expr on the edges to call the new version. */
|
|
for (e = new_version->callers; e; e = e->next_caller)
|
|
{
|
|
struct function *inner_function = DECL_STRUCT_FUNCTION (e->caller->symbol.decl);
|
|
gimple_call_set_fndecl (e->call_stmt, new_version->symbol.decl);
|
|
maybe_clean_eh_stmt_fn (inner_function, e->call_stmt);
|
|
}
|
|
}
|
|
|
|
|
|
/* Create a new cgraph node which is the new version of
|
|
OLD_VERSION node. REDIRECT_CALLERS holds the callers
|
|
edges which should be redirected to point to
|
|
NEW_VERSION. ALL the callees edges of OLD_VERSION
|
|
are cloned to the new version node. Return the new
|
|
version node.
|
|
|
|
If non-NULL BLOCK_TO_COPY determine what basic blocks
|
|
was copied to prevent duplications of calls that are dead
|
|
in the clone. */
|
|
|
|
struct cgraph_node *
|
|
cgraph_copy_node_for_versioning (struct cgraph_node *old_version,
|
|
tree new_decl,
|
|
VEC(cgraph_edge_p,heap) *redirect_callers,
|
|
bitmap bbs_to_copy)
|
|
{
|
|
struct cgraph_node *new_version;
|
|
struct cgraph_edge *e;
|
|
unsigned i;
|
|
|
|
gcc_assert (old_version);
|
|
|
|
new_version = cgraph_create_node (new_decl);
|
|
|
|
new_version->analyzed = old_version->analyzed;
|
|
new_version->local = old_version->local;
|
|
new_version->symbol.externally_visible = false;
|
|
new_version->local.local = old_version->analyzed;
|
|
new_version->global = old_version->global;
|
|
new_version->rtl = old_version->rtl;
|
|
new_version->count = old_version->count;
|
|
|
|
for (e = old_version->callees; e; e=e->next_callee)
|
|
if (!bbs_to_copy
|
|
|| bitmap_bit_p (bbs_to_copy, gimple_bb (e->call_stmt)->index))
|
|
cgraph_clone_edge (e, new_version, e->call_stmt,
|
|
e->lto_stmt_uid, REG_BR_PROB_BASE,
|
|
CGRAPH_FREQ_BASE,
|
|
true);
|
|
for (e = old_version->indirect_calls; e; e=e->next_callee)
|
|
if (!bbs_to_copy
|
|
|| bitmap_bit_p (bbs_to_copy, gimple_bb (e->call_stmt)->index))
|
|
cgraph_clone_edge (e, new_version, e->call_stmt,
|
|
e->lto_stmt_uid, REG_BR_PROB_BASE,
|
|
CGRAPH_FREQ_BASE,
|
|
true);
|
|
FOR_EACH_VEC_ELT (cgraph_edge_p, redirect_callers, i, e)
|
|
{
|
|
/* Redirect calls to the old version node to point to its new
|
|
version. */
|
|
cgraph_redirect_edge_callee (e, new_version);
|
|
}
|
|
|
|
cgraph_call_node_duplication_hooks (old_version, new_version);
|
|
|
|
return new_version;
|
|
}
|
|
|
|
/* Perform function versioning.
|
|
Function versioning includes copying of the tree and
|
|
a callgraph update (creating a new cgraph node and updating
|
|
its callees and callers).
|
|
|
|
REDIRECT_CALLERS varray includes the edges to be redirected
|
|
to the new version.
|
|
|
|
TREE_MAP is a mapping of tree nodes we want to replace with
|
|
new ones (according to results of prior analysis).
|
|
OLD_VERSION_NODE is the node that is versioned.
|
|
|
|
If non-NULL ARGS_TO_SKIP determine function parameters to remove
|
|
from new version.
|
|
If SKIP_RETURN is true, the new version will return void.
|
|
If non-NULL BLOCK_TO_COPY determine what basic blocks to copy.
|
|
If non_NULL NEW_ENTRY determine new entry BB of the clone.
|
|
|
|
Return the new version's cgraph node. */
|
|
|
|
struct cgraph_node *
|
|
cgraph_function_versioning (struct cgraph_node *old_version_node,
|
|
VEC(cgraph_edge_p,heap) *redirect_callers,
|
|
VEC (ipa_replace_map_p,gc)* tree_map,
|
|
bitmap args_to_skip,
|
|
bool skip_return,
|
|
bitmap bbs_to_copy,
|
|
basic_block new_entry_block,
|
|
const char *clone_name)
|
|
{
|
|
tree old_decl = old_version_node->symbol.decl;
|
|
struct cgraph_node *new_version_node = NULL;
|
|
tree new_decl;
|
|
|
|
if (!tree_versionable_function_p (old_decl))
|
|
return NULL;
|
|
|
|
gcc_assert (old_version_node->local.can_change_signature || !args_to_skip);
|
|
|
|
/* Make a new FUNCTION_DECL tree node for the new version. */
|
|
if (!args_to_skip && !skip_return)
|
|
new_decl = copy_node (old_decl);
|
|
else
|
|
new_decl
|
|
= build_function_decl_skip_args (old_decl, args_to_skip, skip_return);
|
|
|
|
/* Generate a new name for the new version. */
|
|
DECL_NAME (new_decl) = clone_function_name (old_decl, clone_name);
|
|
SET_DECL_ASSEMBLER_NAME (new_decl, DECL_NAME (new_decl));
|
|
SET_DECL_RTL (new_decl, NULL);
|
|
|
|
/* When the old decl was a con-/destructor make sure the clone isn't. */
|
|
DECL_STATIC_CONSTRUCTOR(new_decl) = 0;
|
|
DECL_STATIC_DESTRUCTOR(new_decl) = 0;
|
|
|
|
/* Create the new version's call-graph node.
|
|
and update the edges of the new node. */
|
|
new_version_node =
|
|
cgraph_copy_node_for_versioning (old_version_node, new_decl,
|
|
redirect_callers, bbs_to_copy);
|
|
|
|
/* Copy the OLD_VERSION_NODE function tree to the new version. */
|
|
tree_function_versioning (old_decl, new_decl, tree_map, false, args_to_skip,
|
|
skip_return, bbs_to_copy, new_entry_block);
|
|
|
|
/* Update the new version's properties.
|
|
Make The new version visible only within this translation unit. Make sure
|
|
that is not weak also.
|
|
??? We cannot use COMDAT linkage because there is no
|
|
ABI support for this. */
|
|
symtab_make_decl_local (new_version_node->symbol.decl);
|
|
DECL_VIRTUAL_P (new_version_node->symbol.decl) = 0;
|
|
new_version_node->symbol.externally_visible = 0;
|
|
new_version_node->local.local = 1;
|
|
new_version_node->lowered = true;
|
|
|
|
/* Update the call_expr on the edges to call the new version node. */
|
|
update_call_expr (new_version_node);
|
|
|
|
cgraph_call_function_insertion_hooks (new_version_node);
|
|
return new_version_node;
|
|
}
|
|
|
|
/* Given virtual clone, turn it into actual clone. */
|
|
|
|
static void
|
|
cgraph_materialize_clone (struct cgraph_node *node)
|
|
{
|
|
bitmap_obstack_initialize (NULL);
|
|
node->former_clone_of = node->clone_of->symbol.decl;
|
|
if (node->clone_of->former_clone_of)
|
|
node->former_clone_of = node->clone_of->former_clone_of;
|
|
/* Copy the OLD_VERSION_NODE function tree to the new version. */
|
|
tree_function_versioning (node->clone_of->symbol.decl, node->symbol.decl,
|
|
node->clone.tree_map, true,
|
|
node->clone.args_to_skip, false,
|
|
NULL, NULL);
|
|
if (cgraph_dump_file)
|
|
{
|
|
dump_function_to_file (node->clone_of->symbol.decl, cgraph_dump_file, dump_flags);
|
|
dump_function_to_file (node->symbol.decl, cgraph_dump_file, dump_flags);
|
|
}
|
|
|
|
/* Function is no longer clone. */
|
|
if (node->next_sibling_clone)
|
|
node->next_sibling_clone->prev_sibling_clone = node->prev_sibling_clone;
|
|
if (node->prev_sibling_clone)
|
|
node->prev_sibling_clone->next_sibling_clone = node->next_sibling_clone;
|
|
else
|
|
node->clone_of->clones = node->next_sibling_clone;
|
|
node->next_sibling_clone = NULL;
|
|
node->prev_sibling_clone = NULL;
|
|
if (!node->clone_of->analyzed && !node->clone_of->clones)
|
|
{
|
|
cgraph_release_function_body (node->clone_of);
|
|
cgraph_node_remove_callees (node->clone_of);
|
|
ipa_remove_all_references (&node->clone_of->symbol.ref_list);
|
|
}
|
|
node->clone_of = NULL;
|
|
bitmap_obstack_release (NULL);
|
|
}
|
|
|
|
/* Once all functions from compilation unit are in memory, produce all clones
|
|
and update all calls. We might also do this on demand if we don't want to
|
|
bring all functions to memory prior compilation, but current WHOPR
|
|
implementation does that and it is is bit easier to keep everything right in
|
|
this order. */
|
|
|
|
void
|
|
cgraph_materialize_all_clones (void)
|
|
{
|
|
struct cgraph_node *node;
|
|
bool stabilized = false;
|
|
|
|
if (cgraph_dump_file)
|
|
fprintf (cgraph_dump_file, "Materializing clones\n");
|
|
#ifdef ENABLE_CHECKING
|
|
verify_cgraph ();
|
|
#endif
|
|
|
|
/* We can also do topological order, but number of iterations should be
|
|
bounded by number of IPA passes since single IPA pass is probably not
|
|
going to create clones of clones it created itself. */
|
|
while (!stabilized)
|
|
{
|
|
stabilized = true;
|
|
FOR_EACH_FUNCTION (node)
|
|
{
|
|
if (node->clone_of && node->symbol.decl != node->clone_of->symbol.decl
|
|
&& !gimple_has_body_p (node->symbol.decl))
|
|
{
|
|
if (gimple_has_body_p (node->clone_of->symbol.decl))
|
|
{
|
|
if (cgraph_dump_file)
|
|
{
|
|
fprintf (cgraph_dump_file, "cloning %s to %s\n",
|
|
xstrdup (cgraph_node_name (node->clone_of)),
|
|
xstrdup (cgraph_node_name (node)));
|
|
if (node->clone.tree_map)
|
|
{
|
|
unsigned int i;
|
|
fprintf (cgraph_dump_file, " replace map: ");
|
|
for (i = 0; i < VEC_length (ipa_replace_map_p,
|
|
node->clone.tree_map);
|
|
i++)
|
|
{
|
|
struct ipa_replace_map *replace_info;
|
|
replace_info = VEC_index (ipa_replace_map_p,
|
|
node->clone.tree_map,
|
|
i);
|
|
print_generic_expr (cgraph_dump_file, replace_info->old_tree, 0);
|
|
fprintf (cgraph_dump_file, " -> ");
|
|
print_generic_expr (cgraph_dump_file, replace_info->new_tree, 0);
|
|
fprintf (cgraph_dump_file, "%s%s;",
|
|
replace_info->replace_p ? "(replace)":"",
|
|
replace_info->ref_p ? "(ref)":"");
|
|
}
|
|
fprintf (cgraph_dump_file, "\n");
|
|
}
|
|
if (node->clone.args_to_skip)
|
|
{
|
|
fprintf (cgraph_dump_file, " args_to_skip: ");
|
|
dump_bitmap (cgraph_dump_file, node->clone.args_to_skip);
|
|
}
|
|
if (node->clone.args_to_skip)
|
|
{
|
|
fprintf (cgraph_dump_file, " combined_args_to_skip:");
|
|
dump_bitmap (cgraph_dump_file, node->clone.combined_args_to_skip);
|
|
}
|
|
}
|
|
cgraph_materialize_clone (node);
|
|
stabilized = false;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
FOR_EACH_FUNCTION (node)
|
|
if (!node->analyzed && node->callees)
|
|
cgraph_node_remove_callees (node);
|
|
if (cgraph_dump_file)
|
|
fprintf (cgraph_dump_file, "Materialization Call site updates done.\n");
|
|
#ifdef ENABLE_CHECKING
|
|
verify_cgraph ();
|
|
#endif
|
|
symtab_remove_unreachable_nodes (false, cgraph_dump_file);
|
|
}
|
|
|
|
#include "gt-cgraphclones.h"
|