170082880f
From-SVN: r96250
2543 lines
68 KiB
C
2543 lines
68 KiB
C
/* Convert a program in SSA form into Normal form.
   Copyright (C) 2004, 2005 Free Software Foundation, Inc.
   Contributed by Andrew Macleod <amacleod@redhat.com>

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2, or (at your option)
any later version.

GCC is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING.  If not, write to
the Free Software Foundation, 59 Temple Place - Suite 330,
Boston, MA 02111-1307, USA.  */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "tm.h"
|
|
#include "tree.h"
|
|
#include "flags.h"
|
|
#include "rtl.h"
|
|
#include "tm_p.h"
|
|
#include "ggc.h"
|
|
#include "langhooks.h"
|
|
#include "hard-reg-set.h"
|
|
#include "basic-block.h"
|
|
#include "output.h"
|
|
#include "errors.h"
|
|
#include "expr.h"
|
|
#include "function.h"
|
|
#include "diagnostic.h"
|
|
#include "bitmap.h"
|
|
#include "tree-flow.h"
|
|
#include "tree-gimple.h"
|
|
#include "tree-inline.h"
|
|
#include "varray.h"
|
|
#include "timevar.h"
|
|
#include "hashtab.h"
|
|
#include "tree-dump.h"
|
|
#include "tree-ssa-live.h"
|
|
#include "tree-pass.h"
|
|
|
|
/* Option bits accepted by remove_ssa_form.  Each flag occupies its own bit,
   so they can be combined with bitwise OR and tested with bitwise AND.  */

#define SSANORM_PERFORM_TER             0x1
#define SSANORM_COMBINE_TEMPS           0x2
#define SSANORM_COALESCE_PARTITIONS     0x4
|
|
|
|
/* Used to hold all the components required to do SSA PHI elimination.
|
|
The node and pred/succ list is a simple linear list of nodes and
|
|
edges represented as pairs of nodes.
|
|
|
|
The predecessor and successor list: Nodes are entered in pairs, where
|
|
[0] ->PRED, [1]->SUCC. All the even indexes in the array represent
|
|
predecessors, all the odd elements are successors.
|
|
|
|
Rationale:
|
|
When implemented as bitmaps, very large programs SSA->Normal times were
|
|
being dominated by clearing the interference graph.
|
|
|
|
Typically this list of edges is extremely small since it only includes
|
|
PHI results and uses from a single edge which have not coalesced with
|
|
each other. This means that no virtual PHI nodes are included, and
|
|
empirical evidence suggests that the number of edges rarely exceed
|
|
3, and in a bootstrap of GCC, the maximum size encountered was 7.
|
|
This also limits the number of possible nodes that are involved to
|
|
rarely more than 6, and in the bootstrap of gcc, the maximum number
|
|
of nodes encountered was 12. */
|
|
|
|
typedef struct _elim_graph {
|
|
/* Size of the elimination vectors. */
|
|
int size;
|
|
|
|
/* List of nodes in the elimination graph. */
|
|
varray_type nodes;
|
|
|
|
/* The predecessor and successor edge list. */
|
|
varray_type edge_list;
|
|
|
|
/* Visited vector. */
|
|
sbitmap visited;
|
|
|
|
/* Stack for visited nodes. */
|
|
varray_type stack;
|
|
|
|
/* The variable partition map. */
|
|
var_map map;
|
|
|
|
/* Edge being eliminated by this graph. */
|
|
edge e;
|
|
|
|
/* List of constant copies to emit. These are pushed on in pairs. */
|
|
varray_type const_copies;
|
|
} *elim_graph;
|
|
|
|
|
|
/* Local functions. */
|
|
static tree create_temp (tree);
|
|
static void insert_copy_on_edge (edge, tree, tree);
|
|
static elim_graph new_elim_graph (int);
|
|
static inline void delete_elim_graph (elim_graph);
|
|
static inline void clear_elim_graph (elim_graph);
|
|
static inline int elim_graph_size (elim_graph);
|
|
static inline void elim_graph_add_node (elim_graph, tree);
|
|
static inline void elim_graph_add_edge (elim_graph, int, int);
|
|
static inline int elim_graph_remove_succ_edge (elim_graph, int);
|
|
|
|
static inline void eliminate_name (elim_graph, tree);
|
|
static void eliminate_build (elim_graph, basic_block);
|
|
static void elim_forward (elim_graph, int);
|
|
static int elim_unvisited_predecessor (elim_graph, int);
|
|
static void elim_backward (elim_graph, int);
|
|
static void elim_create (elim_graph, int);
|
|
static void eliminate_phi (edge, elim_graph);
|
|
static tree_live_info_p coalesce_ssa_name (var_map, int);
|
|
static void assign_vars (var_map);
|
|
static bool replace_use_variable (var_map, use_operand_p, tree *);
|
|
static bool replace_def_variable (var_map, def_operand_p, tree *);
|
|
static void eliminate_virtual_phis (void);
|
|
static void coalesce_abnormal_edges (var_map, conflict_graph, root_var_p);
|
|
static void print_exprs (FILE *, const char *, tree, const char *, tree,
|
|
const char *);
|
|
static void print_exprs_edge (FILE *, edge, const char *, tree, const char *,
|
|
tree);
|
|
|
|
|
|
/* Create a temporary variable based on the type of variable T. Use T's name
|
|
as the prefix. */
|
|
|
|
static tree
|
|
create_temp (tree t)
|
|
{
|
|
tree tmp;
|
|
const char *name = NULL;
|
|
tree type;
|
|
|
|
if (TREE_CODE (t) == SSA_NAME)
|
|
t = SSA_NAME_VAR (t);
|
|
|
|
gcc_assert (TREE_CODE (t) == VAR_DECL || TREE_CODE (t) == PARM_DECL);
|
|
|
|
type = TREE_TYPE (t);
|
|
tmp = DECL_NAME (t);
|
|
if (tmp)
|
|
name = IDENTIFIER_POINTER (tmp);
|
|
|
|
if (name == NULL)
|
|
name = "temp";
|
|
tmp = create_tmp_var (type, name);
|
|
|
|
if (DECL_DEBUG_EXPR (t) && DECL_DEBUG_EXPR_IS_FROM (t))
|
|
{
|
|
DECL_DEBUG_EXPR (tmp) = DECL_DEBUG_EXPR (t);
|
|
DECL_DEBUG_EXPR_IS_FROM (tmp) = 1;
|
|
}
|
|
else if (!DECL_IGNORED_P (t))
|
|
{
|
|
DECL_DEBUG_EXPR (tmp) = t;
|
|
DECL_DEBUG_EXPR_IS_FROM (tmp) = 1;
|
|
}
|
|
DECL_ARTIFICIAL (tmp) = DECL_ARTIFICIAL (t);
|
|
DECL_IGNORED_P (tmp) = DECL_IGNORED_P (t);
|
|
add_referenced_tmp_var (tmp);
|
|
|
|
/* add_referenced_tmp_var will create the annotation and set up some
|
|
of the flags in the annotation. However, some flags we need to
|
|
inherit from our original variable. */
|
|
var_ann (tmp)->type_mem_tag = var_ann (t)->type_mem_tag;
|
|
if (is_call_clobbered (t))
|
|
mark_call_clobbered (tmp);
|
|
|
|
return tmp;
|
|
}
|
|
|
|
|
|
/* This helper function fill insert a copy from a constant or variable SRC to
|
|
variable DEST on edge E. */
|
|
|
|
static void
|
|
insert_copy_on_edge (edge e, tree dest, tree src)
|
|
{
|
|
tree copy;
|
|
|
|
copy = build (MODIFY_EXPR, TREE_TYPE (dest), dest, src);
|
|
set_is_used (dest);
|
|
|
|
if (TREE_CODE (src) == ADDR_EXPR)
|
|
src = TREE_OPERAND (src, 0);
|
|
if (TREE_CODE (src) == VAR_DECL || TREE_CODE (src) == PARM_DECL)
|
|
set_is_used (src);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file,
|
|
"Inserting a copy on edge BB%d->BB%d :",
|
|
e->src->index,
|
|
e->dest->index);
|
|
print_generic_expr (dump_file, copy, dump_flags);
|
|
fprintf (dump_file, "\n");
|
|
}
|
|
|
|
bsi_insert_on_edge (e, copy);
|
|
}
|
|
|
|
|
|
/* Create an elimination graph with SIZE nodes and associated data
|
|
structures. */
|
|
|
|
static elim_graph
|
|
new_elim_graph (int size)
|
|
{
|
|
elim_graph g = (elim_graph) xmalloc (sizeof (struct _elim_graph));
|
|
|
|
VARRAY_TREE_INIT (g->nodes, 30, "Elimination Node List");
|
|
VARRAY_TREE_INIT (g->const_copies, 20, "Elimination Constant Copies");
|
|
VARRAY_INT_INIT (g->edge_list, 20, "Elimination Edge List");
|
|
VARRAY_INT_INIT (g->stack, 30, " Elimination Stack");
|
|
|
|
g->visited = sbitmap_alloc (size);
|
|
|
|
return g;
|
|
}
|
|
|
|
|
|
/* Empty elimination graph G. */
|
|
|
|
static inline void
|
|
clear_elim_graph (elim_graph g)
|
|
{
|
|
VARRAY_POP_ALL (g->nodes);
|
|
VARRAY_POP_ALL (g->edge_list);
|
|
}
|
|
|
|
|
|
/* Delete elimination graph G. */
|
|
|
|
static inline void
|
|
delete_elim_graph (elim_graph g)
|
|
{
|
|
sbitmap_free (g->visited);
|
|
free (g);
|
|
}
|
|
|
|
|
|
/* Return the number of nodes in graph G. */
|
|
|
|
static inline int
|
|
elim_graph_size (elim_graph g)
|
|
{
|
|
return VARRAY_ACTIVE_SIZE (g->nodes);
|
|
}
|
|
|
|
|
|
/* Add NODE to graph G, if it doesn't exist already. */
|
|
|
|
static inline void
|
|
elim_graph_add_node (elim_graph g, tree node)
|
|
{
|
|
int x;
|
|
for (x = 0; x < elim_graph_size (g); x++)
|
|
if (VARRAY_TREE (g->nodes, x) == node)
|
|
return;
|
|
VARRAY_PUSH_TREE (g->nodes, node);
|
|
}
|
|
|
|
|
|
/* Add the edge PRED->SUCC to graph G. */
|
|
|
|
static inline void
|
|
elim_graph_add_edge (elim_graph g, int pred, int succ)
|
|
{
|
|
VARRAY_PUSH_INT (g->edge_list, pred);
|
|
VARRAY_PUSH_INT (g->edge_list, succ);
|
|
}
|
|
|
|
|
|
/* Remove an edge from graph G for which NODE is the predecessor, and
|
|
return the successor node. -1 is returned if there is no such edge. */
|
|
|
|
static inline int
|
|
elim_graph_remove_succ_edge (elim_graph g, int node)
|
|
{
|
|
int y;
|
|
unsigned x;
|
|
for (x = 0; x < VARRAY_ACTIVE_SIZE (g->edge_list); x += 2)
|
|
if (VARRAY_INT (g->edge_list, x) == node)
|
|
{
|
|
VARRAY_INT (g->edge_list, x) = -1;
|
|
y = VARRAY_INT (g->edge_list, x + 1);
|
|
VARRAY_INT (g->edge_list, x + 1) = -1;
|
|
return y;
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
|
|
/* Walk the edge list of GRAPH and, for every edge whose predecessor is
   NODE, store the successor (a partition number) in VAR and execute the
   code fragment CODE.  CODE runs inside the body of a `for' loop.  */

#define FOR_EACH_ELIM_GRAPH_SUCC(GRAPH, NODE, VAR, CODE)                \
do {                                                                    \
  unsigned x_;                                                          \
  int y_;                                                               \
  for (x_ = 0; x_ < VARRAY_ACTIVE_SIZE ((GRAPH)->edge_list); x_ += 2)   \
    {                                                                   \
      y_ = VARRAY_INT ((GRAPH)->edge_list, x_);                         \
      if (y_ == (NODE))                                                 \
        {                                                               \
          (VAR) = VARRAY_INT ((GRAPH)->edge_list, x_ + 1);              \
          CODE;                                                         \
        }                                                               \
    }                                                                   \
} while (0)
|
|
|
|
|
|
/* Walk the edge list of GRAPH and, for every edge whose successor is NODE,
   store the predecessor (a partition number) in VAR and execute the code
   fragment CODE.  CODE runs inside the body of a `for' loop.  */

#define FOR_EACH_ELIM_GRAPH_PRED(GRAPH, NODE, VAR, CODE)                \
do {                                                                    \
  unsigned x_;                                                          \
  int y_;                                                               \
  for (x_ = 0; x_ < VARRAY_ACTIVE_SIZE ((GRAPH)->edge_list); x_ += 2)   \
    {                                                                   \
      y_ = VARRAY_INT ((GRAPH)->edge_list, x_ + 1);                     \
      if (y_ == (NODE))                                                 \
        {                                                               \
          (VAR) = VARRAY_INT ((GRAPH)->edge_list, x_);                  \
          CODE;                                                         \
        }                                                               \
    }                                                                   \
} while (0)
|
|
|
|
|
|
/* Add T to elimination graph G. */
|
|
|
|
static inline void
|
|
eliminate_name (elim_graph g, tree T)
|
|
{
|
|
elim_graph_add_node (g, T);
|
|
}
|
|
|
|
|
|
/* Build elimination graph G for basic block BB on incoming PHI edge
|
|
G->e. */
|
|
|
|
static void
|
|
eliminate_build (elim_graph g, basic_block B)
|
|
{
|
|
tree phi;
|
|
tree T0, Ti;
|
|
int p0, pi;
|
|
|
|
clear_elim_graph (g);
|
|
|
|
for (phi = phi_nodes (B); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
T0 = var_to_partition_to_var (g->map, PHI_RESULT (phi));
|
|
|
|
/* Ignore results which are not in partitions. */
|
|
if (T0 == NULL_TREE)
|
|
continue;
|
|
|
|
Ti = PHI_ARG_DEF (phi, g->e->dest_idx);
|
|
|
|
/* If this argument is a constant, or a SSA_NAME which is being
|
|
left in SSA form, just queue a copy to be emitted on this
|
|
edge. */
|
|
if (!phi_ssa_name_p (Ti)
|
|
|| (TREE_CODE (Ti) == SSA_NAME
|
|
&& var_to_partition (g->map, Ti) == NO_PARTITION))
|
|
{
|
|
/* Save constant copies until all other copies have been emitted
|
|
on this edge. */
|
|
VARRAY_PUSH_TREE (g->const_copies, T0);
|
|
VARRAY_PUSH_TREE (g->const_copies, Ti);
|
|
}
|
|
else
|
|
{
|
|
Ti = var_to_partition_to_var (g->map, Ti);
|
|
if (T0 != Ti)
|
|
{
|
|
eliminate_name (g, T0);
|
|
eliminate_name (g, Ti);
|
|
p0 = var_to_partition (g->map, T0);
|
|
pi = var_to_partition (g->map, Ti);
|
|
elim_graph_add_edge (g, p0, pi);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/* Push successors of T onto the elimination stack for G. */
|
|
|
|
static void
|
|
elim_forward (elim_graph g, int T)
|
|
{
|
|
int S;
|
|
SET_BIT (g->visited, T);
|
|
FOR_EACH_ELIM_GRAPH_SUCC (g, T, S,
|
|
{
|
|
if (!TEST_BIT (g->visited, S))
|
|
elim_forward (g, S);
|
|
});
|
|
VARRAY_PUSH_INT (g->stack, T);
|
|
}
|
|
|
|
|
|
/* Return 1 if there unvisited predecessors of T in graph G. */
|
|
|
|
static int
|
|
elim_unvisited_predecessor (elim_graph g, int T)
|
|
{
|
|
int P;
|
|
FOR_EACH_ELIM_GRAPH_PRED (g, T, P,
|
|
{
|
|
if (!TEST_BIT (g->visited, P))
|
|
return 1;
|
|
});
|
|
return 0;
|
|
}
|
|
|
|
/* Process predecessors first, and insert a copy. */
|
|
|
|
static void
|
|
elim_backward (elim_graph g, int T)
|
|
{
|
|
int P;
|
|
SET_BIT (g->visited, T);
|
|
FOR_EACH_ELIM_GRAPH_PRED (g, T, P,
|
|
{
|
|
if (!TEST_BIT (g->visited, P))
|
|
{
|
|
elim_backward (g, P);
|
|
insert_copy_on_edge (g->e,
|
|
partition_to_var (g->map, P),
|
|
partition_to_var (g->map, T));
|
|
}
|
|
});
|
|
}
|
|
|
|
/* Insert required copies for T in graph G. Check for a strongly connected
|
|
region, and create a temporary to break the cycle if one is found. */
|
|
|
|
static void
|
|
elim_create (elim_graph g, int T)
|
|
{
|
|
tree U;
|
|
int P, S;
|
|
|
|
if (elim_unvisited_predecessor (g, T))
|
|
{
|
|
U = create_temp (partition_to_var (g->map, T));
|
|
insert_copy_on_edge (g->e, U, partition_to_var (g->map, T));
|
|
FOR_EACH_ELIM_GRAPH_PRED (g, T, P,
|
|
{
|
|
if (!TEST_BIT (g->visited, P))
|
|
{
|
|
elim_backward (g, P);
|
|
insert_copy_on_edge (g->e, partition_to_var (g->map, P), U);
|
|
}
|
|
});
|
|
}
|
|
else
|
|
{
|
|
S = elim_graph_remove_succ_edge (g, T);
|
|
if (S != -1)
|
|
{
|
|
SET_BIT (g->visited, T);
|
|
insert_copy_on_edge (g->e,
|
|
partition_to_var (g->map, T),
|
|
partition_to_var (g->map, S));
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
/* Eliminate all the phi nodes on edge E in graph G. */
|
|
|
|
static void
|
|
eliminate_phi (edge e, elim_graph g)
|
|
{
|
|
int x;
|
|
basic_block B = e->dest;
|
|
|
|
gcc_assert (VARRAY_ACTIVE_SIZE (g->const_copies) == 0);
|
|
|
|
/* Abnormal edges already have everything coalesced, or the coalescer
|
|
would have aborted. */
|
|
if (e->flags & EDGE_ABNORMAL)
|
|
return;
|
|
|
|
g->e = e;
|
|
|
|
eliminate_build (g, B);
|
|
|
|
if (elim_graph_size (g) != 0)
|
|
{
|
|
sbitmap_zero (g->visited);
|
|
VARRAY_POP_ALL (g->stack);
|
|
|
|
for (x = 0; x < elim_graph_size (g); x++)
|
|
{
|
|
tree var = VARRAY_TREE (g->nodes, x);
|
|
int p = var_to_partition (g->map, var);
|
|
if (!TEST_BIT (g->visited, p))
|
|
elim_forward (g, p);
|
|
}
|
|
|
|
sbitmap_zero (g->visited);
|
|
while (VARRAY_ACTIVE_SIZE (g->stack) > 0)
|
|
{
|
|
x = VARRAY_TOP_INT (g->stack);
|
|
VARRAY_POP (g->stack);
|
|
if (!TEST_BIT (g->visited, x))
|
|
elim_create (g, x);
|
|
}
|
|
}
|
|
|
|
/* If there are any pending constant copies, issue them now. */
|
|
while (VARRAY_ACTIVE_SIZE (g->const_copies) > 0)
|
|
{
|
|
tree src, dest;
|
|
src = VARRAY_TOP_TREE (g->const_copies);
|
|
VARRAY_POP (g->const_copies);
|
|
dest = VARRAY_TOP_TREE (g->const_copies);
|
|
VARRAY_POP (g->const_copies);
|
|
insert_copy_on_edge (e, dest, src);
|
|
}
|
|
}
|
|
|
|
|
|
/* Shortcut routine to print messages to file F of the form:
|
|
"STR1 EXPR1 STR2 EXPR2 STR3." */
|
|
|
|
static void
|
|
print_exprs (FILE *f, const char *str1, tree expr1, const char *str2,
|
|
tree expr2, const char *str3)
|
|
{
|
|
fprintf (f, "%s", str1);
|
|
print_generic_expr (f, expr1, TDF_SLIM);
|
|
fprintf (f, "%s", str2);
|
|
print_generic_expr (f, expr2, TDF_SLIM);
|
|
fprintf (f, "%s", str3);
|
|
}
|
|
|
|
|
|
/* Shortcut routine to print abnormal edge messages to file F of the form:
|
|
"STR1 EXPR1 STR2 EXPR2 across edge E. */
|
|
|
|
static void
|
|
print_exprs_edge (FILE *f, edge e, const char *str1, tree expr1,
|
|
const char *str2, tree expr2)
|
|
{
|
|
print_exprs (f, str1, expr1, str2, expr2, " across an abnormal edge");
|
|
fprintf (f, " from BB%d->BB%d\n", e->src->index,
|
|
e->dest->index);
|
|
}
|
|
|
|
|
|
/* Coalesce partitions in MAP which are live across abnormal edges in GRAPH.
|
|
RV is the root variable groupings of the partitions in MAP. Since code
|
|
cannot be inserted on these edges, failure to coalesce something across
|
|
an abnormal edge is an error. */
|
|
|
|
static void
|
|
coalesce_abnormal_edges (var_map map, conflict_graph graph, root_var_p rv)
|
|
{
|
|
basic_block bb;
|
|
edge e;
|
|
tree phi, var, tmp;
|
|
int x, y, z;
|
|
edge_iterator ei;
|
|
|
|
/* Code cannot be inserted on abnormal edges. Look for all abnormal
|
|
edges, and coalesce any PHI results with their arguments across
|
|
that edge. */
|
|
|
|
FOR_EACH_BB (bb)
|
|
FOR_EACH_EDGE (e, ei, bb->succs)
|
|
if (e->dest != EXIT_BLOCK_PTR && e->flags & EDGE_ABNORMAL)
|
|
for (phi = phi_nodes (e->dest); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
/* Visit each PHI on the destination side of this abnormal
|
|
edge, and attempt to coalesce the argument with the result. */
|
|
var = PHI_RESULT (phi);
|
|
x = var_to_partition (map, var);
|
|
|
|
/* Ignore results which are not relevant. */
|
|
if (x == NO_PARTITION)
|
|
continue;
|
|
|
|
tmp = PHI_ARG_DEF (phi, e->dest_idx);
|
|
#ifdef ENABLE_CHECKING
|
|
if (!phi_ssa_name_p (tmp))
|
|
{
|
|
print_exprs_edge (stderr, e,
|
|
"\nConstant argument in PHI. Can't insert :",
|
|
var, " = ", tmp);
|
|
internal_error ("SSA corruption");
|
|
}
|
|
#else
|
|
gcc_assert (phi_ssa_name_p (tmp));
|
|
#endif
|
|
y = var_to_partition (map, tmp);
|
|
gcc_assert (x != NO_PARTITION);
|
|
gcc_assert (y != NO_PARTITION);
|
|
#ifdef ENABLE_CHECKING
|
|
if (root_var_find (rv, x) != root_var_find (rv, y))
|
|
{
|
|
print_exprs_edge (stderr, e, "\nDifferent root vars: ",
|
|
root_var (rv, root_var_find (rv, x)),
|
|
" and ",
|
|
root_var (rv, root_var_find (rv, y)));
|
|
internal_error ("SSA corruption");
|
|
}
|
|
#else
|
|
gcc_assert (root_var_find (rv, x) == root_var_find (rv, y));
|
|
#endif
|
|
|
|
if (x != y)
|
|
{
|
|
#ifdef ENABLE_CHECKING
|
|
if (conflict_graph_conflict_p (graph, x, y))
|
|
{
|
|
print_exprs_edge (stderr, e, "\n Conflict ",
|
|
partition_to_var (map, x),
|
|
" and ", partition_to_var (map, y));
|
|
internal_error ("SSA corruption");
|
|
}
|
|
#else
|
|
gcc_assert (!conflict_graph_conflict_p (graph, x, y));
|
|
#endif
|
|
|
|
/* Now map the partitions back to their real variables. */
|
|
var = partition_to_var (map, x);
|
|
tmp = partition_to_var (map, y);
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
print_exprs_edge (dump_file, e,
|
|
"ABNORMAL: Coalescing ",
|
|
var, " and ", tmp);
|
|
}
|
|
z = var_union (map, var, tmp);
|
|
#ifdef ENABLE_CHECKING
|
|
if (z == NO_PARTITION)
|
|
{
|
|
print_exprs_edge (stderr, e, "\nUnable to coalesce",
|
|
partition_to_var (map, x), " and ",
|
|
partition_to_var (map, y));
|
|
internal_error ("SSA corruption");
|
|
}
|
|
#else
|
|
gcc_assert (z != NO_PARTITION);
|
|
#endif
|
|
gcc_assert (z == x || z == y);
|
|
if (z == x)
|
|
conflict_graph_merge_regs (graph, x, y);
|
|
else
|
|
conflict_graph_merge_regs (graph, y, x);
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/* Reduce the number of live ranges in MAP. Live range information is
|
|
returned if FLAGS indicates that we are combining temporaries, otherwise
|
|
NULL is returned. The only partitions which are associated with actual
|
|
variables at this point are those which are forced to be coalesced for
|
|
various reason. (live on entry, live across abnormal edges, etc.). */
|
|
|
|
static tree_live_info_p
|
|
coalesce_ssa_name (var_map map, int flags)
|
|
{
|
|
unsigned num, x, i;
|
|
sbitmap live;
|
|
tree var, phi;
|
|
root_var_p rv;
|
|
tree_live_info_p liveinfo;
|
|
var_ann_t ann;
|
|
conflict_graph graph;
|
|
basic_block bb;
|
|
coalesce_list_p cl = NULL;
|
|
|
|
if (num_var_partitions (map) <= 1)
|
|
return NULL;
|
|
|
|
liveinfo = calculate_live_on_entry (map);
|
|
calculate_live_on_exit (liveinfo);
|
|
rv = root_var_init (map);
|
|
|
|
/* Remove single element variable from the list. */
|
|
root_var_compact (rv);
|
|
|
|
cl = create_coalesce_list (map);
|
|
|
|
/* Add all potential copies via PHI arguments to the list. */
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
tree res = PHI_RESULT (phi);
|
|
int p = var_to_partition (map, res);
|
|
if (p == NO_PARTITION)
|
|
continue;
|
|
for (x = 0; x < (unsigned)PHI_NUM_ARGS (phi); x++)
|
|
{
|
|
tree arg = PHI_ARG_DEF (phi, x);
|
|
int p2;
|
|
|
|
if (TREE_CODE (arg) != SSA_NAME)
|
|
continue;
|
|
if (SSA_NAME_VAR (res) != SSA_NAME_VAR (arg))
|
|
continue;
|
|
p2 = var_to_partition (map, PHI_ARG_DEF (phi, x));
|
|
if (p2 != NO_PARTITION)
|
|
add_coalesce (cl, p, p2, 1);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Coalesce all the result decls together. */
|
|
var = NULL_TREE;
|
|
i = 0;
|
|
for (x = 0; x < num_var_partitions (map); x++)
|
|
{
|
|
tree p = partition_to_var (map, x);
|
|
if (TREE_CODE (SSA_NAME_VAR(p)) == RESULT_DECL)
|
|
{
|
|
if (var == NULL_TREE)
|
|
{
|
|
var = p;
|
|
i = x;
|
|
}
|
|
else
|
|
add_coalesce (cl, i, x, 1);
|
|
}
|
|
}
|
|
|
|
/* Build a conflict graph. */
|
|
graph = build_tree_conflict_graph (liveinfo, rv, cl);
|
|
|
|
if (cl)
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "Before sorting:\n");
|
|
dump_coalesce_list (dump_file, cl);
|
|
}
|
|
|
|
sort_coalesce_list (cl);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "\nAfter sorting:\n");
|
|
dump_coalesce_list (dump_file, cl);
|
|
}
|
|
}
|
|
|
|
/* Put the single element variables back in. */
|
|
root_var_decompact (rv);
|
|
|
|
/* First, coalesce all live on entry variables to their root variable.
|
|
This will ensure the first use is coming from the correct location. */
|
|
|
|
live = sbitmap_alloc (num_var_partitions (map));
|
|
sbitmap_zero (live);
|
|
|
|
/* Set 'live' vector to indicate live on entry partitions. */
|
|
num = num_var_partitions (map);
|
|
for (x = 0 ; x < num; x++)
|
|
{
|
|
var = partition_to_var (map, x);
|
|
if (default_def (SSA_NAME_VAR (var)) == var)
|
|
SET_BIT (live, x);
|
|
}
|
|
|
|
if ((flags & SSANORM_COMBINE_TEMPS) == 0)
|
|
{
|
|
delete_tree_live_info (liveinfo);
|
|
liveinfo = NULL;
|
|
}
|
|
|
|
/* Assign root variable as partition representative for each live on entry
|
|
partition. */
|
|
EXECUTE_IF_SET_IN_SBITMAP (live, 0, x,
|
|
{
|
|
var = root_var (rv, root_var_find (rv, x));
|
|
ann = var_ann (var);
|
|
/* If these aren't already coalesced... */
|
|
if (partition_to_var (map, x) != var)
|
|
{
|
|
/* This root variable should have not already been assigned
|
|
to another partition which is not coalesced with this one. */
|
|
gcc_assert (!ann->out_of_ssa_tag);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
print_exprs (dump_file, "Must coalesce ",
|
|
partition_to_var (map, x),
|
|
" with the root variable ", var, ".\n");
|
|
}
|
|
|
|
change_partition_var (map, var, x);
|
|
}
|
|
});
|
|
|
|
sbitmap_free (live);
|
|
|
|
/* Coalesce partitions live across abnormal edges. */
|
|
coalesce_abnormal_edges (map, graph, rv);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
dump_var_map (dump_file, map);
|
|
|
|
/* Coalesce partitions. */
|
|
coalesce_tpa_members (rv, graph, map, cl,
|
|
((dump_flags & TDF_DETAILS) ? dump_file
|
|
: NULL));
|
|
|
|
if (flags & SSANORM_COALESCE_PARTITIONS)
|
|
coalesce_tpa_members (rv, graph, map, NULL,
|
|
((dump_flags & TDF_DETAILS) ? dump_file
|
|
: NULL));
|
|
if (cl)
|
|
delete_coalesce_list (cl);
|
|
root_var_delete (rv);
|
|
conflict_graph_delete (graph);
|
|
|
|
return liveinfo;
|
|
}
|
|
|
|
|
|
/* Take the ssa-name var_map MAP, and assign real variables to each
|
|
partition. */
|
|
|
|
static void
|
|
assign_vars (var_map map)
|
|
{
|
|
int x, i, num, rep;
|
|
tree t, var;
|
|
var_ann_t ann;
|
|
root_var_p rv;
|
|
|
|
rv = root_var_init (map);
|
|
if (!rv)
|
|
return;
|
|
|
|
/* Coalescing may already have forced some partitions to their root
|
|
variable. Find these and tag them. */
|
|
|
|
num = num_var_partitions (map);
|
|
for (x = 0; x < num; x++)
|
|
{
|
|
var = partition_to_var (map, x);
|
|
if (TREE_CODE (var) != SSA_NAME)
|
|
{
|
|
/* Coalescing will already have verified that more than one
|
|
partition doesn't have the same root variable. Simply marked
|
|
the variable as assigned. */
|
|
ann = var_ann (var);
|
|
ann->out_of_ssa_tag = 1;
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "partition %d has variable ", x);
|
|
print_generic_expr (dump_file, var, TDF_SLIM);
|
|
fprintf (dump_file, " assigned to it.\n");
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
num = root_var_num (rv);
|
|
for (x = 0; x < num; x++)
|
|
{
|
|
var = root_var (rv, x);
|
|
ann = var_ann (var);
|
|
for (i = root_var_first_partition (rv, x);
|
|
i != ROOT_VAR_NONE;
|
|
i = root_var_next_partition (rv, i))
|
|
{
|
|
t = partition_to_var (map, i);
|
|
|
|
if (t == var || TREE_CODE (t) != SSA_NAME)
|
|
continue;
|
|
|
|
rep = var_to_partition (map, t);
|
|
|
|
if (!ann->out_of_ssa_tag)
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
print_exprs (dump_file, "", t, " --> ", var, "\n");
|
|
change_partition_var (map, var, rep);
|
|
continue;
|
|
}
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
print_exprs (dump_file, "", t, " not coalesced with ", var,
|
|
"");
|
|
|
|
var = create_temp (t);
|
|
change_partition_var (map, var, rep);
|
|
ann = var_ann (var);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, " --> New temp: '");
|
|
print_generic_expr (dump_file, var, TDF_SLIM);
|
|
fprintf (dump_file, "'\n");
|
|
}
|
|
}
|
|
}
|
|
|
|
root_var_delete (rv);
|
|
}
|
|
|
|
|
|
/* Replace use operand P with whatever variable it has been rewritten to based
|
|
on the partitions in MAP. EXPR is an optional expression vector over SSA
|
|
versions which is used to replace P with an expression instead of a variable.
|
|
If the stmt is changed, return true. */
|
|
|
|
static inline bool
|
|
replace_use_variable (var_map map, use_operand_p p, tree *expr)
|
|
{
|
|
tree new_var;
|
|
tree var = USE_FROM_PTR (p);
|
|
|
|
/* Check if we are replacing this variable with an expression. */
|
|
if (expr)
|
|
{
|
|
int version = SSA_NAME_VERSION (var);
|
|
if (expr[version])
|
|
{
|
|
tree new_expr = TREE_OPERAND (expr[version], 1);
|
|
SET_USE (p, new_expr);
|
|
/* Clear the stmt's RHS, or GC might bite us. */
|
|
TREE_OPERAND (expr[version], 1) = NULL_TREE;
|
|
return true;
|
|
}
|
|
}
|
|
|
|
new_var = var_to_partition_to_var (map, var);
|
|
if (new_var)
|
|
{
|
|
SET_USE (p, new_var);
|
|
set_is_used (new_var);
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
|
|
/* Replace def operand DEF_P with whatever variable it has been rewritten to
|
|
based on the partitions in MAP. EXPR is an optional expression vector over
|
|
SSA versions which is used to replace DEF_P with an expression instead of a
|
|
variable. If the stmt is changed, return true. */
|
|
|
|
static inline bool
|
|
replace_def_variable (var_map map, def_operand_p def_p, tree *expr)
|
|
{
|
|
tree new_var;
|
|
tree var = DEF_FROM_PTR (def_p);
|
|
|
|
/* Check if we are replacing this variable with an expression. */
|
|
if (expr)
|
|
{
|
|
int version = SSA_NAME_VERSION (var);
|
|
if (expr[version])
|
|
{
|
|
tree new_expr = TREE_OPERAND (expr[version], 1);
|
|
SET_DEF (def_p, new_expr);
|
|
/* Clear the stmt's RHS, or GC might bite us. */
|
|
TREE_OPERAND (expr[version], 1) = NULL_TREE;
|
|
return true;
|
|
}
|
|
}
|
|
|
|
new_var = var_to_partition_to_var (map, var);
|
|
if (new_var)
|
|
{
|
|
SET_DEF (def_p, new_var);
|
|
set_is_used (new_var);
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
|
|
/* Remove any PHI node which is a virtual PHI. */
|
|
|
|
static void
|
|
eliminate_virtual_phis (void)
|
|
{
|
|
basic_block bb;
|
|
tree phi, next;
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
for (phi = phi_nodes (bb); phi; phi = next)
|
|
{
|
|
next = PHI_CHAIN (phi);
|
|
if (!is_gimple_reg (SSA_NAME_VAR (PHI_RESULT (phi))))
|
|
{
|
|
#ifdef ENABLE_CHECKING
|
|
int i;
|
|
/* There should be no arguments of this PHI which are in
|
|
the partition list, or we get incorrect results. */
|
|
for (i = 0; i < PHI_NUM_ARGS (phi); i++)
|
|
{
|
|
tree arg = PHI_ARG_DEF (phi, i);
|
|
if (TREE_CODE (arg) == SSA_NAME
|
|
&& is_gimple_reg (SSA_NAME_VAR (arg)))
|
|
{
|
|
fprintf (stderr, "Argument of PHI is not virtual (");
|
|
print_generic_expr (stderr, arg, TDF_SLIM);
|
|
fprintf (stderr, "), but the result is :");
|
|
print_generic_stmt (stderr, phi, TDF_SLIM);
|
|
internal_error ("SSA corruption");
|
|
}
|
|
}
|
|
#endif
|
|
remove_phi_node (phi, NULL_TREE);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/* This routine will coalesce variables in MAP of the same type which do not
|
|
interfere with each other. LIVEINFO is the live range info for variables
|
|
of interest. This will both reduce the memory footprint of the stack, and
|
|
allow us to coalesce together local copies of globals and scalarized
|
|
component refs. */
|
|
|
|
static void
|
|
coalesce_vars (var_map map, tree_live_info_p liveinfo)
|
|
{
|
|
basic_block bb;
|
|
type_var_p tv;
|
|
tree var;
|
|
unsigned x, p, p2;
|
|
coalesce_list_p cl;
|
|
conflict_graph graph;
|
|
|
|
cl = create_coalesce_list (map);
|
|
|
|
/* Merge all the live on entry vectors for coalesced partitions. */
|
|
for (x = 0; x < num_var_partitions (map); x++)
|
|
{
|
|
var = partition_to_var (map, x);
|
|
p = var_to_partition (map, var);
|
|
if (p != x)
|
|
live_merge_and_clear (liveinfo, p, x);
|
|
}
|
|
|
|
/* When PHI nodes are turned into copies, the result of each PHI node
|
|
becomes live on entry to the block. Mark these now. */
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
tree phi, arg;
|
|
unsigned p;
|
|
|
|
for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
p = var_to_partition (map, PHI_RESULT (phi));
|
|
|
|
/* Skip virtual PHI nodes. */
|
|
if (p == (unsigned)NO_PARTITION)
|
|
continue;
|
|
|
|
make_live_on_entry (liveinfo, bb, p);
|
|
|
|
/* Each argument is a potential copy operation. Add any arguments
|
|
which are not coalesced to the result to the coalesce list. */
|
|
for (x = 0; x < (unsigned)PHI_NUM_ARGS (phi); x++)
|
|
{
|
|
arg = PHI_ARG_DEF (phi, x);
|
|
if (!phi_ssa_name_p (arg))
|
|
continue;
|
|
p2 = var_to_partition (map, arg);
|
|
if (p2 == (unsigned)NO_PARTITION)
|
|
continue;
|
|
if (p != p2)
|
|
add_coalesce (cl, p, p2, 1);
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/* Re-calculate live on exit info. */
|
|
calculate_live_on_exit (liveinfo);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "Live range info for variable memory coalescing.\n");
|
|
dump_live_info (dump_file, liveinfo, LIVEDUMP_ALL);
|
|
|
|
fprintf (dump_file, "Coalesce list from phi nodes:\n");
|
|
dump_coalesce_list (dump_file, cl);
|
|
}
|
|
|
|
|
|
tv = type_var_init (map);
|
|
if (dump_file)
|
|
type_var_dump (dump_file, tv);
|
|
type_var_compact (tv);
|
|
if (dump_file)
|
|
type_var_dump (dump_file, tv);
|
|
|
|
graph = build_tree_conflict_graph (liveinfo, tv, cl);
|
|
|
|
type_var_decompact (tv);
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "type var list now looks like:n");
|
|
type_var_dump (dump_file, tv);
|
|
|
|
fprintf (dump_file, "Coalesce list after conflict graph build:\n");
|
|
dump_coalesce_list (dump_file, cl);
|
|
}
|
|
|
|
sort_coalesce_list (cl);
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "Coalesce list after sorting:\n");
|
|
dump_coalesce_list (dump_file, cl);
|
|
}
|
|
|
|
coalesce_tpa_members (tv, graph, map, cl,
|
|
((dump_flags & TDF_DETAILS) ? dump_file : NULL));
|
|
|
|
type_var_delete (tv);
|
|
delete_coalesce_list (cl);
|
|
}
|
|
|
|
|
|
/* Temporary Expression Replacement (TER)

   Replace SSA version variables during out-of-ssa with their defining
   expression if there is only one use of the variable.

   A pass is made through the function, one block at a time.  No cross block
   information is tracked.

   Variables which only have one use, and whose defining stmt is considered
   a replaceable expression (see check_replaceable) are entered into
   consideration by adding a list of dependent partitions to the version_info
   vector for that ssa_name_version.  This information comes from the partition
   mapping for each USE.  At the same time, the partition_dep_list vector for
   these partitions has this version number entered into its lists.

   When the use of a replaceable ssa_variable is encountered, the dependence
   list in version_info[] is moved to the "pending_dependence" list in case
   the current expression is also replaceable.  (To be determined later in
   processing this stmt.)  version_info[] for the version is then updated to
   point to the defining stmt and the 'replaceable' bit is set.

   Any partition which is defined by a statement 'kills' any expression which
   is dependent on this partition.  Every ssa version in the partition's
   dependence list is removed from future consideration.

   All virtual references are lumped together.  Any expression which is
   dependent on any virtual variable (via a VUSE) has a dependence added
   to the special partition defined by VIRTUAL_PARTITION.

   Whenever a V_MAY_DEF is seen, all expressions dependent on this
   VIRTUAL_PARTITION are removed from consideration.

   At the end of a basic block, all expressions are removed from consideration
   in preparation for the next block.

   The end result is a vector over SSA_NAME_VERSION which is passed back to
   rewrite_out_of_ssa.  As the SSA variables are being rewritten, instead of
   replacing the SSA_NAME tree element with the partition it was assigned,
   it is replaced with the RHS of the defining expression.  */
|
|
|
|
|
|
/* One element of a singly linked dependency list.  Depending on which list
   the element is on, VALUE is either a partition index or an SSA version
   number.  */

typedef struct value_expr_d
{
  /* Partition index or version number.  */
  int value;

  /* Next element of the list.  */
  struct value_expr_d *next;
} *value_expr_p;
|
|
|
|
|
|
/* Temporary Expression Replacement (TER) table information. */
|
|
|
|
typedef struct temp_expr_table_d
|
|
{
|
|
var_map map;
|
|
void **version_info;
|
|
value_expr_p *partition_dep_list;
|
|
bitmap replaceable;
|
|
bool saw_replaceable;
|
|
int virtual_partition;
|
|
bitmap partition_in_use;
|
|
value_expr_p free_list;
|
|
value_expr_p pending_dependence;
|
|
} *temp_expr_table_p;
|
|
|
|
/* The partition index used to record a dependency on virtual operands
   (the virtual_partition field of TABLE).  The argument is parenthesized
   so that any pointer-valued expression can be passed safely.  */

#define VIRTUAL_PARTITION(table)        ((table)->virtual_partition)
|
|
|
|
static temp_expr_table_p new_temp_expr_table (var_map);
|
|
static tree *free_temp_expr_table (temp_expr_table_p);
|
|
static inline value_expr_p new_value_expr (temp_expr_table_p);
|
|
static inline void free_value_expr (temp_expr_table_p, value_expr_p);
|
|
static inline value_expr_p find_value_in_list (value_expr_p, int,
|
|
value_expr_p *);
|
|
static inline void add_value_to_list (temp_expr_table_p, value_expr_p *, int);
|
|
static inline void add_info_to_list (temp_expr_table_p, value_expr_p *,
|
|
value_expr_p);
|
|
static value_expr_p remove_value_from_list (value_expr_p *, int);
|
|
static void add_dependance (temp_expr_table_p, int, tree);
|
|
static bool check_replaceable (temp_expr_table_p, tree);
|
|
static void finish_expr (temp_expr_table_p, int, bool);
|
|
static void mark_replaceable (temp_expr_table_p, tree);
|
|
static inline void kill_expr (temp_expr_table_p, int, bool);
|
|
static inline void kill_virtual_exprs (temp_expr_table_p, bool);
|
|
static void find_replaceable_in_bb (temp_expr_table_p, basic_block);
|
|
static tree *find_replaceable_exprs (var_map);
|
|
static void dump_replaceable_exprs (FILE *, tree *);
|
|
|
|
|
|
/* Create a new TER table for MAP. */
|
|
|
|
static temp_expr_table_p
|
|
new_temp_expr_table (var_map map)
|
|
{
|
|
temp_expr_table_p t;
|
|
|
|
t = (temp_expr_table_p) xmalloc (sizeof (struct temp_expr_table_d));
|
|
t->map = map;
|
|
|
|
t->version_info = xcalloc (num_ssa_names + 1, sizeof (void *));
|
|
t->partition_dep_list = xcalloc (num_var_partitions (map) + 1,
|
|
sizeof (value_expr_p));
|
|
|
|
t->replaceable = BITMAP_ALLOC (NULL);
|
|
t->partition_in_use = BITMAP_ALLOC (NULL);
|
|
|
|
t->saw_replaceable = false;
|
|
t->virtual_partition = num_var_partitions (map);
|
|
t->free_list = NULL;
|
|
t->pending_dependence = NULL;
|
|
|
|
return t;
|
|
}
|
|
|
|
|
|
/* Free TER table T. If there are valid replacements, return the expression
|
|
vector. */
|
|
|
|
static tree *
|
|
free_temp_expr_table (temp_expr_table_p t)
|
|
{
|
|
value_expr_p p;
|
|
tree *ret = NULL;
|
|
|
|
#ifdef ENABLE_CHECKING
|
|
unsigned x;
|
|
for (x = 0; x <= num_var_partitions (t->map); x++)
|
|
gcc_assert (!t->partition_dep_list[x]);
|
|
#endif
|
|
|
|
while ((p = t->free_list))
|
|
{
|
|
t->free_list = p->next;
|
|
free (p);
|
|
}
|
|
|
|
BITMAP_FREE (t->partition_in_use);
|
|
BITMAP_FREE (t->replaceable);
|
|
|
|
free (t->partition_dep_list);
|
|
if (t->saw_replaceable)
|
|
ret = (tree *)t->version_info;
|
|
else
|
|
free (t->version_info);
|
|
|
|
free (t);
|
|
return ret;
|
|
}
|
|
|
|
|
|
/* Allocate a new value list node. Take it from the free list in TABLE if
|
|
possible. */
|
|
|
|
static inline value_expr_p
|
|
new_value_expr (temp_expr_table_p table)
|
|
{
|
|
value_expr_p p;
|
|
if (table->free_list)
|
|
{
|
|
p = table->free_list;
|
|
table->free_list = p->next;
|
|
}
|
|
else
|
|
p = (value_expr_p) xmalloc (sizeof (struct value_expr_d));
|
|
|
|
return p;
|
|
}
|
|
|
|
|
|
/* Add value list node P to the free list in TABLE. */
|
|
|
|
static inline void
|
|
free_value_expr (temp_expr_table_p table, value_expr_p p)
|
|
{
|
|
p->next = table->free_list;
|
|
table->free_list = p;
|
|
}
|
|
|
|
|
|
/* Find VALUE if it's in LIST. Return a pointer to the list object if found,
|
|
else return NULL. If LAST_PTR is provided, it will point to the previous
|
|
item upon return, or NULL if this is the first item in the list. */
|
|
|
|
static inline value_expr_p
|
|
find_value_in_list (value_expr_p list, int value, value_expr_p *last_ptr)
|
|
{
|
|
value_expr_p curr;
|
|
value_expr_p last = NULL;
|
|
|
|
for (curr = list; curr; last = curr, curr = curr->next)
|
|
{
|
|
if (curr->value == value)
|
|
break;
|
|
}
|
|
if (last_ptr)
|
|
*last_ptr = last;
|
|
return curr;
|
|
}
|
|
|
|
|
|
/* Add VALUE to LIST, if it isn't already present. TAB is the expression
|
|
table */
|
|
|
|
static inline void
|
|
add_value_to_list (temp_expr_table_p tab, value_expr_p *list, int value)
|
|
{
|
|
value_expr_p info;
|
|
|
|
if (!find_value_in_list (*list, value, NULL))
|
|
{
|
|
info = new_value_expr (tab);
|
|
info->value = value;
|
|
info->next = *list;
|
|
*list = info;
|
|
}
|
|
}
|
|
|
|
|
|
/* Add value node INFO if it's value isn't already in LIST. Free INFO if
|
|
it is already in the list. TAB is the expression table. */
|
|
|
|
static inline void
|
|
add_info_to_list (temp_expr_table_p tab, value_expr_p *list, value_expr_p info)
|
|
{
|
|
if (find_value_in_list (*list, info->value, NULL))
|
|
free_value_expr (tab, info);
|
|
else
|
|
{
|
|
info->next = *list;
|
|
*list = info;
|
|
}
|
|
}
|
|
|
|
|
|
/* Look for VALUE in LIST. If found, remove it from the list and return it's
|
|
pointer. */
|
|
|
|
static value_expr_p
|
|
remove_value_from_list (value_expr_p *list, int value)
|
|
{
|
|
value_expr_p info, last;
|
|
|
|
info = find_value_in_list (*list, value, &last);
|
|
if (!info)
|
|
return NULL;
|
|
if (!last)
|
|
*list = info->next;
|
|
else
|
|
last->next = info->next;
|
|
|
|
return info;
|
|
}
|
|
|
|
|
|
/* Add a dependency between the def of ssa VERSION and VAR. If VAR is
|
|
replaceable by an expression, add a dependence each of the elements of the
|
|
expression. These are contained in the pending list. TAB is the
|
|
expression table. */
|
|
|
|
static void
|
|
add_dependance (temp_expr_table_p tab, int version, tree var)
|
|
{
|
|
int i, x;
|
|
value_expr_p info;
|
|
|
|
i = SSA_NAME_VERSION (var);
|
|
if (bitmap_bit_p (tab->replaceable, i))
|
|
{
|
|
/* This variable is being substituted, so use whatever dependences
|
|
were queued up when we marked this as replaceable earlier. */
|
|
while ((info = tab->pending_dependence))
|
|
{
|
|
tab->pending_dependence = info->next;
|
|
/* Get the partition this variable was dependent on. Reuse this
|
|
object to represent the current expression instead. */
|
|
x = info->value;
|
|
info->value = version;
|
|
add_info_to_list (tab, &(tab->partition_dep_list[x]), info);
|
|
add_value_to_list (tab,
|
|
(value_expr_p *)&(tab->version_info[version]), x);
|
|
bitmap_set_bit (tab->partition_in_use, x);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
i = var_to_partition (tab->map, var);
|
|
gcc_assert (i != NO_PARTITION);
|
|
add_value_to_list (tab, &(tab->partition_dep_list[i]), version);
|
|
add_value_to_list (tab,
|
|
(value_expr_p *)&(tab->version_info[version]), i);
|
|
bitmap_set_bit (tab->partition_in_use, i);
|
|
}
|
|
}
|
|
|
|
|
|
/* Check if expression STMT is suitable for replacement in table TAB. If so,
|
|
create an expression entry. Return true if this stmt is replaceable. */
|
|
|
|
static bool
|
|
check_replaceable (temp_expr_table_p tab, tree stmt)
|
|
{
|
|
stmt_ann_t ann;
|
|
vuse_optype vuseops;
|
|
def_optype defs;
|
|
use_optype uses;
|
|
tree var, def;
|
|
int num_use_ops, version;
|
|
var_map map = tab->map;
|
|
ssa_op_iter iter;
|
|
tree call_expr;
|
|
|
|
if (TREE_CODE (stmt) != MODIFY_EXPR)
|
|
return false;
|
|
|
|
ann = stmt_ann (stmt);
|
|
defs = DEF_OPS (ann);
|
|
|
|
/* Punt if there is more than 1 def, or more than 1 use. */
|
|
if (NUM_DEFS (defs) != 1)
|
|
return false;
|
|
def = DEF_OP (defs, 0);
|
|
if (version_ref_count (map, def) != 1)
|
|
return false;
|
|
|
|
/* There must be no V_MAY_DEFS. */
|
|
if (NUM_V_MAY_DEFS (V_MAY_DEF_OPS (ann)) != 0)
|
|
return false;
|
|
|
|
/* There must be no V_MUST_DEFS. */
|
|
if (NUM_V_MUST_DEFS (V_MUST_DEF_OPS (ann)) != 0)
|
|
return false;
|
|
|
|
/* Float expressions must go through memory if float-store is on. */
|
|
if (flag_float_store && FLOAT_TYPE_P (TREE_TYPE (TREE_OPERAND (stmt, 1))))
|
|
return false;
|
|
|
|
/* Calls to functions with side-effects cannot be replaced. */
|
|
if ((call_expr = get_call_expr_in (stmt)) != NULL_TREE)
|
|
{
|
|
int call_flags = call_expr_flags (call_expr);
|
|
if (TREE_SIDE_EFFECTS (call_expr)
|
|
&& !(call_flags & (ECF_PURE | ECF_CONST | ECF_NORETURN)))
|
|
return false;
|
|
}
|
|
|
|
uses = USE_OPS (ann);
|
|
num_use_ops = NUM_USES (uses);
|
|
vuseops = VUSE_OPS (ann);
|
|
|
|
/* Any expression which has no virtual operands and no real operands
|
|
should have been propagated if it's possible to do anything with them.
|
|
If this happens here, it probably exists that way for a reason, so we
|
|
won't touch it. An example is:
|
|
b_4 = &tab
|
|
There are no virtual uses nor any real uses, so we just leave this
|
|
alone to be safe. */
|
|
|
|
if (num_use_ops == 0 && NUM_VUSES (vuseops) == 0)
|
|
return false;
|
|
|
|
version = SSA_NAME_VERSION (def);
|
|
|
|
/* Add this expression to the dependency list for each use partition. */
|
|
FOR_EACH_SSA_TREE_OPERAND (var, stmt, iter, SSA_OP_USE)
|
|
{
|
|
add_dependance (tab, version, var);
|
|
}
|
|
|
|
/* If there are VUSES, add a dependence on virtual defs. */
|
|
if (NUM_VUSES (vuseops) != 0)
|
|
{
|
|
add_value_to_list (tab, (value_expr_p *)&(tab->version_info[version]),
|
|
VIRTUAL_PARTITION (tab));
|
|
add_value_to_list (tab,
|
|
&(tab->partition_dep_list[VIRTUAL_PARTITION (tab)]),
|
|
version);
|
|
bitmap_set_bit (tab->partition_in_use, VIRTUAL_PARTITION (tab));
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* This function will remove the expression for VERSION from replacement
|
|
consideration.n table TAB If 'replace' is true, it is marked as
|
|
replaceable, otherwise not. */
|
|
|
|
static void
|
|
finish_expr (temp_expr_table_p tab, int version, bool replace)
|
|
{
|
|
value_expr_p info, tmp;
|
|
int partition;
|
|
|
|
/* Remove this expression from its dependent lists. The partition dependence
|
|
list is retained and transfered later to whomever uses this version. */
|
|
for (info = (value_expr_p) tab->version_info[version]; info; info = tmp)
|
|
{
|
|
partition = info->value;
|
|
gcc_assert (tab->partition_dep_list[partition]);
|
|
tmp = remove_value_from_list (&(tab->partition_dep_list[partition]),
|
|
version);
|
|
gcc_assert (tmp);
|
|
free_value_expr (tab, tmp);
|
|
/* Only clear the bit when the dependency list is emptied via
|
|
a replacement. Otherwise kill_expr will take care of it. */
|
|
if (!(tab->partition_dep_list[partition]) && replace)
|
|
bitmap_clear_bit (tab->partition_in_use, partition);
|
|
tmp = info->next;
|
|
if (!replace)
|
|
free_value_expr (tab, info);
|
|
}
|
|
|
|
if (replace)
|
|
{
|
|
tab->saw_replaceable = true;
|
|
bitmap_set_bit (tab->replaceable, version);
|
|
}
|
|
else
|
|
{
|
|
gcc_assert (!bitmap_bit_p (tab->replaceable, version));
|
|
tab->version_info[version] = NULL;
|
|
}
|
|
}
|
|
|
|
|
|
/* Mark the expression associated with VAR as replaceable, and enter
|
|
the defining stmt into the version_info table TAB. */
|
|
|
|
static void
|
|
mark_replaceable (temp_expr_table_p tab, tree var)
|
|
{
|
|
value_expr_p info;
|
|
int version = SSA_NAME_VERSION (var);
|
|
finish_expr (tab, version, true);
|
|
|
|
/* Move the dependence list to the pending list. */
|
|
if (tab->version_info[version])
|
|
{
|
|
info = (value_expr_p) tab->version_info[version];
|
|
for ( ; info->next; info = info->next)
|
|
continue;
|
|
info->next = tab->pending_dependence;
|
|
tab->pending_dependence = (value_expr_p)tab->version_info[version];
|
|
}
|
|
|
|
tab->version_info[version] = SSA_NAME_DEF_STMT (var);
|
|
}
|
|
|
|
|
|
/* This function marks any expression in TAB which is dependent on PARTITION
|
|
as NOT replaceable. CLEAR_BIT is used to determine whether partition_in_use
|
|
should have its bit cleared. Since this routine can be called within an
|
|
EXECUTE_IF_SET_IN_BITMAP, the bit can't always be cleared. */
|
|
|
|
static inline void
|
|
kill_expr (temp_expr_table_p tab, int partition, bool clear_bit)
|
|
{
|
|
value_expr_p ptr;
|
|
|
|
/* Mark every active expr dependent on this var as not replaceable. */
|
|
while ((ptr = tab->partition_dep_list[partition]) != NULL)
|
|
finish_expr (tab, ptr->value, false);
|
|
|
|
if (clear_bit)
|
|
bitmap_clear_bit (tab->partition_in_use, partition);
|
|
}
|
|
|
|
|
|
/* This function kills all expressions in TAB which are dependent on virtual
|
|
DEFs. CLEAR_BIT determines whether partition_in_use gets cleared. */
|
|
|
|
static inline void
|
|
kill_virtual_exprs (temp_expr_table_p tab, bool clear_bit)
|
|
{
|
|
kill_expr (tab, VIRTUAL_PARTITION (tab), clear_bit);
|
|
}
|
|
|
|
|
|
/* This function processes basic block BB, and looks for variables which can
|
|
be replaced by their expressions. Results are stored in TAB. */
|
|
|
|
static void
|
|
find_replaceable_in_bb (temp_expr_table_p tab, basic_block bb)
|
|
{
|
|
block_stmt_iterator bsi;
|
|
tree stmt, def;
|
|
stmt_ann_t ann;
|
|
int partition;
|
|
var_map map = tab->map;
|
|
value_expr_p p;
|
|
ssa_op_iter iter;
|
|
|
|
for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
|
|
{
|
|
stmt = bsi_stmt (bsi);
|
|
ann = stmt_ann (stmt);
|
|
|
|
/* Determine if this stmt finishes an existing expression. */
|
|
FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_USE)
|
|
{
|
|
if (tab->version_info[SSA_NAME_VERSION (def)])
|
|
{
|
|
bool same_root_var = false;
|
|
tree def2;
|
|
ssa_op_iter iter2;
|
|
|
|
/* See if the root variables are the same. If they are, we
|
|
do not want to do the replacement to avoid problems with
|
|
code size, see PR tree-optimization/17549. */
|
|
FOR_EACH_SSA_TREE_OPERAND (def2, stmt, iter2, SSA_OP_DEF)
|
|
if (SSA_NAME_VAR (def) == SSA_NAME_VAR (def2))
|
|
{
|
|
same_root_var = true;
|
|
break;
|
|
}
|
|
|
|
/* Mark expression as replaceable unless stmt is volatile
|
|
or DEF sets the same root variable as STMT. */
|
|
if (!ann->has_volatile_ops && !same_root_var)
|
|
mark_replaceable (tab, def);
|
|
else
|
|
finish_expr (tab, SSA_NAME_VERSION (def), false);
|
|
}
|
|
}
|
|
|
|
/* Next, see if this stmt kills off an active expression. */
|
|
FOR_EACH_SSA_TREE_OPERAND (def, stmt, iter, SSA_OP_DEF)
|
|
{
|
|
partition = var_to_partition (map, def);
|
|
if (partition != NO_PARTITION && tab->partition_dep_list[partition])
|
|
kill_expr (tab, partition, true);
|
|
}
|
|
|
|
/* Now see if we are creating a new expression or not. */
|
|
if (!ann->has_volatile_ops)
|
|
check_replaceable (tab, stmt);
|
|
|
|
/* Free any unused dependency lists. */
|
|
while ((p = tab->pending_dependence))
|
|
{
|
|
tab->pending_dependence = p->next;
|
|
free_value_expr (tab, p);
|
|
}
|
|
|
|
/* A V_MAY_DEF kills any expression using a virtual operand. */
|
|
if (NUM_V_MAY_DEFS (V_MAY_DEF_OPS (ann)) > 0)
|
|
kill_virtual_exprs (tab, true);
|
|
|
|
/* A V_MUST_DEF kills any expression using a virtual operand. */
|
|
if (NUM_V_MUST_DEFS (V_MUST_DEF_OPS (ann)) > 0)
|
|
kill_virtual_exprs (tab, true);
|
|
}
|
|
}
|
|
|
|
|
|
/* This function is the driver routine for replacement of temporary expressions
|
|
in the SSA->normal phase, operating on MAP. If there are replaceable
|
|
expressions, a table is returned which maps SSA versions to the
|
|
expressions they should be replaced with. A NULL_TREE indicates no
|
|
replacement should take place. If there are no replacements at all,
|
|
NULL is returned by the function, otherwise an expression vector indexed
|
|
by SSA_NAME version numbers. */
|
|
|
|
static tree *
|
|
find_replaceable_exprs (var_map map)
|
|
{
|
|
basic_block bb;
|
|
unsigned i;
|
|
temp_expr_table_p table;
|
|
tree *ret;
|
|
|
|
table = new_temp_expr_table (map);
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
bitmap_iterator bi;
|
|
|
|
find_replaceable_in_bb (table, bb);
|
|
EXECUTE_IF_SET_IN_BITMAP ((table->partition_in_use), 0, i, bi)
|
|
{
|
|
kill_expr (table, i, false);
|
|
}
|
|
}
|
|
|
|
ret = free_temp_expr_table (table);
|
|
return ret;
|
|
}
|
|
|
|
|
|
/* Dump TER expression table EXPR to file F. */
|
|
|
|
static void
|
|
dump_replaceable_exprs (FILE *f, tree *expr)
|
|
{
|
|
tree stmt, var;
|
|
int x;
|
|
fprintf (f, "\nReplacing Expressions\n");
|
|
for (x = 0; x < (int)num_ssa_names + 1; x++)
|
|
if (expr[x])
|
|
{
|
|
stmt = expr[x];
|
|
var = DEF_OP (STMT_DEF_OPS (stmt), 0);
|
|
print_generic_expr (f, var, TDF_SLIM);
|
|
fprintf (f, " replace with --> ");
|
|
print_generic_expr (f, TREE_OPERAND (stmt, 1), TDF_SLIM);
|
|
fprintf (f, "\n");
|
|
}
|
|
fprintf (f, "\n");
|
|
}
|
|
|
|
|
|
/* Helper function for discover_nonconstant_array_refs.
|
|
Look for ARRAY_REF nodes with non-constant indexes and mark them
|
|
addressable. */
|
|
|
|
static tree
|
|
discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
|
|
void *data ATTRIBUTE_UNUSED)
|
|
{
|
|
tree t = *tp;
|
|
|
|
if (IS_TYPE_OR_DECL_P (t))
|
|
*walk_subtrees = 0;
|
|
else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
|
|
{
|
|
while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
|
|
&& is_gimple_min_invariant (TREE_OPERAND (t, 1))
|
|
&& (!TREE_OPERAND (t, 2)
|
|
|| is_gimple_min_invariant (TREE_OPERAND (t, 2))))
|
|
|| (TREE_CODE (t) == COMPONENT_REF
|
|
&& (!TREE_OPERAND (t,2)
|
|
|| is_gimple_min_invariant (TREE_OPERAND (t, 2))))
|
|
|| TREE_CODE (t) == BIT_FIELD_REF
|
|
|| TREE_CODE (t) == REALPART_EXPR
|
|
|| TREE_CODE (t) == IMAGPART_EXPR
|
|
|| TREE_CODE (t) == VIEW_CONVERT_EXPR
|
|
|| TREE_CODE (t) == NOP_EXPR
|
|
|| TREE_CODE (t) == CONVERT_EXPR)
|
|
t = TREE_OPERAND (t, 0);
|
|
|
|
if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
|
|
{
|
|
t = get_base_address (t);
|
|
if (t && DECL_P (t))
|
|
TREE_ADDRESSABLE (t) = 1;
|
|
}
|
|
|
|
*walk_subtrees = 0;
|
|
}
|
|
|
|
return NULL_TREE;
|
|
}
|
|
|
|
|
|
/* RTL expansion is not able to compile array references with variable
|
|
offsets for arrays stored in single register. Discover such
|
|
expressions and mark variables as addressable to avoid this
|
|
scenario. */
|
|
|
|
static void
|
|
discover_nonconstant_array_refs (void)
|
|
{
|
|
basic_block bb;
|
|
block_stmt_iterator bsi;
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
|
|
walk_tree (bsi_stmt_ptr (bsi), discover_nonconstant_array_refs_r,
|
|
NULL , NULL);
|
|
}
|
|
}
|
|
|
|
|
|
/* This function will rewrite the current program using the variable mapping
|
|
found in MAP. If the replacement vector VALUES is provided, any
|
|
occurrences of partitions with non-null entries in the vector will be
|
|
replaced with the expression in the vector instead of its mapped
|
|
variable. */
|
|
|
|
static void
|
|
rewrite_trees (var_map map, tree *values)
|
|
{
|
|
elim_graph g;
|
|
basic_block bb;
|
|
block_stmt_iterator si;
|
|
edge e;
|
|
tree phi;
|
|
bool changed;
|
|
|
|
#ifdef ENABLE_CHECKING
|
|
/* Search for PHIs where the destination has no partition, but one
|
|
or more arguments has a partition. This should not happen and can
|
|
create incorrect code. */
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
tree phi;
|
|
|
|
for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
tree T0 = var_to_partition_to_var (map, PHI_RESULT (phi));
|
|
|
|
if (T0 == NULL_TREE)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < PHI_NUM_ARGS (phi); i++)
|
|
{
|
|
tree arg = PHI_ARG_DEF (phi, i);
|
|
|
|
if (TREE_CODE (arg) == SSA_NAME
|
|
&& var_to_partition (map, arg) != NO_PARTITION)
|
|
{
|
|
fprintf (stderr, "Argument of PHI is in a partition :(");
|
|
print_generic_expr (stderr, arg, TDF_SLIM);
|
|
fprintf (stderr, "), but the result is not :");
|
|
print_generic_stmt (stderr, phi, TDF_SLIM);
|
|
internal_error ("SSA corruption");
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
#endif
|
|
|
|
/* Replace PHI nodes with any required copies. */
|
|
g = new_elim_graph (map->num_partitions);
|
|
g->map = map;
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
for (si = bsi_start (bb); !bsi_end_p (si); )
|
|
{
|
|
size_t num_uses, num_defs;
|
|
use_optype uses;
|
|
def_optype defs;
|
|
tree stmt = bsi_stmt (si);
|
|
use_operand_p use_p;
|
|
def_operand_p def_p;
|
|
int remove = 0, is_copy = 0;
|
|
stmt_ann_t ann;
|
|
ssa_op_iter iter;
|
|
|
|
get_stmt_operands (stmt);
|
|
ann = stmt_ann (stmt);
|
|
changed = false;
|
|
|
|
if (TREE_CODE (stmt) == MODIFY_EXPR
|
|
&& (TREE_CODE (TREE_OPERAND (stmt, 1)) == SSA_NAME))
|
|
is_copy = 1;
|
|
|
|
uses = USE_OPS (ann);
|
|
num_uses = NUM_USES (uses);
|
|
FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
|
|
{
|
|
if (replace_use_variable (map, use_p, values))
|
|
changed = true;
|
|
}
|
|
|
|
defs = DEF_OPS (ann);
|
|
num_defs = NUM_DEFS (defs);
|
|
|
|
/* Mark this stmt for removal if it is the list of replaceable
|
|
expressions. */
|
|
if (values && num_defs == 1)
|
|
{
|
|
tree def = DEF_OP (defs, 0);
|
|
tree val;
|
|
val = values[SSA_NAME_VERSION (def)];
|
|
if (val)
|
|
remove = 1;
|
|
}
|
|
if (!remove)
|
|
{
|
|
FOR_EACH_SSA_DEF_OPERAND (def_p, stmt, iter, SSA_OP_DEF)
|
|
{
|
|
if (replace_def_variable (map, def_p, NULL))
|
|
changed = true;
|
|
|
|
/* If both SSA_NAMEs coalesce to the same variable,
|
|
mark the now redundant copy for removal. */
|
|
if (is_copy
|
|
&& num_uses == 1
|
|
&& (DEF_FROM_PTR (def_p) == USE_OP (uses, 0)))
|
|
remove = 1;
|
|
}
|
|
if (changed & !remove)
|
|
modify_stmt (stmt);
|
|
}
|
|
|
|
/* Remove any stmts marked for removal. */
|
|
if (remove)
|
|
bsi_remove (&si);
|
|
else
|
|
bsi_next (&si);
|
|
}
|
|
|
|
phi = phi_nodes (bb);
|
|
if (phi)
|
|
{
|
|
edge_iterator ei;
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
eliminate_phi (e, g);
|
|
}
|
|
}
|
|
|
|
delete_elim_graph (g);
|
|
}
|
|
|
|
|
|
/* These are the local work structures used to determine the best place to
|
|
insert the copies that were placed on edges by the SSA->normal pass.. */
|
|
static varray_type edge_leader = NULL;
|
|
static varray_type GTY(()) stmt_list = NULL;
|
|
static bitmap leader_has_match = NULL;
|
|
static edge leader_match = NULL;
|
|
|
|
|
|
/* Pass this function to make_forwarder_block so that all the edges with
|
|
matching PENDING_STMT lists to 'curr_stmt_list' get redirected. */
|
|
static bool
|
|
same_stmt_list_p (edge e)
|
|
{
|
|
return (e->aux == (PTR) leader_match) ? true : false;
|
|
}
|
|
|
|
|
|
/* Return TRUE if S1 and S2 are equivalent copies. */
|
|
static inline bool
|
|
identical_copies_p (tree s1, tree s2)
|
|
{
|
|
#ifdef ENABLE_CHECKING
|
|
gcc_assert (TREE_CODE (s1) == MODIFY_EXPR);
|
|
gcc_assert (TREE_CODE (s2) == MODIFY_EXPR);
|
|
gcc_assert (DECL_P (TREE_OPERAND (s1, 0)));
|
|
gcc_assert (DECL_P (TREE_OPERAND (s2, 0)));
|
|
#endif
|
|
|
|
if (TREE_OPERAND (s1, 0) != TREE_OPERAND (s2, 0))
|
|
return false;
|
|
|
|
s1 = TREE_OPERAND (s1, 1);
|
|
s2 = TREE_OPERAND (s2, 1);
|
|
|
|
if (s1 != s2)
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* Compare the PENDING_STMT list for two edges, and return true if the lists
|
|
contain the same sequence of copies. */
|
|
|
|
static inline bool
|
|
identical_stmt_lists_p (edge e1, edge e2)
|
|
{
|
|
tree t1 = PENDING_STMT (e1);
|
|
tree t2 = PENDING_STMT (e2);
|
|
tree_stmt_iterator tsi1, tsi2;
|
|
|
|
gcc_assert (TREE_CODE (t1) == STATEMENT_LIST);
|
|
gcc_assert (TREE_CODE (t2) == STATEMENT_LIST);
|
|
|
|
for (tsi1 = tsi_start (t1), tsi2 = tsi_start (t2);
|
|
!tsi_end_p (tsi1) && !tsi_end_p (tsi2);
|
|
tsi_next (&tsi1), tsi_next (&tsi2))
|
|
{
|
|
if (!identical_copies_p (tsi_stmt (tsi1), tsi_stmt (tsi2)))
|
|
break;
|
|
}
|
|
|
|
if (!tsi_end_p (tsi1) || ! tsi_end_p (tsi2))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* Look at all the incoming edges to block BB, and decide where the best place
|
|
to insert the stmts on each edge are, and perform those insertions. Output
|
|
any debug information to DEBUG_FILE. */
|
|
|
|
static void
|
|
analyze_edges_for_bb (basic_block bb, FILE *debug_file)
|
|
{
|
|
edge e;
|
|
edge_iterator ei;
|
|
int count;
|
|
unsigned int x;
|
|
bool have_opportunity;
|
|
block_stmt_iterator bsi;
|
|
tree stmt;
|
|
edge single_edge = NULL;
|
|
bool is_label;
|
|
|
|
count = 0;
|
|
|
|
/* Blocks which contain at least one abnormal edge cannot use
|
|
make_forwarder_block. Look for these blocks, and commit any PENDING_STMTs
|
|
found on edges in these block. */
|
|
have_opportunity = true;
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
if (e->flags & EDGE_ABNORMAL)
|
|
{
|
|
have_opportunity = false;
|
|
break;
|
|
}
|
|
|
|
if (!have_opportunity)
|
|
{
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
if (PENDING_STMT (e))
|
|
bsi_commit_one_edge_insert (e, NULL);
|
|
return;
|
|
}
|
|
/* Find out how many edges there are with interesting pending stmts on them.
|
|
Commit the stmts on edges we are not interested in. */
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
{
|
|
gcc_assert (!(e->flags & EDGE_ABNORMAL));
|
|
if (e->flags & EDGE_FALLTHRU)
|
|
{
|
|
bsi = bsi_start (e->src);
|
|
if (!bsi_end_p (bsi))
|
|
{
|
|
stmt = bsi_stmt (bsi);
|
|
bsi_next (&bsi);
|
|
gcc_assert (stmt != NULL_TREE);
|
|
is_label = (TREE_CODE (stmt) == LABEL_EXPR);
|
|
/* Punt if it has non-label stmts, or isn't local. */
|
|
if (!is_label || DECL_NONLOCAL (TREE_OPERAND (stmt, 0))
|
|
|| !bsi_end_p (bsi))
|
|
{
|
|
bsi_commit_one_edge_insert (e, NULL);
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
single_edge = e;
|
|
count++;
|
|
}
|
|
}
|
|
|
|
/* If there aren't at least 2 edges, no sharing will happen. */
|
|
if (count < 2)
|
|
{
|
|
if (single_edge)
|
|
bsi_commit_one_edge_insert (single_edge, NULL);
|
|
return;
|
|
}
|
|
|
|
/* Ensure that we have empty worklists. */
|
|
if (edge_leader == NULL)
|
|
{
|
|
VARRAY_EDGE_INIT (edge_leader, 25, "edge_leader");
|
|
VARRAY_TREE_INIT (stmt_list, 25, "stmt_list");
|
|
leader_has_match = BITMAP_ALLOC (NULL);
|
|
}
|
|
else
|
|
{
|
|
#ifdef ENABLE_CHECKING
|
|
gcc_assert (VARRAY_ACTIVE_SIZE (edge_leader) == 0);
|
|
gcc_assert (VARRAY_ACTIVE_SIZE (stmt_list) == 0);
|
|
gcc_assert (bitmap_empty_p (leader_has_match));
|
|
#endif
|
|
}
|
|
|
|
/* Find the "leader" block for each set of unique stmt lists. Preference is
|
|
given to FALLTHRU blocks since they would need a GOTO to arrive at another
|
|
block. The leader edge destination is the block which all the other edges
|
|
with the same stmt list will be redirected to. */
|
|
have_opportunity = false;
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
{
|
|
bool found = false;
|
|
|
|
/* Look for the same stmt list in edge leaders list. */
|
|
for (x = 0; x < VARRAY_ACTIVE_SIZE (edge_leader); x++)
|
|
{
|
|
edge leader = VARRAY_EDGE (edge_leader, x);
|
|
if (identical_stmt_lists_p (leader, e))
|
|
{
|
|
/* Give this edge the same stmt list pointer. */
|
|
PENDING_STMT (e) = NULL;
|
|
e->aux = leader;
|
|
bitmap_set_bit (leader_has_match, x);
|
|
have_opportunity = found = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* If no similar stmt list, add this edge to the leader list. */
|
|
if (!found)
|
|
{
|
|
VARRAY_PUSH_EDGE (edge_leader, e);
|
|
VARRAY_PUSH_TREE (stmt_list, PENDING_STMT (e));
|
|
}
|
|
}
|
|
}
|
|
|
|
/* If there are no similar lists, just issue the stmts. */
|
|
if (!have_opportunity)
|
|
{
|
|
for (x = 0; x < VARRAY_ACTIVE_SIZE (edge_leader); x++)
|
|
bsi_commit_one_edge_insert (VARRAY_EDGE (edge_leader, x), NULL);
|
|
VARRAY_POP_ALL (edge_leader);
|
|
VARRAY_POP_ALL (stmt_list);
|
|
bitmap_clear (leader_has_match);
|
|
return;
|
|
}
|
|
|
|
|
|
if (debug_file)
|
|
fprintf (debug_file, "\nOpportunities in BB %d for stmt/block reduction:\n",
|
|
bb->index);
|
|
|
|
|
|
/* For each common list, create a forwarding block and issue the stmt's
|
|
in that block. */
|
|
for (x = 0 ; x < VARRAY_ACTIVE_SIZE (edge_leader); x++)
|
|
if (bitmap_bit_p (leader_has_match, x))
|
|
{
|
|
edge new_edge, leader_edge;
|
|
block_stmt_iterator bsi;
|
|
tree curr_stmt_list;
|
|
|
|
leader_match = leader_edge = VARRAY_EDGE (edge_leader, x);
|
|
|
|
/* The tree_* cfg manipulation routines use the PENDING_EDGE field
|
|
for various PHI manipulations, so it gets cleared whhen calls are
|
|
made to make_forwarder_block(). So make sure the edge is clear,
|
|
and use the saved stmt list. */
|
|
PENDING_STMT (leader_edge) = NULL;
|
|
leader_edge->aux = leader_edge;
|
|
curr_stmt_list = VARRAY_TREE (stmt_list, x);
|
|
|
|
new_edge = make_forwarder_block (leader_edge->dest, same_stmt_list_p,
|
|
NULL);
|
|
bb = new_edge->dest;
|
|
if (debug_file)
|
|
{
|
|
fprintf (debug_file, "Splitting BB %d for Common stmt list. ",
|
|
leader_edge->dest->index);
|
|
fprintf (debug_file, "Original block is now BB%d.\n", bb->index);
|
|
print_generic_stmt (debug_file, curr_stmt_list, TDF_VOPS);
|
|
}
|
|
|
|
FOR_EACH_EDGE (e, ei, new_edge->src->preds)
|
|
{
|
|
e->aux = NULL;
|
|
if (debug_file)
|
|
fprintf (debug_file, " Edge (%d->%d) lands here.\n",
|
|
e->src->index, e->dest->index);
|
|
}
|
|
|
|
bsi = bsi_last (leader_edge->dest);
|
|
bsi_insert_after (&bsi, curr_stmt_list, BSI_NEW_STMT);
|
|
|
|
leader_match = NULL;
|
|
/* We should never get a new block now. */
|
|
}
|
|
else
|
|
{
|
|
e = VARRAY_EDGE (edge_leader, x);
|
|
PENDING_STMT (e) = VARRAY_TREE (stmt_list, x);
|
|
bsi_commit_one_edge_insert (e, NULL);
|
|
}
|
|
|
|
|
|
/* Clear the working data structures. */
|
|
VARRAY_POP_ALL (edge_leader);
|
|
VARRAY_POP_ALL (stmt_list);
|
|
bitmap_clear (leader_has_match);
|
|
}
|
|
|
|
|
|
/* This function will analyze the insertions which were performed on edges,
|
|
and decide whether they should be left on that edge, or whether it is more
|
|
efficient to emit some subset of them in a single block. All stmts are
|
|
inserted somewhere, and if non-NULL, debug information is printed via
|
|
DUMP_FILE. */
|
|
|
|
static void
|
|
perform_edge_inserts (FILE *dump_file)
|
|
{
|
|
basic_block bb;
|
|
|
|
if (dump_file)
|
|
fprintf(dump_file, "Analyzing Edge Insertions.\n");
|
|
|
|
/* analyze_edges_for_bb calls make_forwarder_block, which tries to
|
|
incrementally update the dominator information. Since we don't
|
|
need dominator information after this pass, go ahead and free the
|
|
dominator information. */
|
|
free_dominance_info (CDI_DOMINATORS);
|
|
free_dominance_info (CDI_POST_DOMINATORS);
|
|
|
|
FOR_EACH_BB (bb)
|
|
analyze_edges_for_bb (bb, dump_file);
|
|
|
|
analyze_edges_for_bb (EXIT_BLOCK_PTR, dump_file);
|
|
|
|
/* Clear out any tables which were created. */
|
|
edge_leader = NULL;
|
|
BITMAP_FREE (leader_has_match);
|
|
|
|
#ifdef ENABLE_CHECKING
|
|
{
|
|
edge_iterator ei;
|
|
edge e;
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
error (" Pending stmts not issued on PRED edge (%d, %d)\n",
|
|
e->src->index, e->dest->index);
|
|
}
|
|
FOR_EACH_EDGE (e, ei, bb->succs)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
error (" Pending stmts not issued on SUCC edge (%d, %d)\n",
|
|
e->src->index, e->dest->index);
|
|
}
|
|
}
|
|
FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR->succs)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
error (" Pending stmts not issued on ENTRY edge (%d, %d)\n",
|
|
e->src->index, e->dest->index);
|
|
}
|
|
FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR->preds)
|
|
{
|
|
if (PENDING_STMT (e))
|
|
error (" Pending stmts not issued on EXIT edge (%d, %d)\n",
|
|
e->src->index, e->dest->index);
|
|
}
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
/* Remove the variables specified in MAP from SSA form. Any debug information
|
|
is sent to DUMP. FLAGS indicate what options should be used. */
|
|
|
|
static void
|
|
remove_ssa_form (FILE *dump, var_map map, int flags)
|
|
{
|
|
tree_live_info_p liveinfo;
|
|
basic_block bb;
|
|
tree phi, next;
|
|
FILE *save;
|
|
tree *values = NULL;
|
|
|
|
save = dump_file;
|
|
dump_file = dump;
|
|
|
|
/* If we are not combining temps, don't calculate live ranges for variables
|
|
with only one SSA version. */
|
|
if ((flags & SSANORM_COMBINE_TEMPS) == 0)
|
|
compact_var_map (map, VARMAP_NO_SINGLE_DEFS);
|
|
else
|
|
compact_var_map (map, VARMAP_NORMAL);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
dump_var_map (dump_file, map);
|
|
|
|
liveinfo = coalesce_ssa_name (map, flags);
|
|
|
|
/* Make sure even single occurrence variables are in the list now. */
|
|
if ((flags & SSANORM_COMBINE_TEMPS) == 0)
|
|
compact_var_map (map, VARMAP_NORMAL);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "After Coalescing:\n");
|
|
dump_var_map (dump_file, map);
|
|
}
|
|
|
|
if (flags & SSANORM_PERFORM_TER)
|
|
{
|
|
values = find_replaceable_exprs (map);
|
|
if (values && dump_file && (dump_flags & TDF_DETAILS))
|
|
dump_replaceable_exprs (dump_file, values);
|
|
}
|
|
|
|
/* Assign real variables to the partitions now. */
|
|
assign_vars (map);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "After Root variable replacement:\n");
|
|
dump_var_map (dump_file, map);
|
|
}
|
|
|
|
if ((flags & SSANORM_COMBINE_TEMPS) && liveinfo)
|
|
{
|
|
coalesce_vars (map, liveinfo);
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fprintf (dump_file, "After variable memory coalescing:\n");
|
|
dump_var_map (dump_file, map);
|
|
}
|
|
}
|
|
|
|
if (liveinfo)
|
|
delete_tree_live_info (liveinfo);
|
|
|
|
rewrite_trees (map, values);
|
|
|
|
if (values)
|
|
free (values);
|
|
|
|
/* Remove phi nodes which have been translated back to real variables. */
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
for (phi = phi_nodes (bb); phi; phi = next)
|
|
{
|
|
next = PHI_CHAIN (phi);
|
|
remove_phi_node (phi, NULL_TREE);
|
|
}
|
|
}
|
|
|
|
/* If any copies were inserted on edges, analyze and insert them now. */
|
|
perform_edge_inserts (dump_file);
|
|
|
|
dump_file = save;
|
|
}
|
|
|
|
/* Search every PHI node for arguments associated with backedges which
|
|
we can trivially determine will need a copy (the argument is either
|
|
not an SSA_NAME or the argument has a different underlying variable
|
|
than the PHI result).
|
|
|
|
Insert a copy from the PHI argument to a new destination at the
|
|
end of the block with the backedge to the top of the loop. Update
|
|
the PHI argument to reference this new destination. */
|
|
|
|
static void
|
|
insert_backedge_copies (void)
|
|
{
|
|
basic_block bb;
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
tree phi;
|
|
|
|
for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
tree result = PHI_RESULT (phi);
|
|
tree result_var;
|
|
int i;
|
|
|
|
if (!is_gimple_reg (result))
|
|
continue;
|
|
|
|
result_var = SSA_NAME_VAR (result);
|
|
for (i = 0; i < PHI_NUM_ARGS (phi); i++)
|
|
{
|
|
tree arg = PHI_ARG_DEF (phi, i);
|
|
edge e = PHI_ARG_EDGE (phi, i);
|
|
|
|
/* If the argument is not an SSA_NAME, then we will
|
|
need a constant initialization. If the argument is
|
|
an SSA_NAME with a different underlying variable and
|
|
we are not combining temporaries, then we will
|
|
need a copy statement. */
|
|
if ((e->flags & EDGE_DFS_BACK)
|
|
&& (TREE_CODE (arg) != SSA_NAME
|
|
|| (!flag_tree_combine_temps
|
|
&& SSA_NAME_VAR (arg) != result_var)))
|
|
{
|
|
tree stmt, name, last = NULL;
|
|
block_stmt_iterator bsi;
|
|
|
|
bsi = bsi_last (PHI_ARG_EDGE (phi, i)->src);
|
|
if (!bsi_end_p (bsi))
|
|
last = bsi_stmt (bsi);
|
|
|
|
/* In theory the only way we ought to get back to the
|
|
start of a loop should be with a COND_EXPR or GOTO_EXPR.
|
|
However, better safe than sorry.
|
|
|
|
If the block ends with a control statement or
|
|
something that might throw, then we have to
|
|
insert this assignment before the last
|
|
statement. Else insert it after the last statement. */
|
|
if (last && stmt_ends_bb_p (last))
|
|
{
|
|
/* If the last statement in the block is the definition
|
|
site of the PHI argument, then we can't insert
|
|
anything after it. */
|
|
if (TREE_CODE (arg) == SSA_NAME
|
|
&& SSA_NAME_DEF_STMT (arg) == last)
|
|
continue;
|
|
}
|
|
|
|
/* Create a new instance of the underlying
|
|
variable of the PHI result. */
|
|
stmt = build (MODIFY_EXPR, TREE_TYPE (result_var),
|
|
NULL, PHI_ARG_DEF (phi, i));
|
|
name = make_ssa_name (result_var, stmt);
|
|
TREE_OPERAND (stmt, 0) = name;
|
|
|
|
/* Insert the new statement into the block and update
|
|
the PHI node. */
|
|
if (last && stmt_ends_bb_p (last))
|
|
bsi_insert_before (&bsi, stmt, BSI_NEW_STMT);
|
|
else
|
|
bsi_insert_after (&bsi, stmt, BSI_NEW_STMT);
|
|
modify_stmt (stmt);
|
|
SET_PHI_ARG_DEF (phi, i, name);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Take the current function out of SSA form, as described in
|
|
R. Morgan, ``Building an Optimizing Compiler'',
|
|
Butterworth-Heinemann, Boston, MA, 1998. pp 176-186. */
|
|
|
|
static void
|
|
rewrite_out_of_ssa (void)
|
|
{
|
|
var_map map;
|
|
int var_flags = 0;
|
|
int ssa_flags = 0;
|
|
|
|
/* If elimination of a PHI requires inserting a copy on a backedge,
|
|
then we will have to split the backedge which has numerous
|
|
undesirable performance effects.
|
|
|
|
A significant number of such cases can be handled here by inserting
|
|
copies into the loop itself. */
|
|
insert_backedge_copies ();
|
|
|
|
if (!flag_tree_live_range_split)
|
|
ssa_flags |= SSANORM_COALESCE_PARTITIONS;
|
|
|
|
eliminate_virtual_phis ();
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
dump_tree_cfg (dump_file, dump_flags & ~TDF_DETAILS);
|
|
|
|
/* We cannot allow unssa to un-gimplify trees before we instrument them. */
|
|
if (flag_tree_ter && !flag_mudflap)
|
|
var_flags = SSA_VAR_MAP_REF_COUNT;
|
|
|
|
map = create_ssa_var_map (var_flags);
|
|
|
|
if (flag_tree_combine_temps)
|
|
ssa_flags |= SSANORM_COMBINE_TEMPS;
|
|
if (flag_tree_ter && !flag_mudflap)
|
|
ssa_flags |= SSANORM_PERFORM_TER;
|
|
|
|
remove_ssa_form (dump_file, map, ssa_flags);
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
dump_tree_cfg (dump_file, dump_flags & ~TDF_DETAILS);
|
|
|
|
/* Do some cleanups which reduce the amount of data the
|
|
tree->rtl expanders deal with. */
|
|
cfg_remove_useless_stmts ();
|
|
|
|
/* Flush out flow graph and SSA data. */
|
|
delete_var_map (map);
|
|
|
|
/* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
|
|
discover_nonconstant_array_refs ();
|
|
}
|
|
|
|
|
|
/* Define the parameters of the out of SSA pass. */
|
|
|
|
struct tree_opt_pass pass_del_ssa =
|
|
{
|
|
"optimized", /* name */
|
|
NULL, /* gate */
|
|
rewrite_out_of_ssa, /* execute */
|
|
NULL, /* sub */
|
|
NULL, /* next */
|
|
0, /* static_pass_number */
|
|
TV_TREE_SSA_TO_NORMAL, /* tv_id */
|
|
PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
|
|
0, /* properties_provided */
|
|
/* ??? If TER is enabled, we also kill gimple. */
|
|
PROP_ssa, /* properties_destroyed */
|
|
TODO_verify_ssa | TODO_verify_flow
|
|
| TODO_verify_stmts, /* todo_flags_start */
|
|
TODO_dump_func | TODO_ggc_collect, /* todo_flags_finish */
|
|
0 /* letter */
|
|
};
|