4d0cdd0ce6
2016-10-13 Thomas Preud'homme <thomas.preudhomme@arm.com> gcc/ * coretypes.h: Move MEMMODEL_* macros and enum memmodel definition into ... * memmodel.h: This file. * alias.c, asan.c, auto-inc-dec.c, bb-reorder.c, bt-load.c, caller-save.c, calls.c, ccmp.c, cfgbuild.c, cfgcleanup.c, cfgexpand.c, cfgloopanal.c, cfgrtl.c, cilk-common.c, combine.c, combine-stack-adj.c, common/config/aarch64/aarch64-common.c, common/config/arm/arm-common.c, common/config/bfin/bfin-common.c, common/config/c6x/c6x-common.c, common/config/i386/i386-common.c, common/config/ia64/ia64-common.c, common/config/nvptx/nvptx-common.c, compare-elim.c, config/aarch64/aarch64-builtins.c, config/aarch64/aarch64-c.c, config/aarch64/cortex-a57-fma-steering.c, config/arc/arc.c, config/arc/arc-c.c, config/arm/arm-builtins.c, config/arm/arm-c.c, config/avr/avr.c, config/avr/avr-c.c, config/avr/avr-log.c, config/bfin/bfin.c, config/c6x/c6x.c, config/cr16/cr16.c, config/cris/cris.c, config/darwin-c.c, config/darwin.c, config/epiphany/epiphany.c, config/epiphany/mode-switch-use.c, config/epiphany/resolve-sw-modes.c, config/fr30/fr30.c, config/frv/frv.c, config/ft32/ft32.c, config/h8300/h8300.c, config/i386/i386-c.c, config/i386/winnt.c, config/iq2000/iq2000.c, config/lm32/lm32.c, config/m32c/m32c.c, config/m32r/m32r.c, config/m68k/m68k.c, config/mcore/mcore.c, config/microblaze/microblaze.c, config/mmix/mmix.c, config/mn10300/mn10300.c, config/moxie/moxie.c, config/msp430/msp430.c, config/nds32/nds32-cost.c, config/nds32/nds32-intrinsic.c, config/nds32/nds32-md-auxiliary.c, config/nds32/nds32-memory-manipulation.c, config/nds32/nds32-predicates.c, config/nds32/nds32.c, config/nios2/nios2.c, config/nvptx/nvptx.c, config/pa/pa.c, config/pdp11/pdp11.c, config/rl78/rl78.c, config/rs6000/rs6000-c.c, config/rx/rx.c, config/s390/s390-c.c, config/s390/s390.c, config/sh/sh.c, config/sh/sh-c.c, config/sh/sh-mem.cc, config/sh/sh_treg_combine.cc, config/sol2.c, config/spu/spu.c, config/stormy16/stormy16.c, config/tilegx/tilegx.c, config/tilepro/tilepro.c, config/v850/v850.c, config/vax/vax.c, config/visium/visium.c, config/vms/vms-c.c, config/xtensa/xtensa.c, coverage.c, cppbuiltin.c, cprop.c, cse.c, cselib.c, dbxout.c, dce.c, df-core.c, df-problems.c, df-scan.c, dojump.c, dse.c, dwarf2asm.c, dwarf2cfi.c, dwarf2out.c, emit-rtl.c, except.c, explow.c, expmed.c, expr.c, final.c, fold-const.c, function.c, fwprop.c, gcse.c, ggc-page.c, haifa-sched.c, hsa-brig.c, hsa-gen.c, hw-doloop.c, ifcvt.c, init-regs.c, internal-fn.c, ira-build.c, ira-color.c, ira-conflicts.c, ira-costs.c, ira-emit.c, ira-lives.c, ira.c, jump.c, loop-doloop.c, loop-invariant.c, loop-iv.c, loop-unroll.c, lower-subreg.c, lra.c, lra-assigns.c, lra-coalesce.c, lra-constraints.c, lra-eliminations.c, lra-lives.c, lra-remat.c, lra-spills.c, mode-switching.c, modulo-sched.c, omp-low.c, passes.c, postreload-gcse.c, postreload.c, predict.c, print-rtl-function.c, recog.c, ree.c, reg-stack.c, regcprop.c, reginfo.c, regrename.c, reload.c, reload1.c, reorg.c, resource.c, rtl-chkp.c, rtl-tests.c, rtlanal.c, rtlhooks.c, sched-deps.c, sched-rgn.c, sdbout.c, sel-sched-ir.c, sel-sched.c, shrink-wrap.c, simplify-rtx.c, stack-ptr-mod.c, stmt.c, stor-layout.c, target-globals.c, targhooks.c, toplev.c, tree-nested.c, tree-outof-ssa.c, tree-profile.c, tree-ssa-coalesce.c, tree-ssa-ifcombine.c, tree-ssa-loop-ivopts.c, tree-ssa-loop.c, tree-ssa-reassoc.c, tree-ssa-sccvn.c, tree-vect-data-refs.c, ubsan.c, valtrack.c, var-tracking.c, varasm.c: Include memmodel.h. * genattrtab.c (write_header): Include memmodel.h in generated file. * genautomata.c (main): Likewise. * gengtype.c (open_base_files): Likewise. * genopinit.c (main): Likewise. * genconditions.c (write_header): Include memmodel.h earlier in generated file. * genemit.c (main): Likewise. * genoutput.c (output_prologue): Likewise. * genpeep.c (main): Likewise. * genpreds.c (write_insn_preds_c): Likewise. * genrecog.c (write_header): Likewise. * Makefile.in (PLUGIN_HEADERS): Include memmodel.h gcc/ada/ * gcc-interface/utils2.c: Include memmodel.h. gcc/c-family/ * c-cppbuiltin.c: Include memmodel.h. * c-opts.c: Likewise. * c-pragma.c: Likewise. * c-warn.c: Likewise. gcc/c/ * c-typeck.c: Include memmodel.h. gcc/cp/ * decl2.c: Include memmodel.h. * rtti.c: Likewise. gcc/fortran/ * trans-intrinsic.c: Include memmodel.h. gcc/go/ * go-backend.c: Include memmodel.h. libgcc/ * libgcov-profiler.c: Replace MEMMODEL_* macros by their __ATOMIC_* equivalent. * config/tilepro/atomic.c: Likewise and stop casting model to enum memmodel. From-SVN: r241121
1596 lines
46 KiB
C
1596 lines
46 KiB
C
/* IRA processing allocno lives to build allocno live ranges.
|
|
Copyright (C) 2006-2016 Free Software Foundation, Inc.
|
|
Contributed by Vladimir Makarov <vmakarov@redhat.com>.
|
|
|
|
This file is part of GCC.
|
|
|
|
GCC is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free
|
|
Software Foundation; either version 3, or (at your option) any later
|
|
version.
|
|
|
|
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GCC; see the file COPYING3. If not see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "backend.h"
|
|
#include "target.h"
|
|
#include "rtl.h"
|
|
#include "predict.h"
|
|
#include "df.h"
|
|
#include "memmodel.h"
|
|
#include "tm_p.h"
|
|
#include "insn-config.h"
|
|
#include "regs.h"
|
|
#include "ira.h"
|
|
#include "ira-int.h"
|
|
#include "sparseset.h"
|
|
|
|
/* The code in this file is similar to one in global but the code
|
|
works on the allocno basis and creates live ranges instead of
|
|
pseudo-register conflicts. */
|
|
|
|
/* Program points are enumerated by numbers from range
|
|
0..IRA_MAX_POINT-1. There are approximately two times more program
|
|
points than insns. Program points are places in the program where
|
|
liveness info can be changed. In most general case (there are more
|
|
complicated cases too) some program points correspond to places
|
|
where input operand dies and other ones correspond to places where
|
|
output operands are born. */
|
|
int ira_max_point;
|
|
|
|
/* Arrays of size IRA_MAX_POINT mapping a program point to the allocno
|
|
live ranges with given start/finish point. */
|
|
live_range_t *ira_start_point_ranges, *ira_finish_point_ranges;
|
|
|
|
/* Number of the current program point. */
|
|
static int curr_point;
|
|
|
|
/* Point where register pressure excess started or -1 if there is no
|
|
register pressure excess. Excess pressure for a register class at
|
|
some point means that there are more allocnos of given register
|
|
class living at the point than number of hard-registers of the
|
|
class available for the allocation. It is defined only for
|
|
pressure classes. */
|
|
static int high_pressure_start_point[N_REG_CLASSES];
|
|
|
|
/* Objects live at current point in the scan. */
|
|
static sparseset objects_live;
|
|
|
|
/* A temporary bitmap used in functions that wish to avoid visiting an allocno
|
|
multiple times. */
|
|
static sparseset allocnos_processed;
|
|
|
|
/* Set of hard regs (except eliminable ones) currently live. */
|
|
static HARD_REG_SET hard_regs_live;
|
|
|
|
/* The loop tree node corresponding to the current basic block. */
|
|
static ira_loop_tree_node_t curr_bb_node;
|
|
|
|
/* The number of the last processed call. */
|
|
static int last_call_num;
|
|
/* The number of last call at which given allocno was saved. */
|
|
static int *allocno_saved_at_call;
|
|
|
|
/* The value of get_preferred_alternatives for the current instruction,
|
|
supplemental to recog_data. */
|
|
static alternative_mask preferred_alternatives;
|
|
|
|
/* Record the birth of hard register REGNO, updating hard_regs_live and
|
|
hard reg conflict information for living allocnos. */
|
|
static void
|
|
make_hard_regno_born (int regno)
|
|
{
|
|
unsigned int i;
|
|
|
|
SET_HARD_REG_BIT (hard_regs_live, regno);
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, i)
|
|
{
|
|
ira_object_t obj = ira_object_id_map[i];
|
|
|
|
SET_HARD_REG_BIT (OBJECT_CONFLICT_HARD_REGS (obj), regno);
|
|
SET_HARD_REG_BIT (OBJECT_TOTAL_CONFLICT_HARD_REGS (obj), regno);
|
|
}
|
|
}
|
|
|
|
/* Process the death of hard register REGNO. This updates
|
|
hard_regs_live. */
|
|
static void
|
|
make_hard_regno_dead (int regno)
|
|
{
|
|
CLEAR_HARD_REG_BIT (hard_regs_live, regno);
|
|
}
|
|
|
|
/* Record the birth of object OBJ. Set a bit for it in objects_live,
|
|
start a new live range for it if necessary and update hard register
|
|
conflicts. */
|
|
static void
|
|
make_object_born (ira_object_t obj)
|
|
{
|
|
live_range_t lr = OBJECT_LIVE_RANGES (obj);
|
|
|
|
sparseset_set_bit (objects_live, OBJECT_CONFLICT_ID (obj));
|
|
IOR_HARD_REG_SET (OBJECT_CONFLICT_HARD_REGS (obj), hard_regs_live);
|
|
IOR_HARD_REG_SET (OBJECT_TOTAL_CONFLICT_HARD_REGS (obj), hard_regs_live);
|
|
|
|
if (lr == NULL
|
|
|| (lr->finish != curr_point && lr->finish + 1 != curr_point))
|
|
ira_add_live_range_to_object (obj, curr_point, -1);
|
|
}
|
|
|
|
/* Update ALLOCNO_EXCESS_PRESSURE_POINTS_NUM for the allocno
|
|
associated with object OBJ. */
|
|
static void
|
|
update_allocno_pressure_excess_length (ira_object_t obj)
|
|
{
|
|
ira_allocno_t a = OBJECT_ALLOCNO (obj);
|
|
int start, i;
|
|
enum reg_class aclass, pclass, cl;
|
|
live_range_t p;
|
|
|
|
aclass = ALLOCNO_CLASS (a);
|
|
pclass = ira_pressure_class_translate[aclass];
|
|
for (i = 0;
|
|
(cl = ira_reg_class_super_classes[pclass][i]) != LIM_REG_CLASSES;
|
|
i++)
|
|
{
|
|
if (! ira_reg_pressure_class_p[cl])
|
|
continue;
|
|
if (high_pressure_start_point[cl] < 0)
|
|
continue;
|
|
p = OBJECT_LIVE_RANGES (obj);
|
|
ira_assert (p != NULL);
|
|
start = (high_pressure_start_point[cl] > p->start
|
|
? high_pressure_start_point[cl] : p->start);
|
|
ALLOCNO_EXCESS_PRESSURE_POINTS_NUM (a) += curr_point - start + 1;
|
|
}
|
|
}
|
|
|
|
/* Process the death of object OBJ, which is associated with allocno
|
|
A. This finishes the current live range for it. */
|
|
static void
|
|
make_object_dead (ira_object_t obj)
|
|
{
|
|
live_range_t lr;
|
|
|
|
sparseset_clear_bit (objects_live, OBJECT_CONFLICT_ID (obj));
|
|
lr = OBJECT_LIVE_RANGES (obj);
|
|
ira_assert (lr != NULL);
|
|
lr->finish = curr_point;
|
|
update_allocno_pressure_excess_length (obj);
|
|
}
|
|
|
|
/* The current register pressures for each pressure class for the current
|
|
basic block. */
|
|
static int curr_reg_pressure[N_REG_CLASSES];
|
|
|
|
/* Record that register pressure for PCLASS increased by N registers.
|
|
Update the current register pressure, maximal register pressure for
|
|
the current BB and the start point of the register pressure
|
|
excess. */
|
|
static void
|
|
inc_register_pressure (enum reg_class pclass, int n)
|
|
{
|
|
int i;
|
|
enum reg_class cl;
|
|
|
|
for (i = 0;
|
|
(cl = ira_reg_class_super_classes[pclass][i]) != LIM_REG_CLASSES;
|
|
i++)
|
|
{
|
|
if (! ira_reg_pressure_class_p[cl])
|
|
continue;
|
|
curr_reg_pressure[cl] += n;
|
|
if (high_pressure_start_point[cl] < 0
|
|
&& (curr_reg_pressure[cl] > ira_class_hard_regs_num[cl]))
|
|
high_pressure_start_point[cl] = curr_point;
|
|
if (curr_bb_node->reg_pressure[cl] < curr_reg_pressure[cl])
|
|
curr_bb_node->reg_pressure[cl] = curr_reg_pressure[cl];
|
|
}
|
|
}
|
|
|
|
/* Record that register pressure for PCLASS has decreased by NREGS
|
|
registers; update current register pressure, start point of the
|
|
register pressure excess, and register pressure excess length for
|
|
living allocnos. */
|
|
|
|
static void
|
|
dec_register_pressure (enum reg_class pclass, int nregs)
|
|
{
|
|
int i;
|
|
unsigned int j;
|
|
enum reg_class cl;
|
|
bool set_p = false;
|
|
|
|
for (i = 0;
|
|
(cl = ira_reg_class_super_classes[pclass][i]) != LIM_REG_CLASSES;
|
|
i++)
|
|
{
|
|
if (! ira_reg_pressure_class_p[cl])
|
|
continue;
|
|
curr_reg_pressure[cl] -= nregs;
|
|
ira_assert (curr_reg_pressure[cl] >= 0);
|
|
if (high_pressure_start_point[cl] >= 0
|
|
&& curr_reg_pressure[cl] <= ira_class_hard_regs_num[cl])
|
|
set_p = true;
|
|
}
|
|
if (set_p)
|
|
{
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, j)
|
|
update_allocno_pressure_excess_length (ira_object_id_map[j]);
|
|
for (i = 0;
|
|
(cl = ira_reg_class_super_classes[pclass][i]) != LIM_REG_CLASSES;
|
|
i++)
|
|
{
|
|
if (! ira_reg_pressure_class_p[cl])
|
|
continue;
|
|
if (high_pressure_start_point[cl] >= 0
|
|
&& curr_reg_pressure[cl] <= ira_class_hard_regs_num[cl])
|
|
high_pressure_start_point[cl] = -1;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Determine from the objects_live bitmap whether REGNO is currently live,
|
|
and occupies only one object. Return false if we have no information. */
|
|
static bool
|
|
pseudo_regno_single_word_and_live_p (int regno)
|
|
{
|
|
ira_allocno_t a = ira_curr_regno_allocno_map[regno];
|
|
ira_object_t obj;
|
|
|
|
if (a == NULL)
|
|
return false;
|
|
if (ALLOCNO_NUM_OBJECTS (a) > 1)
|
|
return false;
|
|
|
|
obj = ALLOCNO_OBJECT (a, 0);
|
|
|
|
return sparseset_bit_p (objects_live, OBJECT_CONFLICT_ID (obj));
|
|
}
|
|
|
|
/* Mark the pseudo register REGNO as live. Update all information about
|
|
live ranges and register pressure. */
|
|
static void
|
|
mark_pseudo_regno_live (int regno)
|
|
{
|
|
ira_allocno_t a = ira_curr_regno_allocno_map[regno];
|
|
enum reg_class pclass;
|
|
int i, n, nregs;
|
|
|
|
if (a == NULL)
|
|
return;
|
|
|
|
/* Invalidate because it is referenced. */
|
|
allocno_saved_at_call[ALLOCNO_NUM (a)] = 0;
|
|
|
|
n = ALLOCNO_NUM_OBJECTS (a);
|
|
pclass = ira_pressure_class_translate[ALLOCNO_CLASS (a)];
|
|
nregs = ira_reg_class_max_nregs[ALLOCNO_CLASS (a)][ALLOCNO_MODE (a)];
|
|
if (n > 1)
|
|
{
|
|
/* We track every subobject separately. */
|
|
gcc_assert (nregs == n);
|
|
nregs = 1;
|
|
}
|
|
|
|
for (i = 0; i < n; i++)
|
|
{
|
|
ira_object_t obj = ALLOCNO_OBJECT (a, i);
|
|
|
|
if (sparseset_bit_p (objects_live, OBJECT_CONFLICT_ID (obj)))
|
|
continue;
|
|
|
|
inc_register_pressure (pclass, nregs);
|
|
make_object_born (obj);
|
|
}
|
|
}
|
|
|
|
/* Like mark_pseudo_regno_live, but try to only mark one subword of
|
|
the pseudo as live. SUBWORD indicates which; a value of 0
|
|
indicates the low part. */
|
|
static void
|
|
mark_pseudo_regno_subword_live (int regno, int subword)
|
|
{
|
|
ira_allocno_t a = ira_curr_regno_allocno_map[regno];
|
|
int n;
|
|
enum reg_class pclass;
|
|
ira_object_t obj;
|
|
|
|
if (a == NULL)
|
|
return;
|
|
|
|
/* Invalidate because it is referenced. */
|
|
allocno_saved_at_call[ALLOCNO_NUM (a)] = 0;
|
|
|
|
n = ALLOCNO_NUM_OBJECTS (a);
|
|
if (n == 1)
|
|
{
|
|
mark_pseudo_regno_live (regno);
|
|
return;
|
|
}
|
|
|
|
pclass = ira_pressure_class_translate[ALLOCNO_CLASS (a)];
|
|
gcc_assert
|
|
(n == ira_reg_class_max_nregs[ALLOCNO_CLASS (a)][ALLOCNO_MODE (a)]);
|
|
obj = ALLOCNO_OBJECT (a, subword);
|
|
|
|
if (sparseset_bit_p (objects_live, OBJECT_CONFLICT_ID (obj)))
|
|
return;
|
|
|
|
inc_register_pressure (pclass, 1);
|
|
make_object_born (obj);
|
|
}
|
|
|
|
/* Mark the register REG as live. Store a 1 in hard_regs_live for
|
|
this register, record how many consecutive hardware registers it
|
|
actually needs. */
|
|
static void
|
|
mark_hard_reg_live (rtx reg)
|
|
{
|
|
int regno = REGNO (reg);
|
|
|
|
if (! TEST_HARD_REG_BIT (ira_no_alloc_regs, regno))
|
|
{
|
|
int last = END_REGNO (reg);
|
|
enum reg_class aclass, pclass;
|
|
|
|
while (regno < last)
|
|
{
|
|
if (! TEST_HARD_REG_BIT (hard_regs_live, regno)
|
|
&& ! TEST_HARD_REG_BIT (eliminable_regset, regno))
|
|
{
|
|
aclass = ira_hard_regno_allocno_class[regno];
|
|
pclass = ira_pressure_class_translate[aclass];
|
|
inc_register_pressure (pclass, 1);
|
|
make_hard_regno_born (regno);
|
|
}
|
|
regno++;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Mark a pseudo, or one of its subwords, as live. REGNO is the pseudo's
|
|
register number; ORIG_REG is the access in the insn, which may be a
|
|
subreg. */
|
|
static void
|
|
mark_pseudo_reg_live (rtx orig_reg, unsigned regno)
|
|
{
|
|
if (df_read_modify_subreg_p (orig_reg))
|
|
{
|
|
mark_pseudo_regno_subword_live (regno,
|
|
subreg_lowpart_p (orig_reg) ? 0 : 1);
|
|
}
|
|
else
|
|
mark_pseudo_regno_live (regno);
|
|
}
|
|
|
|
/* Mark the register referenced by use or def REF as live. */
|
|
static void
|
|
mark_ref_live (df_ref ref)
|
|
{
|
|
rtx reg = DF_REF_REG (ref);
|
|
rtx orig_reg = reg;
|
|
|
|
if (GET_CODE (reg) == SUBREG)
|
|
reg = SUBREG_REG (reg);
|
|
|
|
if (REGNO (reg) >= FIRST_PSEUDO_REGISTER)
|
|
mark_pseudo_reg_live (orig_reg, REGNO (reg));
|
|
else
|
|
mark_hard_reg_live (reg);
|
|
}
|
|
|
|
/* Mark the pseudo register REGNO as dead. Update all information about
|
|
live ranges and register pressure. */
|
|
static void
|
|
mark_pseudo_regno_dead (int regno)
|
|
{
|
|
ira_allocno_t a = ira_curr_regno_allocno_map[regno];
|
|
int n, i, nregs;
|
|
enum reg_class cl;
|
|
|
|
if (a == NULL)
|
|
return;
|
|
|
|
/* Invalidate because it is referenced. */
|
|
allocno_saved_at_call[ALLOCNO_NUM (a)] = 0;
|
|
|
|
n = ALLOCNO_NUM_OBJECTS (a);
|
|
cl = ira_pressure_class_translate[ALLOCNO_CLASS (a)];
|
|
nregs = ira_reg_class_max_nregs[ALLOCNO_CLASS (a)][ALLOCNO_MODE (a)];
|
|
if (n > 1)
|
|
{
|
|
/* We track every subobject separately. */
|
|
gcc_assert (nregs == n);
|
|
nregs = 1;
|
|
}
|
|
for (i = 0; i < n; i++)
|
|
{
|
|
ira_object_t obj = ALLOCNO_OBJECT (a, i);
|
|
if (!sparseset_bit_p (objects_live, OBJECT_CONFLICT_ID (obj)))
|
|
continue;
|
|
|
|
dec_register_pressure (cl, nregs);
|
|
make_object_dead (obj);
|
|
}
|
|
}
|
|
|
|
/* Like mark_pseudo_regno_dead, but called when we know that only part of the
|
|
register dies. SUBWORD indicates which; a value of 0 indicates the low part. */
|
|
static void
|
|
mark_pseudo_regno_subword_dead (int regno, int subword)
|
|
{
|
|
ira_allocno_t a = ira_curr_regno_allocno_map[regno];
|
|
int n;
|
|
enum reg_class cl;
|
|
ira_object_t obj;
|
|
|
|
if (a == NULL)
|
|
return;
|
|
|
|
/* Invalidate because it is referenced. */
|
|
allocno_saved_at_call[ALLOCNO_NUM (a)] = 0;
|
|
|
|
n = ALLOCNO_NUM_OBJECTS (a);
|
|
if (n == 1)
|
|
/* The allocno as a whole doesn't die in this case. */
|
|
return;
|
|
|
|
cl = ira_pressure_class_translate[ALLOCNO_CLASS (a)];
|
|
gcc_assert
|
|
(n == ira_reg_class_max_nregs[ALLOCNO_CLASS (a)][ALLOCNO_MODE (a)]);
|
|
|
|
obj = ALLOCNO_OBJECT (a, subword);
|
|
if (!sparseset_bit_p (objects_live, OBJECT_CONFLICT_ID (obj)))
|
|
return;
|
|
|
|
dec_register_pressure (cl, 1);
|
|
make_object_dead (obj);
|
|
}
|
|
|
|
/* Mark the hard register REG as dead. Store a 0 in hard_regs_live for the
|
|
register. */
|
|
static void
|
|
mark_hard_reg_dead (rtx reg)
|
|
{
|
|
int regno = REGNO (reg);
|
|
|
|
if (! TEST_HARD_REG_BIT (ira_no_alloc_regs, regno))
|
|
{
|
|
int last = END_REGNO (reg);
|
|
enum reg_class aclass, pclass;
|
|
|
|
while (regno < last)
|
|
{
|
|
if (TEST_HARD_REG_BIT (hard_regs_live, regno))
|
|
{
|
|
aclass = ira_hard_regno_allocno_class[regno];
|
|
pclass = ira_pressure_class_translate[aclass];
|
|
dec_register_pressure (pclass, 1);
|
|
make_hard_regno_dead (regno);
|
|
}
|
|
regno++;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Mark a pseudo, or one of its subwords, as dead. REGNO is the pseudo's
|
|
register number; ORIG_REG is the access in the insn, which may be a
|
|
subreg. */
|
|
static void
|
|
mark_pseudo_reg_dead (rtx orig_reg, unsigned regno)
|
|
{
|
|
if (df_read_modify_subreg_p (orig_reg))
|
|
{
|
|
mark_pseudo_regno_subword_dead (regno,
|
|
subreg_lowpart_p (orig_reg) ? 0 : 1);
|
|
}
|
|
else
|
|
mark_pseudo_regno_dead (regno);
|
|
}
|
|
|
|
/* Mark the register referenced by definition DEF as dead, if the
|
|
definition is a total one. */
|
|
static void
|
|
mark_ref_dead (df_ref def)
|
|
{
|
|
rtx reg = DF_REF_REG (def);
|
|
rtx orig_reg = reg;
|
|
|
|
if (DF_REF_FLAGS_IS_SET (def, DF_REF_CONDITIONAL))
|
|
return;
|
|
|
|
if (GET_CODE (reg) == SUBREG)
|
|
reg = SUBREG_REG (reg);
|
|
|
|
if (DF_REF_FLAGS_IS_SET (def, DF_REF_PARTIAL)
|
|
&& (GET_CODE (orig_reg) != SUBREG
|
|
|| REGNO (reg) < FIRST_PSEUDO_REGISTER
|
|
|| !df_read_modify_subreg_p (orig_reg)))
|
|
return;
|
|
|
|
if (REGNO (reg) >= FIRST_PSEUDO_REGISTER)
|
|
mark_pseudo_reg_dead (orig_reg, REGNO (reg));
|
|
else
|
|
mark_hard_reg_dead (reg);
|
|
}
|
|
|
|
/* If REG is a pseudo or a subreg of it, and the class of its allocno
|
|
intersects CL, make a conflict with pseudo DREG. ORIG_DREG is the
|
|
rtx actually accessed, it may be identical to DREG or a subreg of it.
|
|
Advance the current program point before making the conflict if
|
|
ADVANCE_P. Return TRUE if we will need to advance the current
|
|
program point. */
|
|
static bool
|
|
make_pseudo_conflict (rtx reg, enum reg_class cl, rtx dreg, rtx orig_dreg,
|
|
bool advance_p)
|
|
{
|
|
rtx orig_reg = reg;
|
|
ira_allocno_t a;
|
|
|
|
if (GET_CODE (reg) == SUBREG)
|
|
reg = SUBREG_REG (reg);
|
|
|
|
if (! REG_P (reg) || REGNO (reg) < FIRST_PSEUDO_REGISTER)
|
|
return advance_p;
|
|
|
|
a = ira_curr_regno_allocno_map[REGNO (reg)];
|
|
if (! reg_classes_intersect_p (cl, ALLOCNO_CLASS (a)))
|
|
return advance_p;
|
|
|
|
if (advance_p)
|
|
curr_point++;
|
|
|
|
mark_pseudo_reg_live (orig_reg, REGNO (reg));
|
|
mark_pseudo_reg_live (orig_dreg, REGNO (dreg));
|
|
mark_pseudo_reg_dead (orig_reg, REGNO (reg));
|
|
mark_pseudo_reg_dead (orig_dreg, REGNO (dreg));
|
|
|
|
return false;
|
|
}
|
|
|
|
/* Check and make if necessary conflicts for pseudo DREG of class
|
|
DEF_CL of the current insn with input operand USE of class USE_CL.
|
|
ORIG_DREG is the rtx actually accessed, it may be identical to
|
|
DREG or a subreg of it. Advance the current program point before
|
|
making the conflict if ADVANCE_P. Return TRUE if we will need to
|
|
advance the current program point. */
|
|
static bool
|
|
check_and_make_def_use_conflict (rtx dreg, rtx orig_dreg,
|
|
enum reg_class def_cl, int use,
|
|
enum reg_class use_cl, bool advance_p)
|
|
{
|
|
if (! reg_classes_intersect_p (def_cl, use_cl))
|
|
return advance_p;
|
|
|
|
advance_p = make_pseudo_conflict (recog_data.operand[use],
|
|
use_cl, dreg, orig_dreg, advance_p);
|
|
|
|
/* Reload may end up swapping commutative operands, so you
|
|
have to take both orderings into account. The
|
|
constraints for the two operands can be completely
|
|
different. (Indeed, if the constraints for the two
|
|
operands are the same for all alternatives, there's no
|
|
point marking them as commutative.) */
|
|
if (use < recog_data.n_operands - 1
|
|
&& recog_data.constraints[use][0] == '%')
|
|
advance_p
|
|
= make_pseudo_conflict (recog_data.operand[use + 1],
|
|
use_cl, dreg, orig_dreg, advance_p);
|
|
if (use >= 1
|
|
&& recog_data.constraints[use - 1][0] == '%')
|
|
advance_p
|
|
= make_pseudo_conflict (recog_data.operand[use - 1],
|
|
use_cl, dreg, orig_dreg, advance_p);
|
|
return advance_p;
|
|
}
|
|
|
|
/* Check and make if necessary conflicts for definition DEF of class
|
|
DEF_CL of the current insn with input operands. Process only
|
|
constraints of alternative ALT. */
|
|
static void
|
|
check_and_make_def_conflict (int alt, int def, enum reg_class def_cl)
|
|
{
|
|
int use, use_match;
|
|
ira_allocno_t a;
|
|
enum reg_class use_cl, acl;
|
|
bool advance_p;
|
|
rtx dreg = recog_data.operand[def];
|
|
rtx orig_dreg = dreg;
|
|
|
|
if (def_cl == NO_REGS)
|
|
return;
|
|
|
|
if (GET_CODE (dreg) == SUBREG)
|
|
dreg = SUBREG_REG (dreg);
|
|
|
|
if (! REG_P (dreg) || REGNO (dreg) < FIRST_PSEUDO_REGISTER)
|
|
return;
|
|
|
|
a = ira_curr_regno_allocno_map[REGNO (dreg)];
|
|
acl = ALLOCNO_CLASS (a);
|
|
if (! reg_classes_intersect_p (acl, def_cl))
|
|
return;
|
|
|
|
advance_p = true;
|
|
|
|
int n_operands = recog_data.n_operands;
|
|
const operand_alternative *op_alt = &recog_op_alt[alt * n_operands];
|
|
for (use = 0; use < n_operands; use++)
|
|
{
|
|
int alt1;
|
|
|
|
if (use == def || recog_data.operand_type[use] == OP_OUT)
|
|
continue;
|
|
|
|
if (op_alt[use].anything_ok)
|
|
use_cl = ALL_REGS;
|
|
else
|
|
use_cl = op_alt[use].cl;
|
|
|
|
/* If there's any alternative that allows USE to match DEF, do not
|
|
record a conflict. If that causes us to create an invalid
|
|
instruction due to the earlyclobber, reload must fix it up. */
|
|
for (alt1 = 0; alt1 < recog_data.n_alternatives; alt1++)
|
|
{
|
|
if (!TEST_BIT (preferred_alternatives, alt1))
|
|
continue;
|
|
const operand_alternative *op_alt1
|
|
= &recog_op_alt[alt1 * n_operands];
|
|
if (op_alt1[use].matches == def
|
|
|| (use < n_operands - 1
|
|
&& recog_data.constraints[use][0] == '%'
|
|
&& op_alt1[use + 1].matches == def)
|
|
|| (use >= 1
|
|
&& recog_data.constraints[use - 1][0] == '%'
|
|
&& op_alt1[use - 1].matches == def))
|
|
break;
|
|
}
|
|
|
|
if (alt1 < recog_data.n_alternatives)
|
|
continue;
|
|
|
|
advance_p = check_and_make_def_use_conflict (dreg, orig_dreg, def_cl,
|
|
use, use_cl, advance_p);
|
|
|
|
if ((use_match = op_alt[use].matches) >= 0)
|
|
{
|
|
if (use_match == def)
|
|
continue;
|
|
|
|
if (op_alt[use_match].anything_ok)
|
|
use_cl = ALL_REGS;
|
|
else
|
|
use_cl = op_alt[use_match].cl;
|
|
advance_p = check_and_make_def_use_conflict (dreg, orig_dreg, def_cl,
|
|
use, use_cl, advance_p);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Make conflicts of early clobber pseudo registers of the current
|
|
insn with its inputs. Avoid introducing unnecessary conflicts by
|
|
checking classes of the constraints and pseudos because otherwise
|
|
significant code degradation is possible for some targets. */
|
|
static void
|
|
make_early_clobber_and_input_conflicts (void)
|
|
{
|
|
int alt;
|
|
int def, def_match;
|
|
enum reg_class def_cl;
|
|
|
|
int n_alternatives = recog_data.n_alternatives;
|
|
int n_operands = recog_data.n_operands;
|
|
const operand_alternative *op_alt = recog_op_alt;
|
|
for (alt = 0; alt < n_alternatives; alt++, op_alt += n_operands)
|
|
if (TEST_BIT (preferred_alternatives, alt))
|
|
for (def = 0; def < n_operands; def++)
|
|
{
|
|
def_cl = NO_REGS;
|
|
if (op_alt[def].earlyclobber)
|
|
{
|
|
if (op_alt[def].anything_ok)
|
|
def_cl = ALL_REGS;
|
|
else
|
|
def_cl = op_alt[def].cl;
|
|
check_and_make_def_conflict (alt, def, def_cl);
|
|
}
|
|
if ((def_match = op_alt[def].matches) >= 0
|
|
&& (op_alt[def_match].earlyclobber
|
|
|| op_alt[def].earlyclobber))
|
|
{
|
|
if (op_alt[def_match].anything_ok)
|
|
def_cl = ALL_REGS;
|
|
else
|
|
def_cl = op_alt[def_match].cl;
|
|
check_and_make_def_conflict (alt, def, def_cl);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Mark early clobber hard registers of the current INSN as live (if
|
|
LIVE_P) or dead. Return true if there are such registers. */
|
|
static bool
|
|
mark_hard_reg_early_clobbers (rtx_insn *insn, bool live_p)
|
|
{
|
|
df_ref def;
|
|
bool set_p = false;
|
|
|
|
FOR_EACH_INSN_DEF (def, insn)
|
|
if (DF_REF_FLAGS_IS_SET (def, DF_REF_MUST_CLOBBER))
|
|
{
|
|
rtx dreg = DF_REF_REG (def);
|
|
|
|
if (GET_CODE (dreg) == SUBREG)
|
|
dreg = SUBREG_REG (dreg);
|
|
if (! REG_P (dreg) || REGNO (dreg) >= FIRST_PSEUDO_REGISTER)
|
|
continue;
|
|
|
|
/* Hard register clobbers are believed to be early clobber
|
|
because there is no way to say that non-operand hard
|
|
register clobbers are not early ones. */
|
|
if (live_p)
|
|
mark_ref_live (def);
|
|
else
|
|
mark_ref_dead (def);
|
|
set_p = true;
|
|
}
|
|
|
|
return set_p;
|
|
}
|
|
|
|
/* Checks that CONSTRAINTS permits to use only one hard register. If
|
|
it is so, the function returns the class of the hard register.
|
|
Otherwise it returns NO_REGS. */
|
|
static enum reg_class
|
|
single_reg_class (const char *constraints, rtx op, rtx equiv_const)
|
|
{
|
|
int c;
|
|
enum reg_class cl, next_cl;
|
|
enum constraint_num cn;
|
|
|
|
cl = NO_REGS;
|
|
alternative_mask preferred = preferred_alternatives;
|
|
for (; (c = *constraints); constraints += CONSTRAINT_LEN (c, constraints))
|
|
if (c == '#')
|
|
preferred &= ~ALTERNATIVE_BIT (0);
|
|
else if (c == ',')
|
|
preferred >>= 1;
|
|
else if (preferred & 1)
|
|
switch (c)
|
|
{
|
|
case 'g':
|
|
return NO_REGS;
|
|
|
|
default:
|
|
/* ??? Is this the best way to handle memory constraints? */
|
|
cn = lookup_constraint (constraints);
|
|
if (insn_extra_memory_constraint (cn)
|
|
|| insn_extra_special_memory_constraint (cn)
|
|
|| insn_extra_address_constraint (cn))
|
|
return NO_REGS;
|
|
if (constraint_satisfied_p (op, cn)
|
|
|| (equiv_const != NULL_RTX
|
|
&& CONSTANT_P (equiv_const)
|
|
&& constraint_satisfied_p (equiv_const, cn)))
|
|
return NO_REGS;
|
|
next_cl = reg_class_for_constraint (cn);
|
|
if (next_cl == NO_REGS)
|
|
break;
|
|
if (cl == NO_REGS
|
|
? ira_class_singleton[next_cl][GET_MODE (op)] < 0
|
|
: (ira_class_singleton[cl][GET_MODE (op)]
|
|
!= ira_class_singleton[next_cl][GET_MODE (op)]))
|
|
return NO_REGS;
|
|
cl = next_cl;
|
|
break;
|
|
|
|
case '0': case '1': case '2': case '3': case '4':
|
|
case '5': case '6': case '7': case '8': case '9':
|
|
next_cl
|
|
= single_reg_class (recog_data.constraints[c - '0'],
|
|
recog_data.operand[c - '0'], NULL_RTX);
|
|
if (cl == NO_REGS
|
|
? ira_class_singleton[next_cl][GET_MODE (op)] < 0
|
|
: (ira_class_singleton[cl][GET_MODE (op)]
|
|
!= ira_class_singleton[next_cl][GET_MODE (op)]))
|
|
return NO_REGS;
|
|
cl = next_cl;
|
|
break;
|
|
}
|
|
return cl;
|
|
}
|
|
|
|
/* The function checks that operand OP_NUM of the current insn can use
|
|
only one hard register. If it is so, the function returns the
|
|
class of the hard register. Otherwise it returns NO_REGS. */
|
|
static enum reg_class
|
|
single_reg_operand_class (int op_num)
|
|
{
|
|
if (op_num < 0 || recog_data.n_alternatives == 0)
|
|
return NO_REGS;
|
|
return single_reg_class (recog_data.constraints[op_num],
|
|
recog_data.operand[op_num], NULL_RTX);
|
|
}
|
|
|
|
/* The function sets up hard register set *SET to hard registers which
|
|
might be used by insn reloads because the constraints are too
|
|
strict. */
|
|
void
|
|
ira_implicitly_set_insn_hard_regs (HARD_REG_SET *set,
|
|
alternative_mask preferred)
|
|
{
|
|
int i, c, regno = 0;
|
|
enum reg_class cl;
|
|
rtx op;
|
|
machine_mode mode;
|
|
|
|
CLEAR_HARD_REG_SET (*set);
|
|
for (i = 0; i < recog_data.n_operands; i++)
|
|
{
|
|
op = recog_data.operand[i];
|
|
|
|
if (GET_CODE (op) == SUBREG)
|
|
op = SUBREG_REG (op);
|
|
|
|
if (GET_CODE (op) == SCRATCH
|
|
|| (REG_P (op) && (regno = REGNO (op)) >= FIRST_PSEUDO_REGISTER))
|
|
{
|
|
const char *p = recog_data.constraints[i];
|
|
|
|
mode = (GET_CODE (op) == SCRATCH
|
|
? GET_MODE (op) : PSEUDO_REGNO_MODE (regno));
|
|
cl = NO_REGS;
|
|
for (; (c = *p); p += CONSTRAINT_LEN (c, p))
|
|
if (c == '#')
|
|
preferred &= ~ALTERNATIVE_BIT (0);
|
|
else if (c == ',')
|
|
preferred >>= 1;
|
|
else if (preferred & 1)
|
|
{
|
|
cl = reg_class_for_constraint (lookup_constraint (p));
|
|
if (cl != NO_REGS)
|
|
{
|
|
/* There is no register pressure problem if all of the
|
|
regs in this class are fixed. */
|
|
int regno = ira_class_singleton[cl][mode];
|
|
if (regno >= 0)
|
|
add_to_hard_reg_set (set, mode, regno);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
/* Processes input operands, if IN_P, or output operands otherwise of
|
|
the current insn with FREQ to find allocno which can use only one
|
|
hard register and makes other currently living allocnos conflicting
|
|
with the hard register. */
|
|
static void
|
|
process_single_reg_class_operands (bool in_p, int freq)
|
|
{
|
|
int i, regno;
|
|
unsigned int px;
|
|
enum reg_class cl;
|
|
rtx operand;
|
|
ira_allocno_t operand_a, a;
|
|
|
|
for (i = 0; i < recog_data.n_operands; i++)
|
|
{
|
|
operand = recog_data.operand[i];
|
|
if (in_p && recog_data.operand_type[i] != OP_IN
|
|
&& recog_data.operand_type[i] != OP_INOUT)
|
|
continue;
|
|
if (! in_p && recog_data.operand_type[i] != OP_OUT
|
|
&& recog_data.operand_type[i] != OP_INOUT)
|
|
continue;
|
|
cl = single_reg_operand_class (i);
|
|
if (cl == NO_REGS)
|
|
continue;
|
|
|
|
operand_a = NULL;
|
|
|
|
if (GET_CODE (operand) == SUBREG)
|
|
operand = SUBREG_REG (operand);
|
|
|
|
if (REG_P (operand)
|
|
&& (regno = REGNO (operand)) >= FIRST_PSEUDO_REGISTER)
|
|
{
|
|
enum reg_class aclass;
|
|
|
|
operand_a = ira_curr_regno_allocno_map[regno];
|
|
aclass = ALLOCNO_CLASS (operand_a);
|
|
if (ira_class_subset_p[cl][aclass])
|
|
{
|
|
/* View the desired allocation of OPERAND as:
|
|
|
|
(REG:YMODE YREGNO),
|
|
|
|
a simplification of:
|
|
|
|
(subreg:YMODE (reg:XMODE XREGNO) OFFSET). */
|
|
machine_mode ymode, xmode;
|
|
int xregno, yregno;
|
|
HOST_WIDE_INT offset;
|
|
|
|
xmode = recog_data.operand_mode[i];
|
|
xregno = ira_class_singleton[cl][xmode];
|
|
gcc_assert (xregno >= 0);
|
|
ymode = ALLOCNO_MODE (operand_a);
|
|
offset = subreg_lowpart_offset (ymode, xmode);
|
|
yregno = simplify_subreg_regno (xregno, xmode, offset, ymode);
|
|
if (yregno >= 0
|
|
&& ira_class_hard_reg_index[aclass][yregno] >= 0)
|
|
{
|
|
int cost;
|
|
|
|
ira_allocate_and_set_costs
|
|
(&ALLOCNO_CONFLICT_HARD_REG_COSTS (operand_a),
|
|
aclass, 0);
|
|
ira_init_register_move_cost_if_necessary (xmode);
|
|
cost = freq * (in_p
|
|
? ira_register_move_cost[xmode][aclass][cl]
|
|
: ira_register_move_cost[xmode][cl][aclass]);
|
|
ALLOCNO_CONFLICT_HARD_REG_COSTS (operand_a)
|
|
[ira_class_hard_reg_index[aclass][yregno]] -= cost;
|
|
}
|
|
}
|
|
}
|
|
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, px)
|
|
{
|
|
ira_object_t obj = ira_object_id_map[px];
|
|
a = OBJECT_ALLOCNO (obj);
|
|
if (a != operand_a)
|
|
{
|
|
/* We could increase costs of A instead of making it
|
|
conflicting with the hard register. But it works worse
|
|
because it will be spilled in reload in anyway. */
|
|
IOR_HARD_REG_SET (OBJECT_CONFLICT_HARD_REGS (obj),
|
|
reg_class_contents[cl]);
|
|
IOR_HARD_REG_SET (OBJECT_TOTAL_CONFLICT_HARD_REGS (obj),
|
|
reg_class_contents[cl]);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Look through the CALL_INSN_FUNCTION_USAGE of a call insn INSN, and see if
|
|
we find a SET rtx that we can use to deduce that a register can be cheaply
|
|
caller-saved. Return such a register, or NULL_RTX if none is found. */
|
|
static rtx
|
|
find_call_crossed_cheap_reg (rtx_insn *insn)
|
|
{
|
|
rtx cheap_reg = NULL_RTX;
|
|
rtx exp = CALL_INSN_FUNCTION_USAGE (insn);
|
|
|
|
while (exp != NULL)
|
|
{
|
|
rtx x = XEXP (exp, 0);
|
|
if (GET_CODE (x) == SET)
|
|
{
|
|
exp = x;
|
|
break;
|
|
}
|
|
exp = XEXP (exp, 1);
|
|
}
|
|
if (exp != NULL)
|
|
{
|
|
basic_block bb = BLOCK_FOR_INSN (insn);
|
|
rtx reg = SET_SRC (exp);
|
|
rtx_insn *prev = PREV_INSN (insn);
|
|
while (prev && !(INSN_P (prev)
|
|
&& BLOCK_FOR_INSN (prev) != bb))
|
|
{
|
|
if (NONDEBUG_INSN_P (prev))
|
|
{
|
|
rtx set = single_set (prev);
|
|
|
|
if (set && rtx_equal_p (SET_DEST (set), reg))
|
|
{
|
|
rtx src = SET_SRC (set);
|
|
if (!REG_P (src) || HARD_REGISTER_P (src)
|
|
|| !pseudo_regno_single_word_and_live_p (REGNO (src)))
|
|
break;
|
|
if (!modified_between_p (src, prev, insn))
|
|
cheap_reg = src;
|
|
break;
|
|
}
|
|
if (set && rtx_equal_p (SET_SRC (set), reg))
|
|
{
|
|
rtx dest = SET_DEST (set);
|
|
if (!REG_P (dest) || HARD_REGISTER_P (dest)
|
|
|| !pseudo_regno_single_word_and_live_p (REGNO (dest)))
|
|
break;
|
|
if (!modified_between_p (dest, prev, insn))
|
|
cheap_reg = dest;
|
|
break;
|
|
}
|
|
|
|
if (reg_set_p (reg, prev))
|
|
break;
|
|
}
|
|
prev = PREV_INSN (prev);
|
|
}
|
|
}
|
|
return cheap_reg;
|
|
}
|
|
|
|
/* Process insns of the basic block given by its LOOP_TREE_NODE to
|
|
update allocno live ranges, allocno hard register conflicts,
|
|
intersected calls, and register pressure info for allocnos for the
|
|
basic block for and regions containing the basic block. */
|
|
static void
|
|
process_bb_node_lives (ira_loop_tree_node_t loop_tree_node)
|
|
{
|
|
int i, freq;
|
|
unsigned int j;
|
|
basic_block bb;
|
|
rtx_insn *insn;
|
|
bitmap_iterator bi;
|
|
bitmap reg_live_out;
|
|
unsigned int px;
|
|
bool set_p;
|
|
|
|
bb = loop_tree_node->bb;
|
|
if (bb != NULL)
|
|
{
|
|
for (i = 0; i < ira_pressure_classes_num; i++)
|
|
{
|
|
curr_reg_pressure[ira_pressure_classes[i]] = 0;
|
|
high_pressure_start_point[ira_pressure_classes[i]] = -1;
|
|
}
|
|
curr_bb_node = loop_tree_node;
|
|
reg_live_out = df_get_live_out (bb);
|
|
sparseset_clear (objects_live);
|
|
REG_SET_TO_HARD_REG_SET (hard_regs_live, reg_live_out);
|
|
AND_COMPL_HARD_REG_SET (hard_regs_live, eliminable_regset);
|
|
AND_COMPL_HARD_REG_SET (hard_regs_live, ira_no_alloc_regs);
|
|
for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
|
|
if (TEST_HARD_REG_BIT (hard_regs_live, i))
|
|
{
|
|
enum reg_class aclass, pclass, cl;
|
|
|
|
aclass = ira_allocno_class_translate[REGNO_REG_CLASS (i)];
|
|
pclass = ira_pressure_class_translate[aclass];
|
|
for (j = 0;
|
|
(cl = ira_reg_class_super_classes[pclass][j])
|
|
!= LIM_REG_CLASSES;
|
|
j++)
|
|
{
|
|
if (! ira_reg_pressure_class_p[cl])
|
|
continue;
|
|
curr_reg_pressure[cl]++;
|
|
if (curr_bb_node->reg_pressure[cl] < curr_reg_pressure[cl])
|
|
curr_bb_node->reg_pressure[cl] = curr_reg_pressure[cl];
|
|
ira_assert (curr_reg_pressure[cl]
|
|
<= ira_class_hard_regs_num[cl]);
|
|
}
|
|
}
|
|
EXECUTE_IF_SET_IN_BITMAP (reg_live_out, FIRST_PSEUDO_REGISTER, j, bi)
|
|
mark_pseudo_regno_live (j);
|
|
|
|
freq = REG_FREQ_FROM_BB (bb);
|
|
if (freq == 0)
|
|
freq = 1;
|
|
|
|
/* Invalidate all allocno_saved_at_call entries. */
|
|
last_call_num++;
|
|
|
|
/* Scan the code of this basic block, noting which allocnos and
|
|
hard regs are born or die.
|
|
|
|
Note that this loop treats uninitialized values as live until
|
|
the beginning of the block. For example, if an instruction
|
|
uses (reg:DI foo), and only (subreg:SI (reg:DI foo) 0) is ever
|
|
set, FOO will remain live until the beginning of the block.
|
|
Likewise if FOO is not set at all. This is unnecessarily
|
|
pessimistic, but it probably doesn't matter much in practice. */
|
|
FOR_BB_INSNS_REVERSE (bb, insn)
|
|
{
|
|
ira_allocno_t a;
|
|
df_ref def, use;
|
|
bool call_p;
|
|
|
|
if (!NONDEBUG_INSN_P (insn))
|
|
continue;
|
|
|
|
if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL)
|
|
fprintf (ira_dump_file, " Insn %u(l%d): point = %d\n",
|
|
INSN_UID (insn), loop_tree_node->parent->loop_num,
|
|
curr_point);
|
|
|
|
call_p = CALL_P (insn);
|
|
#ifdef REAL_PIC_OFFSET_TABLE_REGNUM
|
|
int regno;
|
|
bool clear_pic_use_conflict_p = false;
|
|
/* Processing insn usage in call insn can create conflict
|
|
with pic pseudo and pic hard reg and that is wrong.
|
|
Check this situation and fix it at the end of the insn
|
|
processing. */
|
|
if (call_p && pic_offset_table_rtx != NULL_RTX
|
|
&& (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
|
|
&& (a = ira_curr_regno_allocno_map[regno]) != NULL)
|
|
clear_pic_use_conflict_p
|
|
= (find_regno_fusage (insn, USE, REAL_PIC_OFFSET_TABLE_REGNUM)
|
|
&& ! TEST_HARD_REG_BIT (OBJECT_CONFLICT_HARD_REGS
|
|
(ALLOCNO_OBJECT (a, 0)),
|
|
REAL_PIC_OFFSET_TABLE_REGNUM));
|
|
#endif
|
|
|
|
/* Mark each defined value as live. We need to do this for
|
|
unused values because they still conflict with quantities
|
|
that are live at the time of the definition.
|
|
|
|
Ignore DF_REF_MAY_CLOBBERs on a call instruction. Such
|
|
references represent the effect of the called function
|
|
on a call-clobbered register. Marking the register as
|
|
live would stop us from allocating it to a call-crossing
|
|
allocno. */
|
|
FOR_EACH_INSN_DEF (def, insn)
|
|
if (!call_p || !DF_REF_FLAGS_IS_SET (def, DF_REF_MAY_CLOBBER))
|
|
mark_ref_live (def);
|
|
|
|
/* If INSN has multiple outputs, then any value used in one
|
|
of the outputs conflicts with the other outputs. Model this
|
|
by making the used value live during the output phase.
|
|
|
|
It is unsafe to use !single_set here since it will ignore
|
|
an unused output. Just because an output is unused does
|
|
not mean the compiler can assume the side effect will not
|
|
occur. Consider if ALLOCNO appears in the address of an
|
|
output and we reload the output. If we allocate ALLOCNO
|
|
to the same hard register as an unused output we could
|
|
set the hard register before the output reload insn. */
|
|
if (GET_CODE (PATTERN (insn)) == PARALLEL && multiple_sets (insn))
|
|
FOR_EACH_INSN_USE (use, insn)
|
|
{
|
|
int i;
|
|
rtx reg;
|
|
|
|
reg = DF_REF_REG (use);
|
|
for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
|
|
{
|
|
rtx set;
|
|
|
|
set = XVECEXP (PATTERN (insn), 0, i);
|
|
if (GET_CODE (set) == SET
|
|
&& reg_overlap_mentioned_p (reg, SET_DEST (set)))
|
|
{
|
|
/* After the previous loop, this is a no-op if
|
|
REG is contained within SET_DEST (SET). */
|
|
mark_ref_live (use);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
extract_insn (insn);
|
|
preferred_alternatives = get_preferred_alternatives (insn);
|
|
preprocess_constraints (insn);
|
|
process_single_reg_class_operands (false, freq);
|
|
|
|
/* See which defined values die here. */
|
|
FOR_EACH_INSN_DEF (def, insn)
|
|
if (!call_p || !DF_REF_FLAGS_IS_SET (def, DF_REF_MAY_CLOBBER))
|
|
mark_ref_dead (def);
|
|
|
|
if (call_p)
|
|
{
|
|
/* Try to find a SET in the CALL_INSN_FUNCTION_USAGE, and from
|
|
there, try to find a pseudo that is live across the call but
|
|
can be cheaply reconstructed from the return value. */
|
|
rtx cheap_reg = find_call_crossed_cheap_reg (insn);
|
|
if (cheap_reg != NULL_RTX)
|
|
add_reg_note (insn, REG_RETURNED, cheap_reg);
|
|
|
|
last_call_num++;
|
|
sparseset_clear (allocnos_processed);
|
|
/* The current set of live allocnos are live across the call. */
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, i)
|
|
{
|
|
ira_object_t obj = ira_object_id_map[i];
|
|
a = OBJECT_ALLOCNO (obj);
|
|
int num = ALLOCNO_NUM (a);
|
|
HARD_REG_SET this_call_used_reg_set;
|
|
|
|
get_call_reg_set_usage (insn, &this_call_used_reg_set,
|
|
call_used_reg_set);
|
|
|
|
/* Don't allocate allocnos that cross setjmps or any
|
|
call, if this function receives a nonlocal
|
|
goto. */
|
|
if (cfun->has_nonlocal_label
|
|
|| find_reg_note (insn, REG_SETJMP,
|
|
NULL_RTX) != NULL_RTX)
|
|
{
|
|
SET_HARD_REG_SET (OBJECT_CONFLICT_HARD_REGS (obj));
|
|
SET_HARD_REG_SET (OBJECT_TOTAL_CONFLICT_HARD_REGS (obj));
|
|
}
|
|
if (can_throw_internal (insn))
|
|
{
|
|
IOR_HARD_REG_SET (OBJECT_CONFLICT_HARD_REGS (obj),
|
|
this_call_used_reg_set);
|
|
IOR_HARD_REG_SET (OBJECT_TOTAL_CONFLICT_HARD_REGS (obj),
|
|
this_call_used_reg_set);
|
|
}
|
|
|
|
if (sparseset_bit_p (allocnos_processed, num))
|
|
continue;
|
|
sparseset_set_bit (allocnos_processed, num);
|
|
|
|
if (allocno_saved_at_call[num] != last_call_num)
|
|
/* Here we are mimicking caller-save.c behavior
|
|
which does not save hard register at a call if
|
|
it was saved on previous call in the same basic
|
|
block and the hard register was not mentioned
|
|
between the two calls. */
|
|
ALLOCNO_CALL_FREQ (a) += freq;
|
|
/* Mark it as saved at the next call. */
|
|
allocno_saved_at_call[num] = last_call_num + 1;
|
|
ALLOCNO_CALLS_CROSSED_NUM (a)++;
|
|
IOR_HARD_REG_SET (ALLOCNO_CROSSED_CALLS_CLOBBERED_REGS (a),
|
|
this_call_used_reg_set);
|
|
if (cheap_reg != NULL_RTX
|
|
&& ALLOCNO_REGNO (a) == (int) REGNO (cheap_reg))
|
|
ALLOCNO_CHEAP_CALLS_CROSSED_NUM (a)++;
|
|
}
|
|
}
|
|
|
|
make_early_clobber_and_input_conflicts ();
|
|
|
|
curr_point++;
|
|
|
|
/* Mark each used value as live. */
|
|
FOR_EACH_INSN_USE (use, insn)
|
|
mark_ref_live (use);
|
|
|
|
process_single_reg_class_operands (true, freq);
|
|
|
|
set_p = mark_hard_reg_early_clobbers (insn, true);
|
|
|
|
if (set_p)
|
|
{
|
|
mark_hard_reg_early_clobbers (insn, false);
|
|
|
|
/* Mark each hard reg as live again. For example, a
|
|
hard register can be in clobber and in an insn
|
|
input. */
|
|
FOR_EACH_INSN_USE (use, insn)
|
|
{
|
|
rtx ureg = DF_REF_REG (use);
|
|
|
|
if (GET_CODE (ureg) == SUBREG)
|
|
ureg = SUBREG_REG (ureg);
|
|
if (! REG_P (ureg) || REGNO (ureg) >= FIRST_PSEUDO_REGISTER)
|
|
continue;
|
|
|
|
mark_ref_live (use);
|
|
}
|
|
}
|
|
|
|
#ifdef REAL_PIC_OFFSET_TABLE_REGNUM
|
|
if (clear_pic_use_conflict_p)
|
|
{
|
|
regno = REGNO (pic_offset_table_rtx);
|
|
a = ira_curr_regno_allocno_map[regno];
|
|
CLEAR_HARD_REG_BIT (OBJECT_CONFLICT_HARD_REGS (ALLOCNO_OBJECT (a, 0)),
|
|
REAL_PIC_OFFSET_TABLE_REGNUM);
|
|
CLEAR_HARD_REG_BIT (OBJECT_TOTAL_CONFLICT_HARD_REGS
|
|
(ALLOCNO_OBJECT (a, 0)),
|
|
REAL_PIC_OFFSET_TABLE_REGNUM);
|
|
}
|
|
#endif
|
|
curr_point++;
|
|
}
|
|
|
|
if (bb_has_eh_pred (bb))
|
|
for (j = 0; ; ++j)
|
|
{
|
|
unsigned int regno = EH_RETURN_DATA_REGNO (j);
|
|
if (regno == INVALID_REGNUM)
|
|
break;
|
|
make_hard_regno_born (regno);
|
|
}
|
|
|
|
/* Allocnos can't go in stack regs at the start of a basic block
|
|
that is reached by an abnormal edge. Likewise for call
|
|
clobbered regs, because caller-save, fixup_abnormal_edges and
|
|
possibly the table driven EH machinery are not quite ready to
|
|
handle such allocnos live across such edges. */
|
|
if (bb_has_abnormal_pred (bb))
|
|
{
|
|
#ifdef STACK_REGS
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, px)
|
|
{
|
|
ira_allocno_t a = OBJECT_ALLOCNO (ira_object_id_map[px]);
|
|
|
|
ALLOCNO_NO_STACK_REG_P (a) = true;
|
|
ALLOCNO_TOTAL_NO_STACK_REG_P (a) = true;
|
|
}
|
|
for (px = FIRST_STACK_REG; px <= LAST_STACK_REG; px++)
|
|
make_hard_regno_born (px);
|
|
#endif
|
|
/* No need to record conflicts for call clobbered regs if we
|
|
have nonlocal labels around, as we don't ever try to
|
|
allocate such regs in this case. */
|
|
if (!cfun->has_nonlocal_label
|
|
&& has_abnormal_call_or_eh_pred_edge_p (bb))
|
|
for (px = 0; px < FIRST_PSEUDO_REGISTER; px++)
|
|
if (call_used_regs[px]
|
|
#ifdef REAL_PIC_OFFSET_TABLE_REGNUM
|
|
/* We should create a conflict of PIC pseudo with
|
|
PIC hard reg as PIC hard reg can have a wrong
|
|
value after jump described by the abnormal edge.
|
|
In this case we can not allocate PIC hard reg to
|
|
PIC pseudo as PIC pseudo will also have a wrong
|
|
value. This code is not critical as LRA can fix
|
|
it but it is better to have the right allocation
|
|
earlier. */
|
|
|| (px == REAL_PIC_OFFSET_TABLE_REGNUM
|
|
&& pic_offset_table_rtx != NULL_RTX
|
|
&& REGNO (pic_offset_table_rtx) >= FIRST_PSEUDO_REGISTER)
|
|
#endif
|
|
)
|
|
make_hard_regno_born (px);
|
|
}
|
|
|
|
EXECUTE_IF_SET_IN_SPARSESET (objects_live, i)
|
|
make_object_dead (ira_object_id_map[i]);
|
|
|
|
curr_point++;
|
|
|
|
}
|
|
/* Propagate register pressure to upper loop tree nodes. */
|
|
if (loop_tree_node != ira_loop_tree_root)
|
|
for (i = 0; i < ira_pressure_classes_num; i++)
|
|
{
|
|
enum reg_class pclass;
|
|
|
|
pclass = ira_pressure_classes[i];
|
|
if (loop_tree_node->reg_pressure[pclass]
|
|
> loop_tree_node->parent->reg_pressure[pclass])
|
|
loop_tree_node->parent->reg_pressure[pclass]
|
|
= loop_tree_node->reg_pressure[pclass];
|
|
}
|
|
}
|
|
|
|
/* Create and set up IRA_START_POINT_RANGES and
|
|
IRA_FINISH_POINT_RANGES. */
|
|
static void
|
|
create_start_finish_chains (void)
|
|
{
|
|
ira_object_t obj;
|
|
ira_object_iterator oi;
|
|
live_range_t r;
|
|
|
|
ira_start_point_ranges
|
|
= (live_range_t *) ira_allocate (ira_max_point * sizeof (live_range_t));
|
|
memset (ira_start_point_ranges, 0, ira_max_point * sizeof (live_range_t));
|
|
ira_finish_point_ranges
|
|
= (live_range_t *) ira_allocate (ira_max_point * sizeof (live_range_t));
|
|
memset (ira_finish_point_ranges, 0, ira_max_point * sizeof (live_range_t));
|
|
FOR_EACH_OBJECT (obj, oi)
|
|
for (r = OBJECT_LIVE_RANGES (obj); r != NULL; r = r->next)
|
|
{
|
|
r->start_next = ira_start_point_ranges[r->start];
|
|
ira_start_point_ranges[r->start] = r;
|
|
r->finish_next = ira_finish_point_ranges[r->finish];
|
|
ira_finish_point_ranges[r->finish] = r;
|
|
}
|
|
}
|
|
|
|
/* Rebuild IRA_START_POINT_RANGES and IRA_FINISH_POINT_RANGES after
|
|
new live ranges and program points were added as a result if new
|
|
insn generation. */
|
|
void
|
|
ira_rebuild_start_finish_chains (void)
|
|
{
|
|
ira_free (ira_finish_point_ranges);
|
|
ira_free (ira_start_point_ranges);
|
|
create_start_finish_chains ();
|
|
}
|
|
|
|
/* Compress allocno live ranges by removing program points where
|
|
nothing happens. */
|
|
static void
|
|
remove_some_program_points_and_update_live_ranges (void)
|
|
{
|
|
unsigned i;
|
|
int n;
|
|
int *map;
|
|
ira_object_t obj;
|
|
ira_object_iterator oi;
|
|
live_range_t r, prev_r, next_r;
|
|
sbitmap_iterator sbi;
|
|
bool born_p, dead_p, prev_born_p, prev_dead_p;
|
|
|
|
auto_sbitmap born (ira_max_point);
|
|
auto_sbitmap dead (ira_max_point);
|
|
bitmap_clear (born);
|
|
bitmap_clear (dead);
|
|
FOR_EACH_OBJECT (obj, oi)
|
|
for (r = OBJECT_LIVE_RANGES (obj); r != NULL; r = r->next)
|
|
{
|
|
ira_assert (r->start <= r->finish);
|
|
bitmap_set_bit (born, r->start);
|
|
bitmap_set_bit (dead, r->finish);
|
|
}
|
|
|
|
auto_sbitmap born_or_dead (ira_max_point);
|
|
bitmap_ior (born_or_dead, born, dead);
|
|
map = (int *) ira_allocate (sizeof (int) * ira_max_point);
|
|
n = -1;
|
|
prev_born_p = prev_dead_p = false;
|
|
EXECUTE_IF_SET_IN_BITMAP (born_or_dead, 0, i, sbi)
|
|
{
|
|
born_p = bitmap_bit_p (born, i);
|
|
dead_p = bitmap_bit_p (dead, i);
|
|
if ((prev_born_p && ! prev_dead_p && born_p && ! dead_p)
|
|
|| (prev_dead_p && ! prev_born_p && dead_p && ! born_p))
|
|
map[i] = n;
|
|
else
|
|
map[i] = ++n;
|
|
prev_born_p = born_p;
|
|
prev_dead_p = dead_p;
|
|
}
|
|
|
|
n++;
|
|
if (internal_flag_ira_verbose > 1 && ira_dump_file != NULL)
|
|
fprintf (ira_dump_file, "Compressing live ranges: from %d to %d - %d%%\n",
|
|
ira_max_point, n, 100 * n / ira_max_point);
|
|
ira_max_point = n;
|
|
|
|
FOR_EACH_OBJECT (obj, oi)
|
|
for (r = OBJECT_LIVE_RANGES (obj), prev_r = NULL; r != NULL; r = next_r)
|
|
{
|
|
next_r = r->next;
|
|
r->start = map[r->start];
|
|
r->finish = map[r->finish];
|
|
if (prev_r == NULL || prev_r->start > r->finish + 1)
|
|
{
|
|
prev_r = r;
|
|
continue;
|
|
}
|
|
prev_r->start = r->start;
|
|
prev_r->next = next_r;
|
|
ira_finish_live_range (r);
|
|
}
|
|
|
|
ira_free (map);
|
|
}
|
|
|
|
/* Print live ranges R to file F. */
|
|
void
|
|
ira_print_live_range_list (FILE *f, live_range_t r)
|
|
{
|
|
for (; r != NULL; r = r->next)
|
|
fprintf (f, " [%d..%d]", r->start, r->finish);
|
|
fprintf (f, "\n");
|
|
}
|
|
|
|
DEBUG_FUNCTION void
|
|
debug (live_range &ref)
|
|
{
|
|
ira_print_live_range_list (stderr, &ref);
|
|
}
|
|
|
|
DEBUG_FUNCTION void
|
|
debug (live_range *ptr)
|
|
{
|
|
if (ptr)
|
|
debug (*ptr);
|
|
else
|
|
fprintf (stderr, "<nil>\n");
|
|
}
|
|
|
|
/* Print live ranges R to stderr. */
|
|
void
|
|
ira_debug_live_range_list (live_range_t r)
|
|
{
|
|
ira_print_live_range_list (stderr, r);
|
|
}
|
|
|
|
/* Print live ranges of object OBJ to file F. */
|
|
static void
|
|
print_object_live_ranges (FILE *f, ira_object_t obj)
|
|
{
|
|
ira_print_live_range_list (f, OBJECT_LIVE_RANGES (obj));
|
|
}
|
|
|
|
/* Print live ranges of allocno A to file F. */
|
|
static void
|
|
print_allocno_live_ranges (FILE *f, ira_allocno_t a)
|
|
{
|
|
int n = ALLOCNO_NUM_OBJECTS (a);
|
|
int i;
|
|
|
|
for (i = 0; i < n; i++)
|
|
{
|
|
fprintf (f, " a%d(r%d", ALLOCNO_NUM (a), ALLOCNO_REGNO (a));
|
|
if (n > 1)
|
|
fprintf (f, " [%d]", i);
|
|
fprintf (f, "):");
|
|
print_object_live_ranges (f, ALLOCNO_OBJECT (a, i));
|
|
}
|
|
}
|
|
|
|
/* Print live ranges of allocno A to stderr. */
|
|
void
|
|
ira_debug_allocno_live_ranges (ira_allocno_t a)
|
|
{
|
|
print_allocno_live_ranges (stderr, a);
|
|
}
|
|
|
|
/* Print live ranges of all allocnos to file F. */
|
|
static void
|
|
print_live_ranges (FILE *f)
|
|
{
|
|
ira_allocno_t a;
|
|
ira_allocno_iterator ai;
|
|
|
|
FOR_EACH_ALLOCNO (a, ai)
|
|
print_allocno_live_ranges (f, a);
|
|
}
|
|
|
|
/* Print live ranges of all allocnos to stderr. */
|
|
void
|
|
ira_debug_live_ranges (void)
|
|
{
|
|
print_live_ranges (stderr);
|
|
}
|
|
|
|
/* The main entry function creates live ranges, set up
|
|
CONFLICT_HARD_REGS and TOTAL_CONFLICT_HARD_REGS for objects, and
|
|
calculate register pressure info. */
|
|
void
|
|
ira_create_allocno_live_ranges (void)
|
|
{
|
|
objects_live = sparseset_alloc (ira_objects_num);
|
|
allocnos_processed = sparseset_alloc (ira_allocnos_num);
|
|
curr_point = 0;
|
|
last_call_num = 0;
|
|
allocno_saved_at_call
|
|
= (int *) ira_allocate (ira_allocnos_num * sizeof (int));
|
|
memset (allocno_saved_at_call, 0, ira_allocnos_num * sizeof (int));
|
|
ira_traverse_loop_tree (true, ira_loop_tree_root, NULL,
|
|
process_bb_node_lives);
|
|
ira_max_point = curr_point;
|
|
create_start_finish_chains ();
|
|
if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL)
|
|
print_live_ranges (ira_dump_file);
|
|
/* Clean up. */
|
|
ira_free (allocno_saved_at_call);
|
|
sparseset_free (objects_live);
|
|
sparseset_free (allocnos_processed);
|
|
}
|
|
|
|
/* Compress allocno live ranges. */
|
|
void
|
|
ira_compress_allocno_live_ranges (void)
|
|
{
|
|
remove_some_program_points_and_update_live_ranges ();
|
|
ira_rebuild_start_finish_chains ();
|
|
if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL)
|
|
{
|
|
fprintf (ira_dump_file, "Ranges after the compression:\n");
|
|
print_live_ranges (ira_dump_file);
|
|
}
|
|
}
|
|
|
|
/* Free arrays IRA_START_POINT_RANGES and IRA_FINISH_POINT_RANGES. */
|
|
void
|
|
ira_finish_allocno_live_ranges (void)
|
|
{
|
|
ira_free (ira_finish_point_ranges);
|
|
ira_free (ira_start_point_ranges);
|
|
}
|