709 lines
18 KiB
C
709 lines
18 KiB
C
|
/* Transformations based on profile information for values.
|
|||
|
Copyright (C) 2003 Free Software Foundation, Inc.
|
|||
|
|
|||
|
This file is part of GCC.
|
|||
|
|
|||
|
GCC is free software; you can redistribute it and/or modify it under
|
|||
|
the terms of the GNU General Public License as published by the Free
|
|||
|
Software Foundation; either version 2, or (at your option) any later
|
|||
|
version.
|
|||
|
|
|||
|
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
|
|||
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|||
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|||
|
for more details.
|
|||
|
|
|||
|
You should have received a copy of the GNU General Public License
|
|||
|
along with GCC; see the file COPYING. If not, write to the Free
|
|||
|
Software Foundation, 59 Temple Place - Suite 330, Boston, MA
|
|||
|
02111-1307, USA. */
|
|||
|
|
|||
|
#include "config.h"
|
|||
|
#include "system.h"
|
|||
|
#include "coretypes.h"
|
|||
|
#include "tm.h"
|
|||
|
#include "rtl.h"
|
|||
|
#include "expr.h"
|
|||
|
#include "hard-reg-set.h"
|
|||
|
#include "basic-block.h"
|
|||
|
#include "value-prof.h"
|
|||
|
#include "output.h"
|
|||
|
#include "flags.h"
|
|||
|
#include "insn-config.h"
|
|||
|
#include "recog.h"
|
|||
|
#include "optabs.h"
|
|||
|
#include "regs.h"
|
|||
|
|
|||
|
/* In this file value profile based optimizations will be placed (none are
|
|||
|
here just now, but they are hopefully coming soon).
|
|||
|
|
|||
|
Every such optimization should add its requirements for profiled values to
|
|||
|
insn_values_to_profile function. This function is called from branch_prob
|
|||
|
in profile.c and the requested values are instrumented by it in the first
|
|||
|
compilation with -fprofile-arcs. The optimization may then read the
|
|||
|
gathered data in the second compilation with -fbranch-probabilities.
|
|||
|
The measured data is appended as REG_VALUE_PROFILE note to the instrumented
|
|||
|
insn. The argument to the note consists of an EXPR_LIST where its
|
|||
|
members have the following meaning (from the first to the last):
|
|||
|
|
|||
|
-- type of information gathered (HIST_TYPE*)
|
|||
|
-- the expression that is profiled
|
|||
|
-- list of counters starting from the first one. */
|
|||
|
|
|||
|
static void insn_divmod_values_to_profile (rtx, unsigned *,
|
|||
|
struct histogram_value **);
|
|||
|
static void insn_values_to_profile (rtx, unsigned *, struct histogram_value **);
|
|||
|
static rtx gen_divmod_fixed_value (enum machine_mode, enum rtx_code, rtx, rtx,
|
|||
|
rtx, gcov_type);
|
|||
|
static rtx gen_mod_pow2 (enum machine_mode, enum rtx_code, rtx, rtx, rtx);
|
|||
|
static rtx gen_mod_subtract (enum machine_mode, enum rtx_code, rtx, rtx, rtx,
|
|||
|
int);
|
|||
|
static bool divmod_fixed_value_transform (rtx insn);
|
|||
|
static bool mod_pow2_value_transform (rtx);
|
|||
|
static bool mod_subtract_transform (rtx);
|
|||
|
|
|||
|
/* Release the list of VALUES of length N_VALUES for that we want to measure
|
|||
|
histograms. */
|
|||
|
void
|
|||
|
free_profiled_values (unsigned n_values ATTRIBUTE_UNUSED,
|
|||
|
struct histogram_value *values)
|
|||
|
{
|
|||
|
free (values);
|
|||
|
}
|
|||
|
|
|||
|
/* Find values inside INSN for that we want to measure histograms for
|
|||
|
division/modulo optimization. */
|
|||
|
static void
|
|||
|
insn_divmod_values_to_profile (rtx insn, unsigned *n_values,
|
|||
|
struct histogram_value **values)
|
|||
|
{
|
|||
|
rtx set, set_src, op1, op2;
|
|||
|
enum machine_mode mode;
|
|||
|
|
|||
|
if (!INSN_P (insn))
|
|||
|
return;
|
|||
|
|
|||
|
set = single_set (insn);
|
|||
|
if (!set)
|
|||
|
return;
|
|||
|
|
|||
|
mode = GET_MODE (SET_DEST (set));
|
|||
|
if (!INTEGRAL_MODE_P (mode))
|
|||
|
return;
|
|||
|
|
|||
|
set_src = SET_SRC (set);
|
|||
|
switch (GET_CODE (set_src))
|
|||
|
{
|
|||
|
case DIV:
|
|||
|
case MOD:
|
|||
|
case UDIV:
|
|||
|
case UMOD:
|
|||
|
op1 = XEXP (set_src, 0);
|
|||
|
op2 = XEXP (set_src, 1);
|
|||
|
if (side_effects_p (op2))
|
|||
|
return;
|
|||
|
|
|||
|
/* Check for a special case where the divisor is power of 2. */
|
|||
|
if ((GET_CODE (set_src) == UMOD) && !CONSTANT_P (op2))
|
|||
|
{
|
|||
|
*values = xrealloc (*values,
|
|||
|
(*n_values + 1)
|
|||
|
* sizeof (struct histogram_value));
|
|||
|
(*values)[*n_values].value = op2;
|
|||
|
(*values)[*n_values].seq = NULL_RTX;
|
|||
|
(*values)[*n_values].mode = mode;
|
|||
|
(*values)[*n_values].insn = insn;
|
|||
|
(*values)[*n_values].type = HIST_TYPE_POW2;
|
|||
|
(*values)[*n_values].hdata.pow2.may_be_other = 1;
|
|||
|
(*n_values)++;
|
|||
|
}
|
|||
|
|
|||
|
/* Check whether the divisor is not in fact a constant. */
|
|||
|
if (!CONSTANT_P (op2))
|
|||
|
{
|
|||
|
*values = xrealloc (*values,
|
|||
|
(*n_values + 1)
|
|||
|
* sizeof (struct histogram_value));
|
|||
|
(*values)[*n_values].value = op2;
|
|||
|
(*values)[*n_values].mode = mode;
|
|||
|
(*values)[*n_values].seq = NULL_RTX;
|
|||
|
(*values)[*n_values].insn = insn;
|
|||
|
(*values)[*n_values].type = HIST_TYPE_SINGLE_VALUE;
|
|||
|
(*n_values)++;
|
|||
|
}
|
|||
|
|
|||
|
/* For mod, check whether it is not often a noop (or replaceable by
|
|||
|
a few subtractions). */
|
|||
|
if (GET_CODE (set_src) == UMOD && !side_effects_p (op1))
|
|||
|
{
|
|||
|
rtx tmp;
|
|||
|
|
|||
|
*values = xrealloc (*values,
|
|||
|
(*n_values + 1)
|
|||
|
* sizeof (struct histogram_value));
|
|||
|
start_sequence ();
|
|||
|
tmp = simplify_gen_binary (DIV, mode, copy_rtx (op1), copy_rtx (op2));
|
|||
|
(*values)[*n_values].value = force_operand (tmp, NULL_RTX);
|
|||
|
(*values)[*n_values].seq = get_insns ();
|
|||
|
end_sequence ();
|
|||
|
(*values)[*n_values].mode = mode;
|
|||
|
(*values)[*n_values].insn = insn;
|
|||
|
(*values)[*n_values].type = HIST_TYPE_INTERVAL;
|
|||
|
(*values)[*n_values].hdata.intvl.int_start = 0;
|
|||
|
(*values)[*n_values].hdata.intvl.steps = 2;
|
|||
|
(*values)[*n_values].hdata.intvl.may_be_less = 1;
|
|||
|
(*values)[*n_values].hdata.intvl.may_be_more = 1;
|
|||
|
(*n_values)++;
|
|||
|
}
|
|||
|
return;
|
|||
|
|
|||
|
default:
|
|||
|
return;
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
/* Find values inside INSN for that we want to measure histograms and adds
|
|||
|
them to list VALUES (increasing the record of its length in N_VALUES). */
|
|||
|
static void
|
|||
|
insn_values_to_profile (rtx insn,
|
|||
|
unsigned *n_values,
|
|||
|
struct histogram_value **values)
|
|||
|
{
|
|||
|
if (flag_value_profile_transformations)
|
|||
|
insn_divmod_values_to_profile (insn, n_values, values);
|
|||
|
}
|
|||
|
|
|||
|
/* Find list of values for that we want to measure histograms. */
|
|||
|
void
|
|||
|
find_values_to_profile (unsigned *n_values, struct histogram_value **values)
|
|||
|
{
|
|||
|
rtx insn;
|
|||
|
unsigned i;
|
|||
|
|
|||
|
*n_values = 0;
|
|||
|
*values = NULL;
|
|||
|
for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
|
|||
|
insn_values_to_profile (insn, n_values, values);
|
|||
|
|
|||
|
for (i = 0; i < *n_values; i++)
|
|||
|
{
|
|||
|
switch ((*values)[i].type)
|
|||
|
{
|
|||
|
case HIST_TYPE_INTERVAL:
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file,
|
|||
|
"Interval counter for insn %d, range %d -- %d.\n",
|
|||
|
INSN_UID ((*values)[i].insn),
|
|||
|
(*values)[i].hdata.intvl.int_start,
|
|||
|
((*values)[i].hdata.intvl.int_start
|
|||
|
+ (*values)[i].hdata.intvl.steps - 1));
|
|||
|
(*values)[i].n_counters = (*values)[i].hdata.intvl.steps +
|
|||
|
((*values)[i].hdata.intvl.may_be_less ? 1 : 0) +
|
|||
|
((*values)[i].hdata.intvl.may_be_more ? 1 : 0);
|
|||
|
break;
|
|||
|
|
|||
|
case HIST_TYPE_POW2:
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file,
|
|||
|
"Pow2 counter for insn %d.\n",
|
|||
|
INSN_UID ((*values)[i].insn));
|
|||
|
(*values)[i].n_counters = GET_MODE_BITSIZE ((*values)[i].mode) +
|
|||
|
((*values)[i].hdata.pow2.may_be_other ? 1 : 0);
|
|||
|
break;
|
|||
|
|
|||
|
case HIST_TYPE_SINGLE_VALUE:
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file,
|
|||
|
"Single value counter for insn %d.\n",
|
|||
|
INSN_UID ((*values)[i].insn));
|
|||
|
(*values)[i].n_counters = 3;
|
|||
|
break;
|
|||
|
|
|||
|
case HIST_TYPE_CONST_DELTA:
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file,
|
|||
|
"Constant delta counter for insn %d.\n",
|
|||
|
INSN_UID ((*values)[i].insn));
|
|||
|
(*values)[i].n_counters = 4;
|
|||
|
break;
|
|||
|
|
|||
|
default:
|
|||
|
abort ();
|
|||
|
}
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
/* Main entry point. Finds REG_VALUE_PROFILE notes from profiler and uses
|
|||
|
them to identify and exploit properties of values that are hard to analyze
|
|||
|
statically.
|
|||
|
|
|||
|
We do following transformations:
|
|||
|
|
|||
|
1)
|
|||
|
|
|||
|
x = a / b;
|
|||
|
|
|||
|
where b is almost always a constant N is transformed to
|
|||
|
|
|||
|
if (b == N)
|
|||
|
x = a / N;
|
|||
|
else
|
|||
|
x = a / b;
|
|||
|
|
|||
|
Analogically with %
|
|||
|
|
|||
|
2)
|
|||
|
|
|||
|
x = a % b
|
|||
|
|
|||
|
where b is almost always a power of 2 and the division is unsigned
|
|||
|
TODO -- handle signed case as well
|
|||
|
|
|||
|
if ((b & (b - 1)) == 0)
|
|||
|
x = a & (b - 1);
|
|||
|
else
|
|||
|
x = x % b;
|
|||
|
|
|||
|
Note that when b = 0, no error will occur and x = a; this is correct,
|
|||
|
as result of such operation is undefined.
|
|||
|
|
|||
|
3)
|
|||
|
|
|||
|
x = a % b
|
|||
|
|
|||
|
where a is almost always less then b and the division is unsigned
|
|||
|
TODO -- handle signed case as well
|
|||
|
|
|||
|
x = a;
|
|||
|
if (x >= b)
|
|||
|
x %= b;
|
|||
|
|
|||
|
4)
|
|||
|
|
|||
|
x = a % b
|
|||
|
|
|||
|
where a is almost always less then 2 * b and the division is unsigned
|
|||
|
TODO -- handle signed case as well
|
|||
|
|
|||
|
x = a;
|
|||
|
if (x >= b)
|
|||
|
x -= b;
|
|||
|
if (x >= b)
|
|||
|
x %= b;
|
|||
|
|
|||
|
It would be possible to continue analogically for K * b for other small
|
|||
|
K's, but it is probably not useful.
|
|||
|
|
|||
|
TODO:
|
|||
|
|
|||
|
There are other useful cases that could be handled by a similar mechanism,
|
|||
|
for example:
|
|||
|
|
|||
|
for (i = 0; i < n; i++)
|
|||
|
...
|
|||
|
|
|||
|
transform to (for constant N):
|
|||
|
|
|||
|
if (n == N)
|
|||
|
for (i = 0; i < N; i++)
|
|||
|
...
|
|||
|
else
|
|||
|
for (i = 0; i < n; i++)
|
|||
|
...
|
|||
|
making unroller happy. Since this may grow the code significantly,
|
|||
|
we would have to be very careful here. */
|
|||
|
|
|||
|
bool
|
|||
|
value_profile_transformations (void)
|
|||
|
{
|
|||
|
rtx insn, next;
|
|||
|
int changed = false;
|
|||
|
|
|||
|
for (insn = get_insns (); insn; insn = next)
|
|||
|
{
|
|||
|
next = NEXT_INSN (insn);
|
|||
|
|
|||
|
if (!INSN_P (insn))
|
|||
|
continue;
|
|||
|
|
|||
|
/* Scan for insn carrying a histogram. */
|
|||
|
if (!find_reg_note (insn, REG_VALUE_PROFILE, 0))
|
|||
|
continue;
|
|||
|
|
|||
|
/* Ignore cold areas -- we are growing a code. */
|
|||
|
if (!maybe_hot_bb_p (BLOCK_FOR_INSN (insn)))
|
|||
|
continue;
|
|||
|
|
|||
|
if (rtl_dump_file)
|
|||
|
{
|
|||
|
fprintf (rtl_dump_file, "Trying transformations on insn %d\n",
|
|||
|
INSN_UID (insn));
|
|||
|
print_rtl_single (rtl_dump_file, insn);
|
|||
|
}
|
|||
|
|
|||
|
/* Transformations: */
|
|||
|
if (flag_value_profile_transformations
|
|||
|
&& (mod_subtract_transform (insn)
|
|||
|
|| divmod_fixed_value_transform (insn)
|
|||
|
|| mod_pow2_value_transform (insn)))
|
|||
|
changed = true;
|
|||
|
}
|
|||
|
|
|||
|
if (changed)
|
|||
|
{
|
|||
|
commit_edge_insertions ();
|
|||
|
allocate_reg_info (max_reg_num (), FALSE, FALSE);
|
|||
|
}
|
|||
|
|
|||
|
return changed;
|
|||
|
}
|
|||
|
|
|||
|
/* Generate code for transformation 1 (with MODE and OPERATION, operands OP1
|
|||
|
and OP2 whose value is expected to be VALUE and result TARGET). */
|
|||
|
static rtx
|
|||
|
gen_divmod_fixed_value (enum machine_mode mode, enum rtx_code operation,
|
|||
|
rtx target, rtx op1, rtx op2, gcov_type value)
|
|||
|
{
|
|||
|
rtx tmp, tmp1;
|
|||
|
rtx neq_label = gen_label_rtx ();
|
|||
|
rtx end_label = gen_label_rtx ();
|
|||
|
rtx sequence;
|
|||
|
|
|||
|
start_sequence ();
|
|||
|
|
|||
|
if (!REG_P (op2))
|
|||
|
{
|
|||
|
tmp = gen_reg_rtx (mode);
|
|||
|
emit_move_insn (tmp, copy_rtx (op2));
|
|||
|
}
|
|||
|
else
|
|||
|
tmp = op2;
|
|||
|
|
|||
|
do_compare_rtx_and_jump (tmp, GEN_INT (value), NE, 0, mode, NULL_RTX,
|
|||
|
NULL_RTX, neq_label);
|
|||
|
tmp1 = simplify_gen_binary (operation, mode, copy_rtx (op1), GEN_INT (value));
|
|||
|
tmp1 = force_operand (tmp1, target);
|
|||
|
if (tmp1 != target)
|
|||
|
emit_move_insn (copy_rtx (target), copy_rtx (tmp1));
|
|||
|
|
|||
|
emit_jump_insn (gen_jump (end_label));
|
|||
|
emit_barrier ();
|
|||
|
|
|||
|
emit_label (neq_label);
|
|||
|
tmp1 = simplify_gen_binary (operation, mode, copy_rtx (op1), copy_rtx (tmp));
|
|||
|
tmp1 = force_operand (tmp1, target);
|
|||
|
if (tmp1 != target)
|
|||
|
emit_move_insn (copy_rtx (target), copy_rtx (tmp1));
|
|||
|
|
|||
|
emit_label (end_label);
|
|||
|
|
|||
|
sequence = get_insns ();
|
|||
|
end_sequence ();
|
|||
|
rebuild_jump_labels (sequence);
|
|||
|
return sequence;
|
|||
|
}
|
|||
|
|
|||
|
/* Do transform 1) on INSN if applicable. */
|
|||
|
static bool
|
|||
|
divmod_fixed_value_transform (rtx insn)
|
|||
|
{
|
|||
|
rtx set, set_src, set_dest, op1, op2, value, histogram;
|
|||
|
enum rtx_code code;
|
|||
|
enum machine_mode mode;
|
|||
|
gcov_type val, count, all;
|
|||
|
edge e;
|
|||
|
|
|||
|
set = single_set (insn);
|
|||
|
if (!set)
|
|||
|
return false;
|
|||
|
|
|||
|
set_src = SET_SRC (set);
|
|||
|
set_dest = SET_DEST (set);
|
|||
|
code = GET_CODE (set_src);
|
|||
|
mode = GET_MODE (set_dest);
|
|||
|
|
|||
|
if (code != DIV && code != MOD && code != UDIV && code != UMOD)
|
|||
|
return false;
|
|||
|
op1 = XEXP (set_src, false);
|
|||
|
op2 = XEXP (set_src, 1);
|
|||
|
|
|||
|
for (histogram = REG_NOTES (insn);
|
|||
|
histogram;
|
|||
|
histogram = XEXP (histogram, 1))
|
|||
|
if (REG_NOTE_KIND (histogram) == REG_VALUE_PROFILE
|
|||
|
&& XEXP (XEXP (histogram, 0), 0) == GEN_INT (HIST_TYPE_SINGLE_VALUE))
|
|||
|
break;
|
|||
|
|
|||
|
if (!histogram)
|
|||
|
return false;
|
|||
|
|
|||
|
histogram = XEXP (XEXP (histogram, 0), 1);
|
|||
|
value = XEXP (histogram, 0);
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
val = INTVAL (XEXP (histogram, 0));
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
count = INTVAL (XEXP (histogram, 0));
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
all = INTVAL (XEXP (histogram, 0));
|
|||
|
|
|||
|
/* We require that count is at least half of all; this means
|
|||
|
that for the transformation to fire the value must be constant
|
|||
|
at least 50% of time (and 75% gives the guarantee of usage). */
|
|||
|
if (!rtx_equal_p (op2, value) || 2 * count < all)
|
|||
|
return false;
|
|||
|
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file, "Div/mod by constant transformation on insn %d\n",
|
|||
|
INSN_UID (insn));
|
|||
|
|
|||
|
e = split_block (BLOCK_FOR_INSN (insn), PREV_INSN (insn));
|
|||
|
delete_insn (insn);
|
|||
|
|
|||
|
insert_insn_on_edge (
|
|||
|
gen_divmod_fixed_value (mode, code, set_dest, op1, op2, val), e);
|
|||
|
|
|||
|
return true;
|
|||
|
}
|
|||
|
|
|||
|
/* Generate code for transformation 2 (with MODE and OPERATION, operands OP1
|
|||
|
and OP2 and result TARGET). */
|
|||
|
static rtx
|
|||
|
gen_mod_pow2 (enum machine_mode mode, enum rtx_code operation, rtx target,
|
|||
|
rtx op1, rtx op2)
|
|||
|
{
|
|||
|
rtx tmp, tmp1, tmp2, tmp3;
|
|||
|
rtx neq_label = gen_label_rtx ();
|
|||
|
rtx end_label = gen_label_rtx ();
|
|||
|
rtx sequence;
|
|||
|
|
|||
|
start_sequence ();
|
|||
|
|
|||
|
if (!REG_P (op2))
|
|||
|
{
|
|||
|
tmp = gen_reg_rtx (mode);
|
|||
|
emit_move_insn (tmp, copy_rtx (op2));
|
|||
|
}
|
|||
|
else
|
|||
|
tmp = op2;
|
|||
|
|
|||
|
tmp1 = expand_simple_binop (mode, PLUS, tmp, constm1_rtx, NULL_RTX,
|
|||
|
0, OPTAB_WIDEN);
|
|||
|
tmp2 = expand_simple_binop (mode, AND, tmp, tmp1, NULL_RTX,
|
|||
|
0, OPTAB_WIDEN);
|
|||
|
do_compare_rtx_and_jump (tmp2, const0_rtx, NE, 0, mode, NULL_RTX,
|
|||
|
NULL_RTX, neq_label);
|
|||
|
tmp3 = expand_simple_binop (mode, AND, op1, tmp1, target,
|
|||
|
0, OPTAB_WIDEN);
|
|||
|
if (tmp3 != target)
|
|||
|
emit_move_insn (copy_rtx (target), tmp3);
|
|||
|
emit_jump_insn (gen_jump (end_label));
|
|||
|
emit_barrier ();
|
|||
|
|
|||
|
emit_label (neq_label);
|
|||
|
tmp1 = simplify_gen_binary (operation, mode, copy_rtx (op1), copy_rtx (tmp));
|
|||
|
tmp1 = force_operand (tmp1, target);
|
|||
|
if (tmp1 != target)
|
|||
|
emit_move_insn (target, tmp1);
|
|||
|
|
|||
|
emit_label (end_label);
|
|||
|
|
|||
|
sequence = get_insns ();
|
|||
|
end_sequence ();
|
|||
|
rebuild_jump_labels (sequence);
|
|||
|
return sequence;
|
|||
|
}
|
|||
|
|
|||
|
/* Do transform 2) on INSN if applicable. */
|
|||
|
static bool
|
|||
|
mod_pow2_value_transform (rtx insn)
|
|||
|
{
|
|||
|
rtx set, set_src, set_dest, op1, op2, value, histogram;
|
|||
|
enum rtx_code code;
|
|||
|
enum machine_mode mode;
|
|||
|
gcov_type wrong_values, count;
|
|||
|
edge e;
|
|||
|
int i;
|
|||
|
|
|||
|
set = single_set (insn);
|
|||
|
if (!set)
|
|||
|
return false;
|
|||
|
|
|||
|
set_src = SET_SRC (set);
|
|||
|
set_dest = SET_DEST (set);
|
|||
|
code = GET_CODE (set_src);
|
|||
|
mode = GET_MODE (set_dest);
|
|||
|
|
|||
|
if (code != UMOD)
|
|||
|
return false;
|
|||
|
op1 = XEXP (set_src, 0);
|
|||
|
op2 = XEXP (set_src, 1);
|
|||
|
|
|||
|
for (histogram = REG_NOTES (insn);
|
|||
|
histogram;
|
|||
|
histogram = XEXP (histogram, 1))
|
|||
|
if (REG_NOTE_KIND (histogram) == REG_VALUE_PROFILE
|
|||
|
&& XEXP (XEXP (histogram, 0), 0) == GEN_INT (HIST_TYPE_POW2))
|
|||
|
break;
|
|||
|
|
|||
|
if (!histogram)
|
|||
|
return false;
|
|||
|
|
|||
|
histogram = XEXP (XEXP (histogram, 0), 1);
|
|||
|
value = XEXP (histogram, 0);
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
wrong_values =INTVAL (XEXP (histogram, 0));
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
|
|||
|
count = 0;
|
|||
|
for (i = 0; i < GET_MODE_BITSIZE (mode); i++)
|
|||
|
{
|
|||
|
count += INTVAL (XEXP (histogram, 0));
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
}
|
|||
|
|
|||
|
if (!rtx_equal_p (op2, value))
|
|||
|
return false;
|
|||
|
|
|||
|
/* We require that we hit a power of two at least half of all evaluations. */
|
|||
|
if (count < wrong_values)
|
|||
|
return false;
|
|||
|
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file, "Mod power of 2 transformation on insn %d\n",
|
|||
|
INSN_UID (insn));
|
|||
|
|
|||
|
e = split_block (BLOCK_FOR_INSN (insn), PREV_INSN (insn));
|
|||
|
delete_insn (insn);
|
|||
|
|
|||
|
insert_insn_on_edge (
|
|||
|
gen_mod_pow2 (mode, code, set_dest, op1, op2), e);
|
|||
|
|
|||
|
return true;
|
|||
|
}
|
|||
|
|
|||
|
/* Generate code for transformations 3 and 4 (with MODE and OPERATION,
|
|||
|
operands OP1 and OP2, result TARGET and at most SUB subtractions). */
|
|||
|
static rtx
|
|||
|
gen_mod_subtract (enum machine_mode mode, enum rtx_code operation,
|
|||
|
rtx target, rtx op1, rtx op2, int sub)
|
|||
|
{
|
|||
|
rtx tmp, tmp1;
|
|||
|
rtx end_label = gen_label_rtx ();
|
|||
|
rtx sequence;
|
|||
|
int i;
|
|||
|
|
|||
|
start_sequence ();
|
|||
|
|
|||
|
if (!REG_P (op2))
|
|||
|
{
|
|||
|
tmp = gen_reg_rtx (mode);
|
|||
|
emit_move_insn (tmp, copy_rtx (op2));
|
|||
|
}
|
|||
|
else
|
|||
|
tmp = op2;
|
|||
|
|
|||
|
emit_move_insn (target, copy_rtx (op1));
|
|||
|
do_compare_rtx_and_jump (target, tmp, LTU, 0, mode, NULL_RTX,
|
|||
|
NULL_RTX, end_label);
|
|||
|
|
|||
|
|
|||
|
for (i = 0; i < sub; i++)
|
|||
|
{
|
|||
|
tmp1 = expand_simple_binop (mode, MINUS, target, tmp, target,
|
|||
|
0, OPTAB_WIDEN);
|
|||
|
if (tmp1 != target)
|
|||
|
emit_move_insn (target, tmp1);
|
|||
|
do_compare_rtx_and_jump (target, tmp, LTU, 0, mode, NULL_RTX,
|
|||
|
NULL_RTX, end_label);
|
|||
|
}
|
|||
|
|
|||
|
tmp1 = simplify_gen_binary (operation, mode, copy_rtx (target), copy_rtx (tmp));
|
|||
|
tmp1 = force_operand (tmp1, target);
|
|||
|
if (tmp1 != target)
|
|||
|
emit_move_insn (target, tmp1);
|
|||
|
|
|||
|
emit_label (end_label);
|
|||
|
|
|||
|
sequence = get_insns ();
|
|||
|
end_sequence ();
|
|||
|
rebuild_jump_labels (sequence);
|
|||
|
return sequence;
|
|||
|
}
|
|||
|
|
|||
|
/* Do transforms 3) and 4) on INSN if applicable. */
|
|||
|
static bool
|
|||
|
mod_subtract_transform (rtx insn)
|
|||
|
{
|
|||
|
rtx set, set_src, set_dest, op1, op2, value, histogram;
|
|||
|
enum rtx_code code;
|
|||
|
enum machine_mode mode;
|
|||
|
gcov_type wrong_values, counts[2], count, all;
|
|||
|
edge e;
|
|||
|
int i;
|
|||
|
|
|||
|
set = single_set (insn);
|
|||
|
if (!set)
|
|||
|
return false;
|
|||
|
|
|||
|
set_src = SET_SRC (set);
|
|||
|
set_dest = SET_DEST (set);
|
|||
|
code = GET_CODE (set_src);
|
|||
|
mode = GET_MODE (set_dest);
|
|||
|
|
|||
|
if (code != UMOD)
|
|||
|
return false;
|
|||
|
op1 = XEXP (set_src, 0);
|
|||
|
op2 = XEXP (set_src, 1);
|
|||
|
|
|||
|
for (histogram = REG_NOTES (insn);
|
|||
|
histogram;
|
|||
|
histogram = XEXP (histogram, 1))
|
|||
|
if (REG_NOTE_KIND (histogram) == REG_VALUE_PROFILE
|
|||
|
&& XEXP (XEXP (histogram, 0), 0) == GEN_INT (HIST_TYPE_INTERVAL))
|
|||
|
break;
|
|||
|
|
|||
|
if (!histogram)
|
|||
|
return false;
|
|||
|
|
|||
|
histogram = XEXP (XEXP (histogram, 0), 1);
|
|||
|
value = XEXP (histogram, 0);
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
|
|||
|
all = 0;
|
|||
|
for (i = 0; i < 2; i++)
|
|||
|
{
|
|||
|
counts[i] = INTVAL (XEXP (histogram, 0));
|
|||
|
all += counts[i];
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
}
|
|||
|
wrong_values = INTVAL (XEXP (histogram, 0));
|
|||
|
histogram = XEXP (histogram, 1);
|
|||
|
wrong_values += INTVAL (XEXP (histogram, 0));
|
|||
|
all += wrong_values;
|
|||
|
|
|||
|
/* We require that we use just subtractions in at least 50% of all
|
|||
|
evaluations. */
|
|||
|
count = 0;
|
|||
|
for (i = 0; i < 2; i++)
|
|||
|
{
|
|||
|
count += counts[i];
|
|||
|
if (count * 2 >= all)
|
|||
|
break;
|
|||
|
}
|
|||
|
|
|||
|
if (i == 2)
|
|||
|
return false;
|
|||
|
|
|||
|
if (rtl_dump_file)
|
|||
|
fprintf (rtl_dump_file, "Mod subtract transformation on insn %d\n",
|
|||
|
INSN_UID (insn));
|
|||
|
|
|||
|
e = split_block (BLOCK_FOR_INSN (insn), PREV_INSN (insn));
|
|||
|
delete_insn (insn);
|
|||
|
|
|||
|
insert_insn_on_edge (
|
|||
|
gen_mod_subtract (mode, code, set_dest, op1, op2, i), e);
|
|||
|
|
|||
|
return true;
|
|||
|
}
|