invoke.texi (-fprofile-report): Document.
* doc/invoke.texi (-fprofile-report): Document. * common.opt (-fprofile-report): New option. * toplev.c (finalize): Call dump_profile_report. * toplev.h (dump_profile_report): Declare. * passes.c (profile_record): New static var. (check_profile_consistency): New function. (dump_profile_report): New function. (execute_one_ipa_transform_pass): Call check_profile_consistency. (execute_one_pass): Likewise. From-SVN: r192161
This commit is contained in:
parent
5e25600e6e
commit
37e5402bb3
|
@ -1,3 +1,15 @@
|
||||||
|
2012-10-06 Jan Hubicka <jh@suse.cz>
|
||||||
|
|
||||||
|
* doc/invoke.texi (-fprofile-report): Document.
|
||||||
|
* common.opt (-fprofile-report): New option.
|
||||||
|
* toplev.c (finalize): Call dump_profile_report.
|
||||||
|
* toplev.h (dump_profile_report): Declare.
|
||||||
|
* passes.c (profile_record): New static var.
|
||||||
|
(check_profile_consistency): New function.
|
||||||
|
(dump_profile_report): New function.
|
||||||
|
(execute_one_ipa_transform_pass): Call check_profile_consistency.
|
||||||
|
(execute_one_pass): Likewise.
|
||||||
|
|
||||||
2012-10-06 Jan Hubicka <jh@suse.cz>
|
2012-10-06 Jan Hubicka <jh@suse.cz>
|
||||||
|
|
||||||
PR lto/54790
|
PR lto/54790
|
||||||
|
|
|
@ -1654,6 +1654,10 @@ fprofile-values
|
||||||
Common Report Var(flag_profile_values)
|
Common Report Var(flag_profile_values)
|
||||||
Insert code to profile values of expressions
|
Insert code to profile values of expressions
|
||||||
|
|
||||||
|
fprofile-report
|
||||||
|
Common Report Var(profile_report)
|
||||||
|
Report on consistency of profile
|
||||||
|
|
||||||
frandom-seed
|
frandom-seed
|
||||||
Common Var(common_deferred_options) Defer
|
Common Var(common_deferred_options) Defer
|
||||||
|
|
||||||
|
|
|
@ -388,7 +388,7 @@ Objective-C and Objective-C++ Dialects}.
|
||||||
-fno-toplevel-reorder -fno-trapping-math -fno-zero-initialized-in-bss @gol
|
-fno-toplevel-reorder -fno-trapping-math -fno-zero-initialized-in-bss @gol
|
||||||
-fomit-frame-pointer -foptimize-register-move -foptimize-sibling-calls @gol
|
-fomit-frame-pointer -foptimize-register-move -foptimize-sibling-calls @gol
|
||||||
-fpartial-inlining -fpeel-loops -fpredictive-commoning @gol
|
-fpartial-inlining -fpeel-loops -fpredictive-commoning @gol
|
||||||
-fprefetch-loop-arrays @gol
|
-fprefetch-loop-arrays -fprofile-report @gol
|
||||||
-fprofile-correction -fprofile-dir=@var{path} -fprofile-generate @gol
|
-fprofile-correction -fprofile-dir=@var{path} -fprofile-generate @gol
|
||||||
-fprofile-generate=@var{path} @gol
|
-fprofile-generate=@var{path} @gol
|
||||||
-fprofile-use -fprofile-use=@var{path} -fprofile-values @gol
|
-fprofile-use -fprofile-use=@var{path} -fprofile-values @gol
|
||||||
|
@ -5153,6 +5153,11 @@ allocation for the WPA phase only.
|
||||||
Makes the compiler print some statistics about permanent memory
|
Makes the compiler print some statistics about permanent memory
|
||||||
allocation before or after interprocedural optimization.
|
allocation before or after interprocedural optimization.
|
||||||
|
|
||||||
|
@item -fprofile-report
|
||||||
|
@opindex fprofile-report
|
||||||
|
Makes the compiler print some statistics about consistency of the
|
||||||
|
(estimated) profile and effect of individual passes.
|
||||||
|
|
||||||
@item -fstack-usage
|
@item -fstack-usage
|
||||||
@opindex fstack-usage
|
@opindex fstack-usage
|
||||||
Makes the compiler output stack usage information for the program, on a
|
Makes the compiler output stack usage information for the program, on a
|
||||||
|
|
221
gcc/passes.c
221
gcc/passes.c
|
@ -1778,6 +1778,209 @@ execute_function_dump (void *data ATTRIBUTE_UNUSED)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Make statistic about profile consistency. */
|
||||||
|
|
||||||
|
struct profile_record
|
||||||
|
{
|
||||||
|
int num_mismatched_freq_in[2];
|
||||||
|
int num_mismatched_freq_out[2];
|
||||||
|
int num_mismatched_count_in[2];
|
||||||
|
int num_mismatched_count_out[2];
|
||||||
|
bool run;
|
||||||
|
gcov_type time[2];
|
||||||
|
int size[2];
|
||||||
|
};
|
||||||
|
|
||||||
|
static struct profile_record *profile_record;
|
||||||
|
|
||||||
|
static void
|
||||||
|
check_profile_consistency (int index, int subpass, bool run)
|
||||||
|
{
|
||||||
|
basic_block bb;
|
||||||
|
edge_iterator ei;
|
||||||
|
edge e;
|
||||||
|
int sum;
|
||||||
|
gcov_type lsum;
|
||||||
|
|
||||||
|
if (index == -1)
|
||||||
|
return;
|
||||||
|
if (!profile_record)
|
||||||
|
profile_record = XCNEWVEC (struct profile_record,
|
||||||
|
passes_by_id_size);
|
||||||
|
gcc_assert (index < passes_by_id_size && index >= 0);
|
||||||
|
gcc_assert (subpass < 2);
|
||||||
|
profile_record[index].run |= run;
|
||||||
|
|
||||||
|
FOR_ALL_BB (bb)
|
||||||
|
{
|
||||||
|
if (bb != EXIT_BLOCK_PTR_FOR_FUNCTION (cfun)
|
||||||
|
&& profile_status != PROFILE_ABSENT)
|
||||||
|
{
|
||||||
|
sum = 0;
|
||||||
|
FOR_EACH_EDGE (e, ei, bb->succs)
|
||||||
|
sum += e->probability;
|
||||||
|
if (EDGE_COUNT (bb->succs) && abs (sum - REG_BR_PROB_BASE) > 100)
|
||||||
|
profile_record[index].num_mismatched_freq_out[subpass]++;
|
||||||
|
lsum = 0;
|
||||||
|
FOR_EACH_EDGE (e, ei, bb->succs)
|
||||||
|
lsum += e->count;
|
||||||
|
if (EDGE_COUNT (bb->succs)
|
||||||
|
&& (lsum - bb->count > 100 || lsum - bb->count < -100))
|
||||||
|
profile_record[index].num_mismatched_count_out[subpass]++;
|
||||||
|
}
|
||||||
|
if (bb != ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun)
|
||||||
|
&& profile_status != PROFILE_ABSENT)
|
||||||
|
{
|
||||||
|
sum = 0;
|
||||||
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
||||||
|
sum += EDGE_FREQUENCY (e);
|
||||||
|
if (abs (sum - bb->frequency) > 100
|
||||||
|
|| (MAX (sum, bb->frequency) > 10
|
||||||
|
&& abs ((sum - bb->frequency) * 100 / (MAX (sum, bb->frequency) + 1)) > 10))
|
||||||
|
profile_record[index].num_mismatched_freq_in[subpass]++;
|
||||||
|
lsum = 0;
|
||||||
|
FOR_EACH_EDGE (e, ei, bb->preds)
|
||||||
|
lsum += e->count;
|
||||||
|
if (lsum - bb->count > 100 || lsum - bb->count < -100)
|
||||||
|
profile_record[index].num_mismatched_count_in[subpass]++;
|
||||||
|
}
|
||||||
|
if (bb == ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun)
|
||||||
|
|| bb == EXIT_BLOCK_PTR_FOR_FUNCTION (cfun))
|
||||||
|
continue;
|
||||||
|
if ((cfun && (cfun->curr_properties & PROP_trees)))
|
||||||
|
{
|
||||||
|
gimple_stmt_iterator i;
|
||||||
|
|
||||||
|
for (i = gsi_start_bb (bb); !gsi_end_p (i); gsi_next (&i))
|
||||||
|
{
|
||||||
|
profile_record[index].size[subpass]
|
||||||
|
+= estimate_num_insns (gsi_stmt (i), &eni_size_weights);
|
||||||
|
if (profile_status == PROFILE_READ)
|
||||||
|
profile_record[index].time[subpass]
|
||||||
|
+= estimate_num_insns (gsi_stmt (i),
|
||||||
|
&eni_time_weights) * bb->count;
|
||||||
|
else if (profile_status == PROFILE_GUESSED)
|
||||||
|
profile_record[index].time[subpass]
|
||||||
|
+= estimate_num_insns (gsi_stmt (i),
|
||||||
|
&eni_time_weights) * bb->frequency;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else if (cfun && (cfun->curr_properties & PROP_rtl))
|
||||||
|
{
|
||||||
|
rtx insn;
|
||||||
|
for (insn = NEXT_INSN (BB_HEAD (bb)); insn && insn != NEXT_INSN (BB_END (bb));
|
||||||
|
insn = NEXT_INSN (insn))
|
||||||
|
if (INSN_P (insn))
|
||||||
|
{
|
||||||
|
profile_record[index].size[subpass]
|
||||||
|
+= insn_rtx_cost (PATTERN (insn), false);
|
||||||
|
if (profile_status == PROFILE_READ)
|
||||||
|
profile_record[index].time[subpass]
|
||||||
|
+= insn_rtx_cost (PATTERN (insn), true) * bb->count;
|
||||||
|
else if (profile_status == PROFILE_GUESSED)
|
||||||
|
profile_record[index].time[subpass]
|
||||||
|
+= insn_rtx_cost (PATTERN (insn), true) * bb->frequency;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Output profile consistency. */
|
||||||
|
|
||||||
|
void
|
||||||
|
dump_profile_report (void)
|
||||||
|
{
|
||||||
|
int i, j;
|
||||||
|
int last_freq_in = 0, last_count_in = 0, last_freq_out = 0, last_count_out = 0;
|
||||||
|
gcov_type last_time, last_size;
|
||||||
|
double rel_time_change, rel_size_change;
|
||||||
|
int last_reported;
|
||||||
|
|
||||||
|
if (!profile_record)
|
||||||
|
return;
|
||||||
|
fprintf (stderr, "\nProfile consistency report:\n\n");
|
||||||
|
fprintf (stderr, "Pass name |mismatch in |mismated out|Overall\n");
|
||||||
|
fprintf (stderr, " |freq count |freq count |size time\n");
|
||||||
|
|
||||||
|
for (i = 0; i < passes_by_id_size; i++)
|
||||||
|
for (j = 0 ; j < 2; j++)
|
||||||
|
if (profile_record[i].run)
|
||||||
|
{
|
||||||
|
if (last_time)
|
||||||
|
rel_time_change = (profile_record[i].time[j]
|
||||||
|
- (double)last_time) * 100 / (double)last_time;
|
||||||
|
else
|
||||||
|
rel_time_change = 0;
|
||||||
|
if (last_size)
|
||||||
|
rel_size_change = (profile_record[i].size[j]
|
||||||
|
- (double)last_size) * 100 / (double)last_size;
|
||||||
|
else
|
||||||
|
rel_size_change = 0;
|
||||||
|
|
||||||
|
if (profile_record[i].num_mismatched_freq_in[j] != last_freq_in
|
||||||
|
|| profile_record[i].num_mismatched_freq_out[j] != last_freq_out
|
||||||
|
|| profile_record[i].num_mismatched_count_in[j] != last_count_in
|
||||||
|
|| profile_record[i].num_mismatched_count_out[j] != last_count_out
|
||||||
|
|| rel_time_change || rel_size_change)
|
||||||
|
{
|
||||||
|
last_reported = i;
|
||||||
|
fprintf (stderr, "%-20s %s",
|
||||||
|
passes_by_id [i]->name,
|
||||||
|
j ? "(after TODO)" : " ");
|
||||||
|
if (profile_record[i].num_mismatched_freq_in[j] != last_freq_in)
|
||||||
|
fprintf (stderr, "| %+5i",
|
||||||
|
profile_record[i].num_mismatched_freq_in[j]
|
||||||
|
- last_freq_in);
|
||||||
|
else
|
||||||
|
fprintf (stderr, "| ");
|
||||||
|
if (profile_record[i].num_mismatched_count_in[j] != last_count_in)
|
||||||
|
fprintf (stderr, " %+5i",
|
||||||
|
profile_record[i].num_mismatched_count_in[j]
|
||||||
|
- last_count_in);
|
||||||
|
else
|
||||||
|
fprintf (stderr, " ");
|
||||||
|
if (profile_record[i].num_mismatched_freq_out[j] != last_freq_out)
|
||||||
|
fprintf (stderr, "| %+5i",
|
||||||
|
profile_record[i].num_mismatched_freq_out[j]
|
||||||
|
- last_freq_out);
|
||||||
|
else
|
||||||
|
fprintf (stderr, "| ");
|
||||||
|
if (profile_record[i].num_mismatched_count_out[j] != last_count_out)
|
||||||
|
fprintf (stderr, " %+5i",
|
||||||
|
profile_record[i].num_mismatched_count_out[j]
|
||||||
|
- last_count_out);
|
||||||
|
else
|
||||||
|
fprintf (stderr, " ");
|
||||||
|
|
||||||
|
/* Size/time units change across gimple and RTL. */
|
||||||
|
if (i == pass_expand.pass.static_pass_number)
|
||||||
|
fprintf (stderr, "|----------");
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (rel_size_change)
|
||||||
|
fprintf (stderr, "| %+8.4f%%", rel_size_change);
|
||||||
|
else
|
||||||
|
fprintf (stderr, "| ");
|
||||||
|
if (rel_time_change)
|
||||||
|
fprintf (stderr, " %+8.4f%%", rel_time_change);
|
||||||
|
}
|
||||||
|
fprintf (stderr, "\n");
|
||||||
|
last_freq_in = profile_record[i].num_mismatched_freq_in[j];
|
||||||
|
last_freq_out = profile_record[i].num_mismatched_freq_out[j];
|
||||||
|
last_count_in = profile_record[i].num_mismatched_count_in[j];
|
||||||
|
last_count_out = profile_record[i].num_mismatched_count_out[j];
|
||||||
|
}
|
||||||
|
else if (j && last_reported != i)
|
||||||
|
{
|
||||||
|
last_reported = i;
|
||||||
|
fprintf (stderr, "%-20s ------------| | |\n",
|
||||||
|
passes_by_id [i]->name);
|
||||||
|
}
|
||||||
|
last_time = profile_record[i].time[j];
|
||||||
|
last_size = profile_record[i].size[j];
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/* Perform all TODO actions that ought to be done on each function. */
|
/* Perform all TODO actions that ought to be done on each function. */
|
||||||
|
|
||||||
static void
|
static void
|
||||||
|
@ -2042,9 +2245,14 @@ execute_one_ipa_transform_pass (struct cgraph_node *node,
|
||||||
if (pass->tv_id != TV_NONE)
|
if (pass->tv_id != TV_NONE)
|
||||||
timevar_pop (pass->tv_id);
|
timevar_pop (pass->tv_id);
|
||||||
|
|
||||||
|
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
|
||||||
|
check_profile_consistency (pass->static_pass_number, 0, true);
|
||||||
|
|
||||||
/* Run post-pass cleanup and verification. */
|
/* Run post-pass cleanup and verification. */
|
||||||
execute_todo (todo_after);
|
execute_todo (todo_after);
|
||||||
verify_interpass_invariants ();
|
verify_interpass_invariants ();
|
||||||
|
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
|
||||||
|
check_profile_consistency (pass->static_pass_number, 1, true);
|
||||||
|
|
||||||
do_per_function (execute_function_dump, NULL);
|
do_per_function (execute_function_dump, NULL);
|
||||||
pass_fini_dump_file (pass);
|
pass_fini_dump_file (pass);
|
||||||
|
@ -2144,6 +2352,13 @@ execute_one_pass (struct opt_pass *pass)
|
||||||
|
|
||||||
if (!gate_status)
|
if (!gate_status)
|
||||||
{
|
{
|
||||||
|
/* Run so passes selectively disabling themselves on a given function
|
||||||
|
are not miscounted. */
|
||||||
|
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
|
||||||
|
{
|
||||||
|
check_profile_consistency (pass->static_pass_number, 0, false);
|
||||||
|
check_profile_consistency (pass->static_pass_number, 1, false);
|
||||||
|
}
|
||||||
current_pass = NULL;
|
current_pass = NULL;
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
@ -2210,8 +2425,14 @@ execute_one_pass (struct opt_pass *pass)
|
||||||
clean_graph_dump_file (dump_file_name);
|
clean_graph_dump_file (dump_file_name);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
|
||||||
|
check_profile_consistency (pass->static_pass_number, 0, true);
|
||||||
|
|
||||||
/* Run post-pass cleanup and verification. */
|
/* Run post-pass cleanup and verification. */
|
||||||
execute_todo (todo_after | pass->todo_flags_finish);
|
execute_todo (todo_after | pass->todo_flags_finish);
|
||||||
|
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
|
||||||
|
check_profile_consistency (pass->static_pass_number, 1, true);
|
||||||
|
|
||||||
verify_interpass_invariants ();
|
verify_interpass_invariants ();
|
||||||
do_per_function (execute_function_dump, NULL);
|
do_per_function (execute_function_dump, NULL);
|
||||||
if (pass->type == IPA_PASS)
|
if (pass->type == IPA_PASS)
|
||||||
|
|
|
@ -1815,6 +1815,9 @@ finalize (bool no_backend)
|
||||||
if (mem_report)
|
if (mem_report)
|
||||||
dump_memory_report (true);
|
dump_memory_report (true);
|
||||||
|
|
||||||
|
if (dump_profile_report)
|
||||||
|
dump_profile_report ();
|
||||||
|
|
||||||
/* Language-specific end of compilation actions. */
|
/* Language-specific end of compilation actions. */
|
||||||
lang_hooks.finish ();
|
lang_hooks.finish ();
|
||||||
}
|
}
|
||||||
|
|
|
@ -49,6 +49,7 @@ extern void emit_debug_global_declarations (tree *, int);
|
||||||
extern void write_global_declarations (void);
|
extern void write_global_declarations (void);
|
||||||
|
|
||||||
extern void dump_memory_report (bool);
|
extern void dump_memory_report (bool);
|
||||||
|
extern void dump_profile_report (void);
|
||||||
|
|
||||||
extern void target_reinit (void);
|
extern void target_reinit (void);
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue