invoke.texi (-fprofile-report): Document.

* doc/invoke.texi (-fprofile-report): Document.
	* common.opt (-fprofile-report): New option.
	* toplev.c (finalize): Call dump_profile_report.
	* toplev.h (dump_profile_report): Declare.
	* passes.c (profile_record): New static var.
	(check_profile_consistency): New function.
	(dump_profile_report): New function.
	(execute_one_ipa_transform_pass): Call check_profile_consistency.
	(execute_one_pass): Likewise.

From-SVN: r192161
This commit is contained in:
Jan Hubicka 2012-10-06 16:06:04 +02:00 committed by Jan Hubicka
parent 5e25600e6e
commit 37e5402bb3
6 changed files with 247 additions and 1 deletions

View File

@ -1,3 +1,15 @@
2012-10-06 Jan Hubicka <jh@suse.cz>
* doc/invoke.texi (-fprofile-report): Document.
* common.opt (-fprofile-report): New option.
* toplev.c (finalize): Call dump_profile_report.
* toplev.h (dump_profile_report): Declare.
* passes.c (profile_record): New static var.
(check_profile_consistency): New function.
(dump_profile_report): New function.
(execute_one_ipa_transform_pass): Call check_profile_consistency.
(execute_one_pass): Likewise.
2012-10-06 Jan Hubicka <jh@suse.cz>
PR lto/54790

View File

@ -1654,6 +1654,10 @@ fprofile-values
Common Report Var(flag_profile_values)
Insert code to profile values of expressions
fprofile-report
Common Report Var(profile_report)
Report on consistency of profile
frandom-seed
Common Var(common_deferred_options) Defer

View File

@ -388,7 +388,7 @@ Objective-C and Objective-C++ Dialects}.
-fno-toplevel-reorder -fno-trapping-math -fno-zero-initialized-in-bss @gol
-fomit-frame-pointer -foptimize-register-move -foptimize-sibling-calls @gol
-fpartial-inlining -fpeel-loops -fpredictive-commoning @gol
-fprefetch-loop-arrays @gol
-fprefetch-loop-arrays -fprofile-report @gol
-fprofile-correction -fprofile-dir=@var{path} -fprofile-generate @gol
-fprofile-generate=@var{path} @gol
-fprofile-use -fprofile-use=@var{path} -fprofile-values @gol
@ -5153,6 +5153,11 @@ allocation for the WPA phase only.
Makes the compiler print some statistics about permanent memory
allocation before or after interprocedural optimization.
@item -fprofile-report
@opindex fprofile-report
Makes the compiler print some statistics about the consistency of the
(estimated) profile and the effect of individual passes.
@item -fstack-usage
@opindex fstack-usage
Makes the compiler output stack usage information for the program, on a

View File

@ -1778,6 +1778,209 @@ execute_function_dump (void *data ATTRIBUTE_UNUSED)
}
}
/* Statistics about profile consistency, gathered per pass.

   Every two-element array below is indexed by the SUBPASS argument of
   check_profile_consistency.  The callers visible in this file pass 0
   right after a pass body has run and 1 after the pass's TODO actions
   have been executed.  Counters are only ever incremented, so each one
   is a running total over every call made for that pass.  */
struct profile_record
{
/* Number of basic blocks whose incoming edge frequencies do not add up
   to the block's own frequency (within the tolerance used by
   check_profile_consistency).  */
int num_mismatched_freq_in[2];
/* Number of basic blocks whose outgoing edge probabilities do not add
   up to REG_BR_PROB_BASE (within tolerance).  */
int num_mismatched_freq_out[2];
/* Number of basic blocks whose incoming edge counts do not add up to
   the block's count (within tolerance).  */
int num_mismatched_count_in[2];
/* Number of basic blocks whose outgoing edge counts do not add up to
   the block's count (within tolerance).  */
int num_mismatched_count_out[2];
/* OR of the RUN argument of every check_profile_consistency call for
   this pass; dump_profile_report only prints entries where it is set.  */
bool run;
/* Accumulated time estimate: per-statement/insn time cost multiplied by
   the block's count (PROFILE_READ) or frequency (PROFILE_GUESSED).  */
gcov_type time[2];
/* Accumulated size estimate summed over statements/insns.  */
int size[2];
};
/* Array of passes_by_id_size records, indexed by a pass's
   static_pass_number.  Allocated zero-initialized on the first call to
   check_profile_consistency; stays NULL if that is never called.  */
static struct profile_record *profile_record;
/* Accumulate profile consistency statistics for the current function
   (cfun) into the record of the pass numbered INDEX.

   INDEX is the pass's static number; -1 means there is nothing to
   record and the function returns immediately.  SUBPASS (0 or 1)
   selects which slot of the per-pass counters is updated.  RUN is
   OR-ed into the record's `run' flag.

   For every basic block the function checks, unless the profile is
   absent, that outgoing probabilities/counts and incoming
   frequencies/counts agree with the block's own numbers, and it adds
   size and time estimates for the block's statements (GIMPLE) or
   insns (RTL).  */
static void
check_profile_consistency (int index, int subpass, bool run)
{
  struct profile_record *rec;
  basic_block bb;

  if (index == -1)
    return;

  /* The table is created lazily, zero-filled, one slot per pass id.  */
  if (!profile_record)
    profile_record = XCNEWVEC (struct profile_record,
			       passes_by_id_size);
  gcc_assert (index < passes_by_id_size && index >= 0);
  gcc_assert (subpass < 2);

  rec = &profile_record[index];
  rec->run |= run;

  FOR_ALL_BB (bb)
    {
      const bool is_entry = (bb == ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun));
      const bool is_exit = (bb == EXIT_BLOCK_PTR_FOR_FUNCTION (cfun));
      edge_iterator ei;
      edge e;

      /* Outgoing side: probabilities should sum to REG_BR_PROB_BASE and
	 counts to the block's count.  Blocks without successors are not
	 counted as mismatches.  */
      if (!is_exit && profile_status != PROFILE_ABSENT)
	{
	  int prob_sum = 0;
	  gcov_type count_sum = 0;

	  FOR_EACH_EDGE (e, ei, bb->succs)
	    {
	      prob_sum += e->probability;
	      count_sum += e->count;
	    }

	  if (EDGE_COUNT (bb->succs))
	    {
	      gcov_type count_delta = count_sum - bb->count;

	      if (abs (prob_sum - REG_BR_PROB_BASE) > 100)
		rec->num_mismatched_freq_out[subpass]++;
	      if (count_delta > 100 || count_delta < -100)
		rec->num_mismatched_count_out[subpass]++;
	    }
	}

      /* Incoming side: edge frequencies should sum to the block's
	 frequency (absolute slack of 100, or a relative check once the
	 larger value exceeds 10) and counts to the block's count.  */
      if (!is_entry && profile_status != PROFILE_ABSENT)
	{
	  int freq_sum = 0;
	  gcov_type count_sum = 0;
	  int freq_delta, freq_max;
	  gcov_type count_delta;

	  FOR_EACH_EDGE (e, ei, bb->preds)
	    {
	      freq_sum += EDGE_FREQUENCY (e);
	      count_sum += e->count;
	    }

	  freq_delta = freq_sum - bb->frequency;
	  freq_max = MAX (freq_sum, bb->frequency);
	  if (abs (freq_delta) > 100
	      || (freq_max > 10
		  && abs (freq_delta * 100 / (freq_max + 1)) > 10))
	    rec->num_mismatched_freq_in[subpass]++;

	  count_delta = count_sum - bb->count;
	  if (count_delta > 100 || count_delta < -100)
	    rec->num_mismatched_count_in[subpass]++;
	}

      /* Entry and exit blocks contribute no size or time.  */
      if (is_entry || is_exit)
	continue;

      if ((cfun && (cfun->curr_properties & PROP_trees)))
	{
	  gimple_stmt_iterator gsi;

	  for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
	    {
	      rec->size[subpass]
		+= estimate_num_insns (gsi_stmt (gsi), &eni_size_weights);

	      /* Time is weighted by the real count when a profile was
		 read, by the estimated frequency when it was guessed.  */
	      switch (profile_status)
		{
		case PROFILE_READ:
		  rec->time[subpass]
		    += estimate_num_insns (gsi_stmt (gsi),
					   &eni_time_weights) * bb->count;
		  break;
		case PROFILE_GUESSED:
		  rec->time[subpass]
		    += estimate_num_insns (gsi_stmt (gsi),
					   &eni_time_weights) * bb->frequency;
		  break;
		default:
		  break;
		}
	    }
	}
      else if (cfun && (cfun->curr_properties & PROP_rtl))
	{
	  /* The walk starts at the insn following BB_HEAD and stops
	     after BB_END.  */
	  rtx insn = NEXT_INSN (BB_HEAD (bb));

	  while (insn && insn != NEXT_INSN (BB_END (bb)))
	    {
	      if (INSN_P (insn))
		{
		  rec->size[subpass]
		    += insn_rtx_cost (PATTERN (insn), false);

		  switch (profile_status)
		    {
		    case PROFILE_READ:
		      rec->time[subpass]
			+= insn_rtx_cost (PATTERN (insn), true) * bb->count;
		      break;
		    case PROFILE_GUESSED:
		      rec->time[subpass]
			+= insn_rtx_cost (PATTERN (insn), true) * bb->frequency;
		      break;
		    default:
		      break;
		    }
		}
	      insn = NEXT_INSN (insn);
	    }
	}
    }
}
/* Output the profile consistency report to stderr.

   Walks every pass slot in pass-id order, and for each pass that was
   marked as run prints one row per subpass (0 = after the pass body,
   1 = "after TODO") whenever a mismatch counter or the size/time
   estimate changed relative to the previously visited row.  Mismatch
   columns show the signed change of the counter; size and time show
   the relative change in percent.  Does nothing when no statistics
   were collected.  */
void
dump_profile_report (void)
{
  int i, j;
  int last_freq_in = 0, last_count_in = 0, last_freq_out = 0, last_count_out = 0;
  /* Start from zero so the first visited row has no "previous" size or
     time and reports no relative change, instead of reading an
     indeterminate value.  */
  gcov_type last_time = 0, last_size = 0;
  double rel_time_change, rel_size_change;
  /* -1: no pass has produced a row yet.  */
  int last_reported = -1;

  if (!profile_record)
    return;

  fprintf (stderr, "\nProfile consistency report:\n\n");
  fprintf (stderr, "Pass name |mismatch in |mismatch out|Overall\n");
  fprintf (stderr, " |freq count |freq count |size time\n");

  for (i = 0; i < passes_by_id_size; i++)
    for (j = 0 ; j < 2; j++)
      if (profile_record[i].run)
	{
	  if (last_time)
	    rel_time_change = (profile_record[i].time[j]
			       - (double)last_time) * 100 / (double)last_time;
	  else
	    rel_time_change = 0;
	  if (last_size)
	    rel_size_change = (profile_record[i].size[j]
			       - (double)last_size) * 100 / (double)last_size;
	  else
	    rel_size_change = 0;

	  if (profile_record[i].num_mismatched_freq_in[j] != last_freq_in
	      || profile_record[i].num_mismatched_freq_out[j] != last_freq_out
	      || profile_record[i].num_mismatched_count_in[j] != last_count_in
	      || profile_record[i].num_mismatched_count_out[j] != last_count_out
	      || rel_time_change || rel_size_change)
	    {
	      last_reported = i;
	      fprintf (stderr, "%-20s %s",
		       passes_by_id [i]->name,
		       j ? "(after TODO)" : " ");
	      if (profile_record[i].num_mismatched_freq_in[j] != last_freq_in)
		fprintf (stderr, "| %+5i",
			 profile_record[i].num_mismatched_freq_in[j]
			 - last_freq_in);
	      else
		fprintf (stderr, "| ");
	      if (profile_record[i].num_mismatched_count_in[j] != last_count_in)
		fprintf (stderr, " %+5i",
			 profile_record[i].num_mismatched_count_in[j]
			 - last_count_in);
	      else
		fprintf (stderr, " ");
	      if (profile_record[i].num_mismatched_freq_out[j] != last_freq_out)
		fprintf (stderr, "| %+5i",
			 profile_record[i].num_mismatched_freq_out[j]
			 - last_freq_out);
	      else
		fprintf (stderr, "| ");
	      if (profile_record[i].num_mismatched_count_out[j] != last_count_out)
		fprintf (stderr, " %+5i",
			 profile_record[i].num_mismatched_count_out[j]
			 - last_count_out);
	      else
		fprintf (stderr, " ");

	      /* Size/time units change across gimple and RTL.  */
	      if (i == pass_expand.pass.static_pass_number)
		fprintf (stderr, "|----------");
	      else
		{
		  if (rel_size_change)
		    fprintf (stderr, "| %+8.4f%%", rel_size_change);
		  else
		    fprintf (stderr, "| ");
		  if (rel_time_change)
		    fprintf (stderr, " %+8.4f%%", rel_time_change);
		}
	      fprintf (stderr, "\n");
	      last_freq_in = profile_record[i].num_mismatched_freq_in[j];
	      last_freq_out = profile_record[i].num_mismatched_freq_out[j];
	      last_count_in = profile_record[i].num_mismatched_count_in[j];
	      last_count_out = profile_record[i].num_mismatched_count_out[j];
	    }
	  else if (j && last_reported != i)
	    {
	      /* Neither subpass of this pass changed anything: emit a
		 single placeholder row so the pass still appears.  */
	      last_reported = i;
	      fprintf (stderr, "%-20s ------------| | |\n",
		       passes_by_id [i]->name);
	    }
	  last_time = profile_record[i].time[j];
	  last_size = profile_record[i].size[j];
	}
}
/* Perform all TODO actions that ought to be done on each function. */
static void
@ -2042,9 +2245,14 @@ execute_one_ipa_transform_pass (struct cgraph_node *node,
if (pass->tv_id != TV_NONE)
timevar_pop (pass->tv_id);
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
check_profile_consistency (pass->static_pass_number, 0, true);
/* Run post-pass cleanup and verification. */
execute_todo (todo_after);
verify_interpass_invariants ();
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
check_profile_consistency (pass->static_pass_number, 1, true);
do_per_function (execute_function_dump, NULL);
pass_fini_dump_file (pass);
@ -2144,6 +2352,13 @@ execute_one_pass (struct opt_pass *pass)
if (!gate_status)
{
/* Run so passes selectively disabling themselves on a given function
are not miscounted. */
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
{
check_profile_consistency (pass->static_pass_number, 0, false);
check_profile_consistency (pass->static_pass_number, 1, false);
}
current_pass = NULL;
return false;
}
@ -2210,8 +2425,14 @@ execute_one_pass (struct opt_pass *pass)
clean_graph_dump_file (dump_file_name);
}
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
check_profile_consistency (pass->static_pass_number, 0, true);
/* Run post-pass cleanup and verification. */
execute_todo (todo_after | pass->todo_flags_finish);
if (profile_report && cfun && (cfun->curr_properties & PROP_cfg))
check_profile_consistency (pass->static_pass_number, 1, true);
verify_interpass_invariants ();
do_per_function (execute_function_dump, NULL);
if (pass->type == IPA_PASS)

View File

@ -1815,6 +1815,9 @@ finalize (bool no_backend)
if (mem_report)
dump_memory_report (true);
if (dump_profile_report)
dump_profile_report ();
/* Language-specific end of compilation actions. */
lang_hooks.finish ();
}

View File

@ -49,6 +49,7 @@ extern void emit_debug_global_declarations (tree *, int);
extern void write_global_declarations (void);
extern void dump_memory_report (bool);
extern void dump_profile_report (void);
extern void target_reinit (void);