perf stat: Hide runtime_stat

runtime_stat is only shared for the sake of tests that don't care
about its value. Move the definition into stat-shadow.c and have the
tests also use the global version.

Signed-off-by: Ian Rogers <irogers@google.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Alexandre Torgue <alexandre.torgue@foss.st.com>
Cc: Andrii Nakryiko <andrii@kernel.org>
Cc: Athira Rajeev <atrajeev@linux.vnet.ibm.com>
Cc: Caleb Biggers <caleb.biggers@intel.com>
Cc: Eduard Zingerman <eddyz87@gmail.com>
Cc: Florian Fischer <florian.fischer@muhq.space>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: James Clark <james.clark@arm.com>
Cc: Jing Zhang <renyu.zj@linux.alibaba.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: John Garry <john.g.garry@oracle.com>
Cc: Kajol Jain <kjain@linux.ibm.com>
Cc: Kan Liang <kan.liang@linux.intel.com>
Cc: Leo Yan <leo.yan@linaro.org>
Cc: Mark Rutland <mark.rutland@arm.com>
Cc: Maxime Coquelin <mcoquelin.stm32@gmail.com>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Perry Taylor <perry.taylor@intel.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Ravi Bangoria <ravi.bangoria@amd.com>
Cc: Sandipan Das <sandipan.das@amd.com>
Cc: Sean Christopherson <seanjc@google.com>
Cc: Stephane Eranian <eranian@google.com>
Cc: Suzuki Poulouse <suzuki.poulose@arm.com>
Cc: Xing Zhengjun <zhengjun.xing@linux.intel.com>
Cc: linux-arm-kernel@lists.infradead.org
Cc: linux-stm32@st-md-mailman.stormreply.com
Link: https://lore.kernel.org/r/20230219092848.639226-48-irogers@google.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
This commit is contained in:
Ian Rogers 2023-02-19 01:28:44 -08:00 committed by Arnaldo Carvalho de Melo
parent 758bc8e626
commit cc26ffaa01
8 changed files with 90 additions and 136 deletions

View File

@ -2074,8 +2074,7 @@ static void perf_sample__fprint_metric(struct perf_script *script,
val = sample->period * evsel->scale; val = sample->period * evsel->scale;
perf_stat__update_shadow_stats(evsel, perf_stat__update_shadow_stats(evsel,
val, val,
sample->cpu, sample->cpu);
&rt_stat);
evsel_script(evsel)->val = val; evsel_script(evsel)->val = val;
if (evsel_script(leader)->gnum == leader->core.nr_members) { if (evsel_script(leader)->gnum == leader->core.nr_members) {
for_each_group_member (ev2, leader) { for_each_group_member (ev2, leader) {
@ -2083,8 +2082,7 @@ static void perf_sample__fprint_metric(struct perf_script *script,
evsel_script(ev2)->val, evsel_script(ev2)->val,
sample->cpu, sample->cpu,
&ctx, &ctx,
NULL, NULL);
&rt_stat);
} }
evsel_script(leader)->gnum = 0; evsel_script(leader)->gnum = 0;
} }

View File

@ -434,7 +434,7 @@ static void process_interval(void)
clock_gettime(CLOCK_MONOTONIC, &ts); clock_gettime(CLOCK_MONOTONIC, &ts);
diff_timespec(&rs, &ts, &ref_time); diff_timespec(&rs, &ts, &ref_time);
perf_stat__reset_shadow_per_stat(&rt_stat); perf_stat__reset_shadow_per_stat();
evlist__reset_aggr_stats(evsel_list); evlist__reset_aggr_stats(evsel_list);
if (read_counters(&rs) == 0) if (read_counters(&rs) == 0)
@ -910,7 +910,7 @@ static int __run_perf_stat(int argc, const char **argv, int run_idx)
evlist__copy_prev_raw_counts(evsel_list); evlist__copy_prev_raw_counts(evsel_list);
evlist__reset_prev_raw_counts(evsel_list); evlist__reset_prev_raw_counts(evsel_list);
evlist__reset_aggr_stats(evsel_list); evlist__reset_aggr_stats(evsel_list);
perf_stat__reset_shadow_per_stat(&rt_stat); perf_stat__reset_shadow_per_stat();
} else { } else {
update_stats(&walltime_nsecs_stats, t1 - t0); update_stats(&walltime_nsecs_stats, t1 - t0);
update_rusage_stats(&ru_stats, &stat_config.ru_data); update_rusage_stats(&ru_stats, &stat_config.ru_data);

View File

@ -30,8 +30,7 @@ static u64 find_value(const char *name, struct value *values)
return 0; return 0;
} }
static void load_runtime_stat(struct runtime_stat *st, struct evlist *evlist, static void load_runtime_stat(struct evlist *evlist, struct value *vals)
struct value *vals)
{ {
struct evsel *evsel; struct evsel *evsel;
u64 count; u64 count;
@ -39,14 +38,14 @@ static void load_runtime_stat(struct runtime_stat *st, struct evlist *evlist,
perf_stat__reset_shadow_stats(); perf_stat__reset_shadow_stats();
evlist__for_each_entry(evlist, evsel) { evlist__for_each_entry(evlist, evsel) {
count = find_value(evsel->name, vals); count = find_value(evsel->name, vals);
perf_stat__update_shadow_stats(evsel, count, 0, st); perf_stat__update_shadow_stats(evsel, count, 0);
if (!strcmp(evsel->name, "duration_time")) if (!strcmp(evsel->name, "duration_time"))
update_stats(&walltime_nsecs_stats, count); update_stats(&walltime_nsecs_stats, count);
} }
} }
static double compute_single(struct rblist *metric_events, struct evlist *evlist, static double compute_single(struct rblist *metric_events, struct evlist *evlist,
struct runtime_stat *st, const char *name) const char *name)
{ {
struct metric_expr *mexp; struct metric_expr *mexp;
struct metric_event *me; struct metric_event *me;
@ -58,7 +57,7 @@ static double compute_single(struct rblist *metric_events, struct evlist *evlist
list_for_each_entry (mexp, &me->head, nd) { list_for_each_entry (mexp, &me->head, nd) {
if (strcmp(mexp->metric_name, name)) if (strcmp(mexp->metric_name, name))
continue; continue;
return test_generic_metric(mexp, 0, st); return test_generic_metric(mexp, 0);
} }
} }
} }
@ -74,7 +73,6 @@ static int __compute_metric(const char *name, struct value *vals,
}; };
const struct pmu_metrics_table *pme_test; const struct pmu_metrics_table *pme_test;
struct perf_cpu_map *cpus; struct perf_cpu_map *cpus;
struct runtime_stat st;
struct evlist *evlist; struct evlist *evlist;
int err; int err;
@ -93,7 +91,6 @@ static int __compute_metric(const char *name, struct value *vals,
} }
perf_evlist__set_maps(&evlist->core, cpus, NULL); perf_evlist__set_maps(&evlist->core, cpus, NULL);
runtime_stat__init(&st);
/* Parse the metric into metric_events list. */ /* Parse the metric into metric_events list. */
pme_test = find_core_metrics_table("testarch", "testcpu"); pme_test = find_core_metrics_table("testarch", "testcpu");
@ -107,18 +104,17 @@ static int __compute_metric(const char *name, struct value *vals,
goto out; goto out;
/* Load the runtime stats with given numbers for events. */ /* Load the runtime stats with given numbers for events. */
load_runtime_stat(&st, evlist, vals); load_runtime_stat(evlist, vals);
/* And execute the metric */ /* And execute the metric */
if (name1 && ratio1) if (name1 && ratio1)
*ratio1 = compute_single(&metric_events, evlist, &st, name1); *ratio1 = compute_single(&metric_events, evlist, name1);
if (name2 && ratio2) if (name2 && ratio2)
*ratio2 = compute_single(&metric_events, evlist, &st, name2); *ratio2 = compute_single(&metric_events, evlist, name2);
out: out:
/* ... cleanup. */ /* ... cleanup. */
metricgroup__rblist_exit(&metric_events); metricgroup__rblist_exit(&metric_events);
runtime_stat__exit(&st);
evlist__free_stats(evlist); evlist__free_stats(evlist);
perf_cpu_map__put(cpus); perf_cpu_map__put(cpus);
evlist__delete(evlist); evlist__delete(evlist);
@ -300,6 +296,7 @@ static int test_metric_group(void)
static int test__parse_metric(struct test_suite *test __maybe_unused, int subtest __maybe_unused) static int test__parse_metric(struct test_suite *test __maybe_unused, int subtest __maybe_unused)
{ {
perf_stat__init_shadow_stats();
TEST_ASSERT_VAL("IPC failed", test_ipc() == 0); TEST_ASSERT_VAL("IPC failed", test_ipc() == 0);
TEST_ASSERT_VAL("frontend failed", test_frontend() == 0); TEST_ASSERT_VAL("frontend failed", test_frontend() == 0);
TEST_ASSERT_VAL("DCache_L2 failed", test_dcache_l2() == 0); TEST_ASSERT_VAL("DCache_L2 failed", test_dcache_l2() == 0);

View File

@ -816,7 +816,6 @@ static int test__parsing_callback(const struct pmu_metric *pm,
int k; int k;
struct evlist *evlist; struct evlist *evlist;
struct perf_cpu_map *cpus; struct perf_cpu_map *cpus;
struct runtime_stat st;
struct evsel *evsel; struct evsel *evsel;
struct rblist metric_events = { struct rblist metric_events = {
.nr_entries = 0, .nr_entries = 0,
@ -844,7 +843,6 @@ static int test__parsing_callback(const struct pmu_metric *pm,
} }
perf_evlist__set_maps(&evlist->core, cpus, NULL); perf_evlist__set_maps(&evlist->core, cpus, NULL);
runtime_stat__init(&st);
err = metricgroup__parse_groups_test(evlist, table, pm->metric_name, &metric_events); err = metricgroup__parse_groups_test(evlist, table, pm->metric_name, &metric_events);
if (err) { if (err) {
@ -867,7 +865,7 @@ static int test__parsing_callback(const struct pmu_metric *pm,
k = 1; k = 1;
perf_stat__reset_shadow_stats(); perf_stat__reset_shadow_stats();
evlist__for_each_entry(evlist, evsel) { evlist__for_each_entry(evlist, evsel) {
perf_stat__update_shadow_stats(evsel, k, 0, &st); perf_stat__update_shadow_stats(evsel, k, 0);
if (!strcmp(evsel->name, "duration_time")) if (!strcmp(evsel->name, "duration_time"))
update_stats(&walltime_nsecs_stats, k); update_stats(&walltime_nsecs_stats, k);
k++; k++;
@ -881,7 +879,7 @@ static int test__parsing_callback(const struct pmu_metric *pm,
list_for_each_entry (mexp, &me->head, nd) { list_for_each_entry (mexp, &me->head, nd) {
if (strcmp(mexp->metric_name, pm->metric_name)) if (strcmp(mexp->metric_name, pm->metric_name))
continue; continue;
pr_debug("Result %f\n", test_generic_metric(mexp, 0, &st)); pr_debug("Result %f\n", test_generic_metric(mexp, 0));
err = 0; err = 0;
(*failures)--; (*failures)--;
goto out_err; goto out_err;
@ -896,7 +894,6 @@ static int test__parsing_callback(const struct pmu_metric *pm,
/* ... cleanup. */ /* ... cleanup. */
metricgroup__rblist_exit(&metric_events); metricgroup__rblist_exit(&metric_events);
runtime_stat__exit(&st);
evlist__free_stats(evlist); evlist__free_stats(evlist);
perf_cpu_map__put(cpus); perf_cpu_map__put(cpus);
evlist__delete(evlist); evlist__delete(evlist);
@ -908,6 +905,7 @@ static int test__parsing(struct test_suite *test __maybe_unused,
{ {
int failures = 0; int failures = 0;
perf_stat__init_shadow_stats();
pmu_for_each_core_metric(test__parsing_callback, &failures); pmu_for_each_core_metric(test__parsing_callback, &failures);
pmu_for_each_sys_metric(test__parsing_callback, &failures); pmu_for_each_sys_metric(test__parsing_callback, &failures);

View File

@ -729,7 +729,7 @@ static void printout(struct perf_stat_config *config, struct outstate *os,
if (ok) { if (ok) {
perf_stat__print_shadow_stats(config, counter, uval, map_idx, perf_stat__print_shadow_stats(config, counter, uval, map_idx,
&out, &config->metric_events, &rt_stat); &out, &config->metric_events);
} else { } else {
pm(config, os, /*color=*/NULL, /*format=*/NULL, /*unit=*/"", /*val=*/0); pm(config, os, /*color=*/NULL, /*format=*/NULL, /*unit=*/"", /*val=*/0);
} }
@ -1089,8 +1089,7 @@ static void print_metric_headers(struct perf_stat_config *config,
perf_stat__print_shadow_stats(config, counter, 0, perf_stat__print_shadow_stats(config, counter, 0,
0, 0,
&out, &out,
&config->metric_events, &config->metric_events);
&rt_stat);
} }
if (!config->json_output) if (!config->json_output)

View File

@ -25,10 +25,13 @@
* AGGR_THREAD: Not supported? * AGGR_THREAD: Not supported?
*/ */
struct runtime_stat rt_stat;
struct stats walltime_nsecs_stats; struct stats walltime_nsecs_stats;
struct rusage_stats ru_stats; struct rusage_stats ru_stats;
static struct runtime_stat {
struct rblist value_list;
} rt_stat;
enum { enum {
CTX_BIT_USER = 1 << 0, CTX_BIT_USER = 1 << 0,
CTX_BIT_KERNEL = 1 << 1, CTX_BIT_KERNEL = 1 << 1,
@ -125,7 +128,6 @@ static struct saved_value *saved_value_lookup(struct evsel *evsel,
bool create, bool create,
enum stat_type type, enum stat_type type,
int ctx, int ctx,
struct runtime_stat *st,
struct cgroup *cgrp) struct cgroup *cgrp)
{ {
struct rblist *rblist; struct rblist *rblist;
@ -138,7 +140,7 @@ static struct saved_value *saved_value_lookup(struct evsel *evsel,
.cgrp = cgrp, .cgrp = cgrp,
}; };
rblist = &st->value_list; rblist = &rt_stat.value_list;
/* don't use context info for clock events */ /* don't use context info for clock events */
if (type == STAT_NSECS) if (type == STAT_NSECS)
@ -156,9 +158,9 @@ static struct saved_value *saved_value_lookup(struct evsel *evsel,
return NULL; return NULL;
} }
void runtime_stat__init(struct runtime_stat *st) void perf_stat__init_shadow_stats(void)
{ {
struct rblist *rblist = &st->value_list; struct rblist *rblist = &rt_stat.value_list;
rblist__init(rblist); rblist__init(rblist);
rblist->node_cmp = saved_value_cmp; rblist->node_cmp = saved_value_cmp;
@ -166,16 +168,6 @@ void runtime_stat__init(struct runtime_stat *st)
rblist->node_delete = saved_value_delete; rblist->node_delete = saved_value_delete;
} }
void runtime_stat__exit(struct runtime_stat *st)
{
rblist__exit(&st->value_list);
}
void perf_stat__init_shadow_stats(void)
{
runtime_stat__init(&rt_stat);
}
static int evsel_context(struct evsel *evsel) static int evsel_context(struct evsel *evsel)
{ {
int ctx = 0; int ctx = 0;
@ -194,12 +186,12 @@ static int evsel_context(struct evsel *evsel)
return ctx; return ctx;
} }
static void reset_stat(struct runtime_stat *st) void perf_stat__reset_shadow_per_stat(void)
{ {
struct rblist *rblist; struct rblist *rblist;
struct rb_node *pos, *next; struct rb_node *pos, *next;
rblist = &st->value_list; rblist = &rt_stat.value_list;
next = rb_first_cached(&rblist->entries); next = rb_first_cached(&rblist->entries);
while (next) { while (next) {
pos = next; pos = next;
@ -212,28 +204,22 @@ static void reset_stat(struct runtime_stat *st)
void perf_stat__reset_shadow_stats(void) void perf_stat__reset_shadow_stats(void)
{ {
reset_stat(&rt_stat); perf_stat__reset_shadow_per_stat();
memset(&walltime_nsecs_stats, 0, sizeof(walltime_nsecs_stats)); memset(&walltime_nsecs_stats, 0, sizeof(walltime_nsecs_stats));
memset(&ru_stats, 0, sizeof(ru_stats)); memset(&ru_stats, 0, sizeof(ru_stats));
} }
void perf_stat__reset_shadow_per_stat(struct runtime_stat *st)
{
reset_stat(st);
}
struct runtime_stat_data { struct runtime_stat_data {
int ctx; int ctx;
struct cgroup *cgrp; struct cgroup *cgrp;
}; };
static void update_runtime_stat(struct runtime_stat *st, static void update_runtime_stat(enum stat_type type,
enum stat_type type,
int map_idx, u64 count, int map_idx, u64 count,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
struct saved_value *v = saved_value_lookup(NULL, map_idx, true, type, struct saved_value *v = saved_value_lookup(NULL, map_idx, true, type,
rsd->ctx, st, rsd->cgrp); rsd->ctx, rsd->cgrp);
if (v) if (v)
update_stats(&v->stats, count); update_stats(&v->stats, count);
@ -245,7 +231,7 @@ static void update_runtime_stat(struct runtime_stat *st,
* instruction rates, etc: * instruction rates, etc:
*/ */
void perf_stat__update_shadow_stats(struct evsel *counter, u64 count, void perf_stat__update_shadow_stats(struct evsel *counter, u64 count,
int map_idx, struct runtime_stat *st) int map_idx)
{ {
u64 count_ns = count; u64 count_ns = count;
struct saved_value *v; struct saved_value *v;
@ -253,43 +239,42 @@ void perf_stat__update_shadow_stats(struct evsel *counter, u64 count,
.ctx = evsel_context(counter), .ctx = evsel_context(counter),
.cgrp = counter->cgrp, .cgrp = counter->cgrp,
}; };
count *= counter->scale; count *= counter->scale;
if (evsel__is_clock(counter)) if (evsel__is_clock(counter))
update_runtime_stat(st, STAT_NSECS, map_idx, count_ns, &rsd); update_runtime_stat(STAT_NSECS, map_idx, count_ns, &rsd);
else if (evsel__match(counter, HARDWARE, HW_CPU_CYCLES)) else if (evsel__match(counter, HARDWARE, HW_CPU_CYCLES))
update_runtime_stat(st, STAT_CYCLES, map_idx, count, &rsd); update_runtime_stat(STAT_CYCLES, map_idx, count, &rsd);
else if (evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_FRONTEND)) else if (evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_FRONTEND))
update_runtime_stat(st, STAT_STALLED_CYCLES_FRONT, update_runtime_stat(STAT_STALLED_CYCLES_FRONT,
map_idx, count, &rsd); map_idx, count, &rsd);
else if (evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_BACKEND)) else if (evsel__match(counter, HARDWARE, HW_STALLED_CYCLES_BACKEND))
update_runtime_stat(st, STAT_STALLED_CYCLES_BACK, update_runtime_stat(STAT_STALLED_CYCLES_BACK,
map_idx, count, &rsd); map_idx, count, &rsd);
else if (evsel__match(counter, HARDWARE, HW_BRANCH_INSTRUCTIONS)) else if (evsel__match(counter, HARDWARE, HW_BRANCH_INSTRUCTIONS))
update_runtime_stat(st, STAT_BRANCHES, map_idx, count, &rsd); update_runtime_stat(STAT_BRANCHES, map_idx, count, &rsd);
else if (evsel__match(counter, HARDWARE, HW_CACHE_REFERENCES)) else if (evsel__match(counter, HARDWARE, HW_CACHE_REFERENCES))
update_runtime_stat(st, STAT_CACHEREFS, map_idx, count, &rsd); update_runtime_stat(STAT_CACHEREFS, map_idx, count, &rsd);
else if (evsel__match(counter, HW_CACHE, HW_CACHE_L1D)) else if (evsel__match(counter, HW_CACHE, HW_CACHE_L1D))
update_runtime_stat(st, STAT_L1_DCACHE, map_idx, count, &rsd); update_runtime_stat(STAT_L1_DCACHE, map_idx, count, &rsd);
else if (evsel__match(counter, HW_CACHE, HW_CACHE_L1I)) else if (evsel__match(counter, HW_CACHE, HW_CACHE_L1I))
update_runtime_stat(st, STAT_L1_ICACHE, map_idx, count, &rsd); update_runtime_stat(STAT_L1_ICACHE, map_idx, count, &rsd);
else if (evsel__match(counter, HW_CACHE, HW_CACHE_LL)) else if (evsel__match(counter, HW_CACHE, HW_CACHE_LL))
update_runtime_stat(st, STAT_LL_CACHE, map_idx, count, &rsd); update_runtime_stat(STAT_LL_CACHE, map_idx, count, &rsd);
else if (evsel__match(counter, HW_CACHE, HW_CACHE_DTLB)) else if (evsel__match(counter, HW_CACHE, HW_CACHE_DTLB))
update_runtime_stat(st, STAT_DTLB_CACHE, map_idx, count, &rsd); update_runtime_stat(STAT_DTLB_CACHE, map_idx, count, &rsd);
else if (evsel__match(counter, HW_CACHE, HW_CACHE_ITLB)) else if (evsel__match(counter, HW_CACHE, HW_CACHE_ITLB))
update_runtime_stat(st, STAT_ITLB_CACHE, map_idx, count, &rsd); update_runtime_stat(STAT_ITLB_CACHE, map_idx, count, &rsd);
if (counter->collect_stat) { if (counter->collect_stat) {
v = saved_value_lookup(counter, map_idx, true, STAT_NONE, 0, st, v = saved_value_lookup(counter, map_idx, true, STAT_NONE, 0,
rsd.cgrp); rsd.cgrp);
update_stats(&v->stats, count); update_stats(&v->stats, count);
if (counter->metric_leader) if (counter->metric_leader)
v->metric_total += count; v->metric_total += count;
} else if (counter->metric_leader && !counter->merged_stat) { } else if (counter->metric_leader && !counter->merged_stat) {
v = saved_value_lookup(counter->metric_leader, v = saved_value_lookup(counter->metric_leader,
map_idx, true, STAT_NONE, 0, st, rsd.cgrp); map_idx, true, STAT_NONE, 0, rsd.cgrp);
v->metric_total += count; v->metric_total += count;
v->metric_other++; v->metric_other++;
} }
@ -322,26 +307,24 @@ static const char *get_ratio_color(enum grc_type type, double ratio)
return color; return color;
} }
static double runtime_stat_avg(struct runtime_stat *st, static double runtime_stat_avg(enum stat_type type, int map_idx,
enum stat_type type, int map_idx,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
struct saved_value *v; struct saved_value *v;
v = saved_value_lookup(NULL, map_idx, false, type, rsd->ctx, st, rsd->cgrp); v = saved_value_lookup(NULL, map_idx, false, type, rsd->ctx, rsd->cgrp);
if (!v) if (!v)
return 0.0; return 0.0;
return avg_stats(&v->stats); return avg_stats(&v->stats);
} }
static double runtime_stat_n(struct runtime_stat *st, static double runtime_stat_n(enum stat_type type, int map_idx,
enum stat_type type, int map_idx,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
struct saved_value *v; struct saved_value *v;
v = saved_value_lookup(NULL, map_idx, false, type, rsd->ctx, st, rsd->cgrp); v = saved_value_lookup(NULL, map_idx, false, type, rsd->ctx, rsd->cgrp);
if (!v) if (!v)
return 0.0; return 0.0;
@ -351,13 +334,12 @@ static double runtime_stat_n(struct runtime_stat *st,
static void print_stalled_cycles_frontend(struct perf_stat_config *config, static void print_stalled_cycles_frontend(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_CYCLES, map_idx, rsd); total = runtime_stat_avg(STAT_CYCLES, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -374,13 +356,12 @@ static void print_stalled_cycles_frontend(struct perf_stat_config *config,
static void print_stalled_cycles_backend(struct perf_stat_config *config, static void print_stalled_cycles_backend(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_CYCLES, map_idx, rsd); total = runtime_stat_avg(STAT_CYCLES, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -393,13 +374,12 @@ static void print_stalled_cycles_backend(struct perf_stat_config *config,
static void print_branch_misses(struct perf_stat_config *config, static void print_branch_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_BRANCHES, map_idx, rsd); total = runtime_stat_avg(STAT_BRANCHES, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -412,13 +392,12 @@ static void print_branch_misses(struct perf_stat_config *config,
static void print_l1_dcache_misses(struct perf_stat_config *config, static void print_l1_dcache_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_L1_DCACHE, map_idx, rsd); total = runtime_stat_avg(STAT_L1_DCACHE, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -431,13 +410,12 @@ static void print_l1_dcache_misses(struct perf_stat_config *config,
static void print_l1_icache_misses(struct perf_stat_config *config, static void print_l1_icache_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_L1_ICACHE, map_idx, rsd); total = runtime_stat_avg(STAT_L1_ICACHE, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -449,13 +427,12 @@ static void print_l1_icache_misses(struct perf_stat_config *config,
static void print_dtlb_cache_misses(struct perf_stat_config *config, static void print_dtlb_cache_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_DTLB_CACHE, map_idx, rsd); total = runtime_stat_avg(STAT_DTLB_CACHE, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -467,13 +444,12 @@ static void print_dtlb_cache_misses(struct perf_stat_config *config,
static void print_itlb_cache_misses(struct perf_stat_config *config, static void print_itlb_cache_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_ITLB_CACHE, map_idx, rsd); total = runtime_stat_avg(STAT_ITLB_CACHE, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -485,13 +461,12 @@ static void print_itlb_cache_misses(struct perf_stat_config *config,
static void print_ll_cache_misses(struct perf_stat_config *config, static void print_ll_cache_misses(struct perf_stat_config *config,
int map_idx, double avg, int map_idx, double avg,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct runtime_stat *st,
struct runtime_stat_data *rsd) struct runtime_stat_data *rsd)
{ {
double total, ratio = 0.0; double total, ratio = 0.0;
const char *color; const char *color;
total = runtime_stat_avg(st, STAT_LL_CACHE, map_idx, rsd); total = runtime_stat_avg(STAT_LL_CACHE, map_idx, rsd);
if (total) if (total)
ratio = avg / total * 100.0; ratio = avg / total * 100.0;
@ -503,8 +478,7 @@ static void print_ll_cache_misses(struct perf_stat_config *config,
static int prepare_metric(struct evsel **metric_events, static int prepare_metric(struct evsel **metric_events,
struct metric_ref *metric_refs, struct metric_ref *metric_refs,
struct expr_parse_ctx *pctx, struct expr_parse_ctx *pctx,
int map_idx, int map_idx)
struct runtime_stat *st)
{ {
double scale; double scale;
char *n; char *n;
@ -543,7 +517,7 @@ static int prepare_metric(struct evsel **metric_events,
} }
} else { } else {
v = saved_value_lookup(metric_events[i], map_idx, false, v = saved_value_lookup(metric_events[i], map_idx, false,
STAT_NONE, 0, st, STAT_NONE, 0,
metric_events[i]->cgrp); metric_events[i]->cgrp);
if (!v) if (!v)
break; break;
@ -587,8 +561,7 @@ static void generic_metric(struct perf_stat_config *config,
const char *metric_unit, const char *metric_unit,
int runtime, int runtime,
int map_idx, int map_idx,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out)
struct runtime_stat *st)
{ {
print_metric_t print_metric = out->print_metric; print_metric_t print_metric = out->print_metric;
struct expr_parse_ctx *pctx; struct expr_parse_ctx *pctx;
@ -605,7 +578,7 @@ static void generic_metric(struct perf_stat_config *config,
pctx->sctx.user_requested_cpu_list = strdup(config->user_requested_cpu_list); pctx->sctx.user_requested_cpu_list = strdup(config->user_requested_cpu_list);
pctx->sctx.runtime = runtime; pctx->sctx.runtime = runtime;
pctx->sctx.system_wide = config->system_wide; pctx->sctx.system_wide = config->system_wide;
i = prepare_metric(metric_events, metric_refs, pctx, map_idx, st); i = prepare_metric(metric_events, metric_refs, pctx, map_idx);
if (i < 0) { if (i < 0) {
expr__ctx_free(pctx); expr__ctx_free(pctx);
return; return;
@ -657,7 +630,7 @@ static void generic_metric(struct perf_stat_config *config,
expr__ctx_free(pctx); expr__ctx_free(pctx);
} }
double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime_stat *st) double test_generic_metric(struct metric_expr *mexp, int map_idx)
{ {
struct expr_parse_ctx *pctx; struct expr_parse_ctx *pctx;
double ratio = 0.0; double ratio = 0.0;
@ -666,7 +639,7 @@ double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime
if (!pctx) if (!pctx)
return NAN; return NAN;
if (prepare_metric(mexp->metric_events, mexp->metric_refs, pctx, map_idx, st) < 0) if (prepare_metric(mexp->metric_events, mexp->metric_refs, pctx, map_idx) < 0)
goto out; goto out;
if (expr__parse(&ratio, pctx, mexp->metric_expr)) if (expr__parse(&ratio, pctx, mexp->metric_expr))
@ -681,8 +654,7 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
struct evsel *evsel, struct evsel *evsel,
double avg, int map_idx, double avg, int map_idx,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct rblist *metric_events, struct rblist *metric_events)
struct runtime_stat *st)
{ {
void *ctxp = out->ctx; void *ctxp = out->ctx;
print_metric_t print_metric = out->print_metric; print_metric_t print_metric = out->print_metric;
@ -697,7 +669,7 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
if (config->iostat_run) { if (config->iostat_run) {
iostat_print_metric(config, evsel, out); iostat_print_metric(config, evsel, out);
} else if (evsel__match(evsel, HARDWARE, HW_INSTRUCTIONS)) { } else if (evsel__match(evsel, HARDWARE, HW_INSTRUCTIONS)) {
total = runtime_stat_avg(st, STAT_CYCLES, map_idx, &rsd); total = runtime_stat_avg(STAT_CYCLES, map_idx, &rsd);
if (total) { if (total) {
ratio = avg / total; ratio = avg / total;
@ -707,10 +679,9 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
print_metric(config, ctxp, NULL, NULL, "insn per cycle", 0); print_metric(config, ctxp, NULL, NULL, "insn per cycle", 0);
} }
total = runtime_stat_avg(st, STAT_STALLED_CYCLES_FRONT, map_idx, &rsd); total = runtime_stat_avg(STAT_STALLED_CYCLES_FRONT, map_idx, &rsd);
total = max(total, runtime_stat_avg(st, total = max(total, runtime_stat_avg(STAT_STALLED_CYCLES_BACK,
STAT_STALLED_CYCLES_BACK,
map_idx, &rsd)); map_idx, &rsd));
if (total && avg) { if (total && avg) {
@ -721,8 +692,8 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
ratio); ratio);
} }
} else if (evsel__match(evsel, HARDWARE, HW_BRANCH_MISSES)) { } else if (evsel__match(evsel, HARDWARE, HW_BRANCH_MISSES)) {
if (runtime_stat_n(st, STAT_BRANCHES, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_BRANCHES, map_idx, &rsd) != 0)
print_branch_misses(config, map_idx, avg, out, st, &rsd); print_branch_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all branches", 0); print_metric(config, ctxp, NULL, NULL, "of all branches", 0);
} else if ( } else if (
@ -731,8 +702,8 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
((PERF_COUNT_HW_CACHE_OP_READ) << 8) | ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) { ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) {
if (runtime_stat_n(st, STAT_L1_DCACHE, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_L1_DCACHE, map_idx, &rsd) != 0)
print_l1_dcache_misses(config, map_idx, avg, out, st, &rsd); print_l1_dcache_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all L1-dcache accesses", 0); print_metric(config, ctxp, NULL, NULL, "of all L1-dcache accesses", 0);
} else if ( } else if (
@ -741,8 +712,8 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
((PERF_COUNT_HW_CACHE_OP_READ) << 8) | ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) { ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) {
if (runtime_stat_n(st, STAT_L1_ICACHE, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_L1_ICACHE, map_idx, &rsd) != 0)
print_l1_icache_misses(config, map_idx, avg, out, st, &rsd); print_l1_icache_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all L1-icache accesses", 0); print_metric(config, ctxp, NULL, NULL, "of all L1-icache accesses", 0);
} else if ( } else if (
@ -751,8 +722,8 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
((PERF_COUNT_HW_CACHE_OP_READ) << 8) | ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) { ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) {
if (runtime_stat_n(st, STAT_DTLB_CACHE, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_DTLB_CACHE, map_idx, &rsd) != 0)
print_dtlb_cache_misses(config, map_idx, avg, out, st, &rsd); print_dtlb_cache_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all dTLB cache accesses", 0); print_metric(config, ctxp, NULL, NULL, "of all dTLB cache accesses", 0);
} else if ( } else if (
@ -761,8 +732,8 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
((PERF_COUNT_HW_CACHE_OP_READ) << 8) | ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) { ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) {
if (runtime_stat_n(st, STAT_ITLB_CACHE, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_ITLB_CACHE, map_idx, &rsd) != 0)
print_itlb_cache_misses(config, map_idx, avg, out, st, &rsd); print_itlb_cache_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all iTLB cache accesses", 0); print_metric(config, ctxp, NULL, NULL, "of all iTLB cache accesses", 0);
} else if ( } else if (
@ -771,27 +742,27 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
((PERF_COUNT_HW_CACHE_OP_READ) << 8) | ((PERF_COUNT_HW_CACHE_OP_READ) << 8) |
((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) { ((PERF_COUNT_HW_CACHE_RESULT_MISS) << 16))) {
if (runtime_stat_n(st, STAT_LL_CACHE, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_LL_CACHE, map_idx, &rsd) != 0)
print_ll_cache_misses(config, map_idx, avg, out, st, &rsd); print_ll_cache_misses(config, map_idx, avg, out, &rsd);
else else
print_metric(config, ctxp, NULL, NULL, "of all LL-cache accesses", 0); print_metric(config, ctxp, NULL, NULL, "of all LL-cache accesses", 0);
} else if (evsel__match(evsel, HARDWARE, HW_CACHE_MISSES)) { } else if (evsel__match(evsel, HARDWARE, HW_CACHE_MISSES)) {
total = runtime_stat_avg(st, STAT_CACHEREFS, map_idx, &rsd); total = runtime_stat_avg(STAT_CACHEREFS, map_idx, &rsd);
if (total) if (total)
ratio = avg * 100 / total; ratio = avg * 100 / total;
if (runtime_stat_n(st, STAT_CACHEREFS, map_idx, &rsd) != 0) if (runtime_stat_n(STAT_CACHEREFS, map_idx, &rsd) != 0)
print_metric(config, ctxp, NULL, "%8.3f %%", print_metric(config, ctxp, NULL, "%8.3f %%",
"of all cache refs", ratio); "of all cache refs", ratio);
else else
print_metric(config, ctxp, NULL, NULL, "of all cache refs", 0); print_metric(config, ctxp, NULL, NULL, "of all cache refs", 0);
} else if (evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_FRONTEND)) { } else if (evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_FRONTEND)) {
print_stalled_cycles_frontend(config, map_idx, avg, out, st, &rsd); print_stalled_cycles_frontend(config, map_idx, avg, out, &rsd);
} else if (evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_BACKEND)) { } else if (evsel__match(evsel, HARDWARE, HW_STALLED_CYCLES_BACKEND)) {
print_stalled_cycles_backend(config, map_idx, avg, out, st, &rsd); print_stalled_cycles_backend(config, map_idx, avg, out, &rsd);
} else if (evsel__match(evsel, HARDWARE, HW_CPU_CYCLES)) { } else if (evsel__match(evsel, HARDWARE, HW_CPU_CYCLES)) {
total = runtime_stat_avg(st, STAT_NSECS, map_idx, &rsd); total = runtime_stat_avg(STAT_NSECS, map_idx, &rsd);
if (total) { if (total) {
ratio = avg / total; ratio = avg / total;
@ -805,11 +776,11 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
avg / (ratio * evsel->scale)); avg / (ratio * evsel->scale));
else else
print_metric(config, ctxp, NULL, NULL, "CPUs utilized", 0); print_metric(config, ctxp, NULL, NULL, "CPUs utilized", 0);
} else if (runtime_stat_n(st, STAT_NSECS, map_idx, &rsd) != 0) { } else if (runtime_stat_n(STAT_NSECS, map_idx, &rsd) != 0) {
char unit = ' '; char unit = ' ';
char unit_buf[10] = "/sec"; char unit_buf[10] = "/sec";
total = runtime_stat_avg(st, STAT_NSECS, map_idx, &rsd); total = runtime_stat_avg(STAT_NSECS, map_idx, &rsd);
if (total) if (total)
ratio = convert_unit_double(1000000000.0 * avg / total, &unit); ratio = convert_unit_double(1000000000.0 * avg / total, &unit);
@ -829,7 +800,7 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
generic_metric(config, mexp->metric_expr, mexp->metric_threshold, generic_metric(config, mexp->metric_expr, mexp->metric_threshold,
mexp->metric_events, mexp->metric_refs, evsel->name, mexp->metric_events, mexp->metric_refs, evsel->name,
mexp->metric_name, mexp->metric_unit, mexp->runtime, mexp->metric_name, mexp->metric_unit, mexp->runtime,
map_idx, out, st); map_idx, out);
} }
} }
if (num == 0) if (num == 0)

View File

@ -659,7 +659,7 @@ static void evsel__update_shadow_stats(struct evsel *evsel)
for (i = 0; i < ps->nr_aggr; i++) { for (i = 0; i < ps->nr_aggr; i++) {
struct perf_counts_values *aggr_counts = &ps->aggr[i].counts; struct perf_counts_values *aggr_counts = &ps->aggr[i].counts;
perf_stat__update_shadow_stats(evsel, aggr_counts->val, i, &rt_stat); perf_stat__update_shadow_stats(evsel, aggr_counts->val, i);
} }
} }

View File

@ -55,10 +55,6 @@ enum aggr_mode {
AGGR_MAX AGGR_MAX
}; };
struct runtime_stat {
struct rblist value_list;
};
struct rusage_stats { struct rusage_stats {
struct stats ru_utime_usec_stat; struct stats ru_utime_usec_stat;
struct stats ru_stime_usec_stat; struct stats ru_stime_usec_stat;
@ -153,7 +149,6 @@ static inline void update_rusage_stats(struct rusage_stats *ru_stats, struct rus
struct evsel; struct evsel;
struct evlist; struct evlist;
extern struct runtime_stat rt_stat;
extern struct stats walltime_nsecs_stats; extern struct stats walltime_nsecs_stats;
extern struct rusage_stats ru_stats; extern struct rusage_stats ru_stats;
@ -162,13 +157,10 @@ typedef void (*print_metric_t)(struct perf_stat_config *config,
const char *fmt, double val); const char *fmt, double val);
typedef void (*new_line_t)(struct perf_stat_config *config, void *ctx); typedef void (*new_line_t)(struct perf_stat_config *config, void *ctx);
void runtime_stat__init(struct runtime_stat *st);
void runtime_stat__exit(struct runtime_stat *st);
void perf_stat__init_shadow_stats(void); void perf_stat__init_shadow_stats(void);
void perf_stat__reset_shadow_stats(void); void perf_stat__reset_shadow_stats(void);
void perf_stat__reset_shadow_per_stat(struct runtime_stat *st); void perf_stat__reset_shadow_per_stat(void);
void perf_stat__update_shadow_stats(struct evsel *counter, u64 count, void perf_stat__update_shadow_stats(struct evsel *counter, u64 count, int map_idx);
int map_idx, struct runtime_stat *st);
struct perf_stat_output_ctx { struct perf_stat_output_ctx {
void *ctx; void *ctx;
print_metric_t print_metric; print_metric_t print_metric;
@ -180,8 +172,7 @@ void perf_stat__print_shadow_stats(struct perf_stat_config *config,
struct evsel *evsel, struct evsel *evsel,
double avg, int map_idx, double avg, int map_idx,
struct perf_stat_output_ctx *out, struct perf_stat_output_ctx *out,
struct rblist *metric_events, struct rblist *metric_events);
struct runtime_stat *st);
int evlist__alloc_stats(struct perf_stat_config *config, int evlist__alloc_stats(struct perf_stat_config *config,
struct evlist *evlist, bool alloc_raw); struct evlist *evlist, bool alloc_raw);
@ -220,5 +211,5 @@ void evlist__print_counters(struct evlist *evlist, struct perf_stat_config *conf
struct target *_target, struct timespec *ts, int argc, const char **argv); struct target *_target, struct timespec *ts, int argc, const char **argv);
struct metric_expr; struct metric_expr;
double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime_stat *st); double test_generic_metric(struct metric_expr *mexp, int map_idx);
#endif #endif