Commit 1cac7b1a authored by Peter Zijlstra's avatar Peter Zijlstra Committed by Ingo Molnar

perf/core: Fix event schedule order

Scheduling in events with cpu=-1 before events with cpu=# changes
semantics and is undesirable in that it would priorize these events.

Given that groups->index is across all groups we actually have an
inter-group ordering, meaning we can merge-sort two groups, which is
just what we need to preserve semantics.
Signed-off-by: default avatarPeter Zijlstra (Intel) <peterz@infradead.org>
Acked-by: default avatarMark Rutland <mark.rutland@arm.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Alexey Budankov <alexey.budankov@linux.intel.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: David Carrillo-Cisneros <davidcc@google.com>
Cc: Dmitri Prokhorov <Dmitry.Prohorov@intel.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Kan Liang <kan.liang@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Stephane Eranian <eranian@google.com>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Valery Cherepennikov <valery.cherepennikov@intel.com>
Cc: Vince Weaver <vincent.weaver@maine.edu>
Cc: linux-kernel@vger.kernel.org
Signed-off-by: default avatarIngo Molnar <mingo@kernel.org>
parent 161c85fa
...@@ -1608,6 +1608,21 @@ perf_event_groups_first(struct perf_event_groups *groups, int cpu) ...@@ -1608,6 +1608,21 @@ perf_event_groups_first(struct perf_event_groups *groups, int cpu)
return match; return match;
} }
/*
* Like rb_entry_next_safe() for the @cpu subtree.
*/
static struct perf_event *
perf_event_groups_next(struct perf_event *event)
{
struct perf_event *next;
next = rb_entry_safe(rb_next(&event->group_node), typeof(*event), group_node);
if (next && next->cpu == event->cpu)
return next;
return NULL;
}
/* /*
* Rotate the @cpu subtree. * Rotate the @cpu subtree.
* *
...@@ -2354,22 +2369,6 @@ static int group_can_go_on(struct perf_event *event, ...@@ -2354,22 +2369,6 @@ static int group_can_go_on(struct perf_event *event,
return can_add_hw; return can_add_hw;
} }
static int
flexible_group_sched_in(struct perf_event *event,
struct perf_event_context *ctx,
struct perf_cpu_context *cpuctx,
int *can_add_hw)
{
if (event->state <= PERF_EVENT_STATE_OFF || !event_filter_match(event))
return 0;
if (group_can_go_on(event, cpuctx, *can_add_hw))
if (group_sched_in(event, cpuctx, ctx))
*can_add_hw = 0;
return 1;
}
static void add_event_to_ctx(struct perf_event *event, static void add_event_to_ctx(struct perf_event *event,
struct perf_event_context *ctx) struct perf_event_context *ctx)
{ {
...@@ -3185,52 +3184,112 @@ static void cpu_ctx_sched_out(struct perf_cpu_context *cpuctx, ...@@ -3185,52 +3184,112 @@ static void cpu_ctx_sched_out(struct perf_cpu_context *cpuctx,
ctx_sched_out(&cpuctx->ctx, cpuctx, event_type); ctx_sched_out(&cpuctx->ctx, cpuctx, event_type);
} }
static void static int visit_groups_merge(struct perf_event_groups *groups, int cpu,
ctx_pinned_sched_in(struct perf_event_context *ctx, int (*func)(struct perf_event *, void *), void *data)
struct perf_cpu_context *cpuctx)
{ {
int sw = -1, cpu = smp_processor_id(); struct perf_event **evt, *evt1, *evt2;
struct perf_event *event; int ret;
int can_add_hw;
perf_event_groups_for_each_cpu(event, sw, evt1 = perf_event_groups_first(groups, -1);
&ctx->pinned_groups, group_node) { evt2 = perf_event_groups_first(groups, cpu);
can_add_hw = 1;
if (flexible_group_sched_in(event, ctx, cpuctx, &can_add_hw)) { while (evt1 || evt2) {
if (event->state == PERF_EVENT_STATE_INACTIVE) if (evt1 && evt2) {
perf_event_set_state(event, if (evt1->group_index < evt2->group_index)
PERF_EVENT_STATE_ERROR); evt = &evt1;
else
evt = &evt2;
} else if (evt1) {
evt = &evt1;
} else {
evt = &evt2;
} }
ret = func(*evt, data);
if (ret)
return ret;
*evt = perf_event_groups_next(*evt);
} }
perf_event_groups_for_each_cpu(event, cpu, return 0;
&ctx->pinned_groups, group_node) { }
can_add_hw = 1;
if (flexible_group_sched_in(event, ctx, cpuctx, &can_add_hw)) { struct sched_in_data {
struct perf_event_context *ctx;
struct perf_cpu_context *cpuctx;
int can_add_hw;
};
static int pinned_sched_in(struct perf_event *event, void *data)
{
struct sched_in_data *sid = data;
if (event->state <= PERF_EVENT_STATE_OFF)
return 0;
if (!event_filter_match(event))
return 0;
if (group_can_go_on(event, sid->cpuctx, sid->can_add_hw))
group_sched_in(event, sid->cpuctx, sid->ctx);
/*
* If this pinned group hasn't been scheduled,
* put it in error state.
*/
if (event->state == PERF_EVENT_STATE_INACTIVE) if (event->state == PERF_EVENT_STATE_INACTIVE)
perf_event_set_state(event, perf_event_set_state(event, PERF_EVENT_STATE_ERROR);
PERF_EVENT_STATE_ERROR);
} return 0;
}
static int flexible_sched_in(struct perf_event *event, void *data)
{
struct sched_in_data *sid = data;
if (event->state <= PERF_EVENT_STATE_OFF)
return 0;
if (!event_filter_match(event))
return 0;
if (group_can_go_on(event, sid->cpuctx, sid->can_add_hw)) {
if (group_sched_in(event, sid->cpuctx, sid->ctx))
sid->can_add_hw = 0;
} }
return 0;
} }
static void static void
ctx_flexible_sched_in(struct perf_event_context *ctx, ctx_pinned_sched_in(struct perf_event_context *ctx,
struct perf_cpu_context *cpuctx) struct perf_cpu_context *cpuctx)
{ {
int sw = -1, cpu = smp_processor_id(); struct sched_in_data sid = {
struct perf_event *event; .ctx = ctx,
int can_add_hw = 1; .cpuctx = cpuctx,
.can_add_hw = 1,
};
perf_event_groups_for_each_cpu(event, sw, visit_groups_merge(&ctx->pinned_groups,
&ctx->flexible_groups, group_node) smp_processor_id(),
flexible_group_sched_in(event, ctx, cpuctx, &can_add_hw); pinned_sched_in, &sid);
}
can_add_hw = 1; static void
perf_event_groups_for_each_cpu(event, cpu, ctx_flexible_sched_in(struct perf_event_context *ctx,
&ctx->flexible_groups, group_node) struct perf_cpu_context *cpuctx)
flexible_group_sched_in(event, ctx, cpuctx, &can_add_hw); {
struct sched_in_data sid = {
.ctx = ctx,
.cpuctx = cpuctx,
.can_add_hw = 1,
};
visit_groups_merge(&ctx->flexible_groups,
smp_processor_id(),
flexible_sched_in, &sid);
} }
static void static void
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment