Commit 810b7ee3 authored by Chris Wilson

drm/i915/gt: Always report the sample time for busy-stats

Return the monotonic timestamp (ktime_get()) at the time of sampling the
busy-time. This is used in preference to taking ktime_get() separately
before or after the read seqlock as there can be some large variance in
reported timestamps. For selftests trying to ascertain that we are
reporting accurately to within a few microseconds, even a small delay
leads to the test failing.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20200617130916.15261-2-chris@chris-wilson.co.uk
parent 1b90e4a4
...@@ -334,7 +334,8 @@ void intel_engine_dump(struct intel_engine_cs *engine, ...@@ -334,7 +334,8 @@ void intel_engine_dump(struct intel_engine_cs *engine,
struct drm_printer *m, struct drm_printer *m,
const char *header, ...); const char *header, ...);
ktime_t intel_engine_get_busy_time(struct intel_engine_cs *engine); ktime_t intel_engine_get_busy_time(struct intel_engine_cs *engine,
ktime_t *now);
struct i915_request * struct i915_request *
intel_engine_find_active_request(struct intel_engine_cs *engine); intel_engine_find_active_request(struct intel_engine_cs *engine);
......
...@@ -1595,7 +1595,8 @@ void intel_engine_dump(struct intel_engine_cs *engine, ...@@ -1595,7 +1595,8 @@ void intel_engine_dump(struct intel_engine_cs *engine,
intel_engine_print_breadcrumbs(engine, m); intel_engine_print_breadcrumbs(engine, m);
} }
static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine) static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine,
ktime_t *now)
{ {
ktime_t total = engine->stats.total; ktime_t total = engine->stats.total;
...@@ -1603,9 +1604,9 @@ static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine) ...@@ -1603,9 +1604,9 @@ static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine)
* If the engine is executing something at the moment * If the engine is executing something at the moment
* add it to the total. * add it to the total.
*/ */
*now = ktime_get();
if (atomic_read(&engine->stats.active)) if (atomic_read(&engine->stats.active))
total = ktime_add(total, total = ktime_add(total, ktime_sub(*now, engine->stats.start));
ktime_sub(ktime_get(), engine->stats.start));
return total; return total;
} }
...@@ -1613,17 +1614,18 @@ static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine) ...@@ -1613,17 +1614,18 @@ static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine)
/** /**
* intel_engine_get_busy_time() - Return current accumulated engine busyness * intel_engine_get_busy_time() - Return current accumulated engine busyness
* @engine: engine to report on * @engine: engine to report on
* @now: monotonic timestamp of sampling
* *
* Returns accumulated time @engine was busy since engine stats were enabled. * Returns accumulated time @engine was busy since engine stats were enabled.
*/ */
ktime_t intel_engine_get_busy_time(struct intel_engine_cs *engine) ktime_t intel_engine_get_busy_time(struct intel_engine_cs *engine, ktime_t *now)
{ {
unsigned int seq; unsigned int seq;
ktime_t total; ktime_t total;
do { do {
seq = read_seqbegin(&engine->stats.lock); seq = read_seqbegin(&engine->stats.lock);
total = __intel_engine_get_busy_time(engine); total = __intel_engine_get_busy_time(engine, now);
} while (read_seqretry(&engine->stats.lock, seq)); } while (read_seqretry(&engine->stats.lock, seq));
return total; return total;
......
...@@ -53,13 +53,13 @@ static void rps_timer(struct timer_list *t) ...@@ -53,13 +53,13 @@ static void rps_timer(struct timer_list *t)
struct intel_engine_cs *engine; struct intel_engine_cs *engine;
enum intel_engine_id id; enum intel_engine_id id;
s64 max_busy[3] = {}; s64 max_busy[3] = {};
ktime_t dt, last; ktime_t dt, timestamp, last;
for_each_engine(engine, rps_to_gt(rps), id) { for_each_engine(engine, rps_to_gt(rps), id) {
s64 busy; s64 busy;
int i; int i;
dt = intel_engine_get_busy_time(engine); dt = intel_engine_get_busy_time(engine, &timestamp);
last = engine->stats.rps; last = engine->stats.rps;
engine->stats.rps = dt; engine->stats.rps = dt;
...@@ -70,15 +70,14 @@ static void rps_timer(struct timer_list *t) ...@@ -70,15 +70,14 @@ static void rps_timer(struct timer_list *t)
} }
} }
dt = ktime_get();
last = rps->pm_timestamp; last = rps->pm_timestamp;
rps->pm_timestamp = dt; rps->pm_timestamp = timestamp;
if (intel_rps_is_active(rps)) { if (intel_rps_is_active(rps)) {
s64 busy; s64 busy;
int i; int i;
dt = ktime_sub(dt, last); dt = ktime_sub(timestamp, last);
/* /*
* Our goal is to evaluate each engine independently, so we run * Our goal is to evaluate each engine independently, so we run
......
...@@ -29,8 +29,8 @@ static int live_engine_busy_stats(void *arg) ...@@ -29,8 +29,8 @@ static int live_engine_busy_stats(void *arg)
GEM_BUG_ON(intel_gt_pm_is_awake(gt)); GEM_BUG_ON(intel_gt_pm_is_awake(gt));
for_each_engine(engine, gt, id) { for_each_engine(engine, gt, id) {
struct i915_request *rq; struct i915_request *rq;
ktime_t de; ktime_t de, dt;
u64 dt; ktime_t t[2];
if (!intel_engine_supports_stats(engine)) if (!intel_engine_supports_stats(engine))
continue; continue;
...@@ -47,12 +47,11 @@ static int live_engine_busy_stats(void *arg) ...@@ -47,12 +47,11 @@ static int live_engine_busy_stats(void *arg)
ENGINE_TRACE(engine, "measuring idle time\n"); ENGINE_TRACE(engine, "measuring idle time\n");
preempt_disable(); preempt_disable();
dt = ktime_to_ns(ktime_get()); de = intel_engine_get_busy_time(engine, &t[0]);
de = intel_engine_get_busy_time(engine);
udelay(100); udelay(100);
de = ktime_sub(intel_engine_get_busy_time(engine), de); de = ktime_sub(intel_engine_get_busy_time(engine, &t[1]), de);
dt = ktime_to_ns(ktime_get()) - dt;
preempt_enable(); preempt_enable();
dt = ktime_sub(t[1], t[0]);
if (de < 0 || de > 10) { if (de < 0 || de > 10) {
pr_err("%s: reported %lldns [%d%%] busyness while sleeping [for %lldns]\n", pr_err("%s: reported %lldns [%d%%] busyness while sleeping [for %lldns]\n",
engine->name, engine->name,
...@@ -80,12 +79,11 @@ static int live_engine_busy_stats(void *arg) ...@@ -80,12 +79,11 @@ static int live_engine_busy_stats(void *arg)
ENGINE_TRACE(engine, "measuring busy time\n"); ENGINE_TRACE(engine, "measuring busy time\n");
preempt_disable(); preempt_disable();
dt = ktime_to_ns(ktime_get()); de = intel_engine_get_busy_time(engine, &t[0]);
de = intel_engine_get_busy_time(engine);
udelay(100); udelay(100);
de = ktime_sub(intel_engine_get_busy_time(engine), de); de = ktime_sub(intel_engine_get_busy_time(engine, &t[1]), de);
dt = ktime_to_ns(ktime_get()) - dt;
preempt_enable(); preempt_enable();
dt = ktime_sub(t[1], t[0]);
if (100 * de < 95 * dt || 95 * de > 100 * dt) { if (100 * de < 95 * dt || 95 * de > 100 * dt) {
pr_err("%s: reported %lldns [%d%%] busyness while spinning [for %lldns]\n", pr_err("%s: reported %lldns [%d%%] busyness while spinning [for %lldns]\n",
engine->name, engine->name,
......
...@@ -565,7 +565,10 @@ static u64 __i915_pmu_event_read(struct perf_event *event) ...@@ -565,7 +565,10 @@ static u64 __i915_pmu_event_read(struct perf_event *event)
/* Do nothing */ /* Do nothing */
} else if (sample == I915_SAMPLE_BUSY && } else if (sample == I915_SAMPLE_BUSY &&
intel_engine_supports_stats(engine)) { intel_engine_supports_stats(engine)) {
val = ktime_to_ns(intel_engine_get_busy_time(engine)); ktime_t unused;
val = ktime_to_ns(intel_engine_get_busy_time(engine,
&unused));
} else { } else {
val = engine->pmu.sample[sample].cur; val = engine->pmu.sample[sample].cur;
} }
......
...@@ -2492,9 +2492,11 @@ static int perf_series_engines(void *arg) ...@@ -2492,9 +2492,11 @@ static int perf_series_engines(void *arg)
intel_engine_pm_get(p->engine); intel_engine_pm_get(p->engine);
if (intel_engine_supports_stats(p->engine)) if (intel_engine_supports_stats(p->engine))
p->busy = intel_engine_get_busy_time(p->engine) + 1; p->busy = intel_engine_get_busy_time(p->engine,
p->runtime = -intel_context_get_total_runtime_ns(ce); &p->time) + 1;
else
p->time = ktime_get(); p->time = ktime_get();
p->runtime = -intel_context_get_total_runtime_ns(ce);
} }
err = (*fn)(ps); err = (*fn)(ps);
...@@ -2505,13 +2507,15 @@ static int perf_series_engines(void *arg) ...@@ -2505,13 +2507,15 @@ static int perf_series_engines(void *arg)
struct perf_stats *p = &stats[idx]; struct perf_stats *p = &stats[idx];
struct intel_context *ce = ps->ce[idx]; struct intel_context *ce = ps->ce[idx];
int integer, decimal; int integer, decimal;
u64 busy, dt; u64 busy, dt, now;
p->time = ktime_sub(ktime_get(), p->time); if (p->busy)
if (p->busy) { p->busy = ktime_sub(intel_engine_get_busy_time(p->engine,
p->busy = ktime_sub(intel_engine_get_busy_time(p->engine), &now),
p->busy - 1); p->busy - 1);
} else
now = ktime_get();
p->time = ktime_sub(now, p->time);
err = switch_to_kernel_sync(ce, err); err = switch_to_kernel_sync(ce, err);
p->runtime += intel_context_get_total_runtime_ns(ce); p->runtime += intel_context_get_total_runtime_ns(ce);
...@@ -2571,13 +2575,14 @@ static int p_sync0(void *arg) ...@@ -2571,13 +2575,14 @@ static int p_sync0(void *arg)
return err; return err;
} }
busy = false;
if (intel_engine_supports_stats(engine)) { if (intel_engine_supports_stats(engine)) {
p->busy = intel_engine_get_busy_time(engine); p->busy = intel_engine_get_busy_time(engine, &p->time);
busy = true; busy = true;
} else {
p->time = ktime_get();
busy = false;
} }
p->time = ktime_get();
count = 0; count = 0;
do { do {
struct i915_request *rq; struct i915_request *rq;
...@@ -2600,11 +2605,15 @@ static int p_sync0(void *arg) ...@@ -2600,11 +2605,15 @@ static int p_sync0(void *arg)
count++; count++;
} while (!__igt_timeout(end_time, NULL)); } while (!__igt_timeout(end_time, NULL));
p->time = ktime_sub(ktime_get(), p->time);
if (busy) { if (busy) {
p->busy = ktime_sub(intel_engine_get_busy_time(engine), ktime_t now;
p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
p->busy); p->busy);
p->time = ktime_sub(now, p->time);
} else {
p->time = ktime_sub(ktime_get(), p->time);
} }
err = switch_to_kernel_sync(ce, err); err = switch_to_kernel_sync(ce, err);
...@@ -2637,13 +2646,14 @@ static int p_sync1(void *arg) ...@@ -2637,13 +2646,14 @@ static int p_sync1(void *arg)
return err; return err;
} }
busy = false;
if (intel_engine_supports_stats(engine)) { if (intel_engine_supports_stats(engine)) {
p->busy = intel_engine_get_busy_time(engine); p->busy = intel_engine_get_busy_time(engine, &p->time);
busy = true; busy = true;
} else {
p->time = ktime_get();
busy = false;
} }
p->time = ktime_get();
count = 0; count = 0;
do { do {
struct i915_request *rq; struct i915_request *rq;
...@@ -2668,11 +2678,15 @@ static int p_sync1(void *arg) ...@@ -2668,11 +2678,15 @@ static int p_sync1(void *arg)
count++; count++;
} while (!__igt_timeout(end_time, NULL)); } while (!__igt_timeout(end_time, NULL));
i915_request_put(prev); i915_request_put(prev);
p->time = ktime_sub(ktime_get(), p->time);
if (busy) { if (busy) {
p->busy = ktime_sub(intel_engine_get_busy_time(engine), ktime_t now;
p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
p->busy); p->busy);
p->time = ktime_sub(now, p->time);
} else {
p->time = ktime_sub(ktime_get(), p->time);
} }
err = switch_to_kernel_sync(ce, err); err = switch_to_kernel_sync(ce, err);
...@@ -2704,14 +2718,15 @@ static int p_many(void *arg) ...@@ -2704,14 +2718,15 @@ static int p_many(void *arg)
return err; return err;
} }
busy = false;
if (intel_engine_supports_stats(engine)) { if (intel_engine_supports_stats(engine)) {
p->busy = intel_engine_get_busy_time(engine); p->busy = intel_engine_get_busy_time(engine, &p->time);
busy = true; busy = true;
} else {
p->time = ktime_get();
busy = false;
} }
count = 0; count = 0;
p->time = ktime_get();
do { do {
struct i915_request *rq; struct i915_request *rq;
...@@ -2724,11 +2739,15 @@ static int p_many(void *arg) ...@@ -2724,11 +2739,15 @@ static int p_many(void *arg)
i915_request_add(rq); i915_request_add(rq);
count++; count++;
} while (!__igt_timeout(end_time, NULL)); } while (!__igt_timeout(end_time, NULL));
p->time = ktime_sub(ktime_get(), p->time);
if (busy) { if (busy) {
p->busy = ktime_sub(intel_engine_get_busy_time(engine), ktime_t now;
p->busy = ktime_sub(intel_engine_get_busy_time(engine, &now),
p->busy); p->busy);
p->time = ktime_sub(now, p->time);
} else {
p->time = ktime_sub(ktime_get(), p->time);
} }
err = switch_to_kernel_sync(ce, err); err = switch_to_kernel_sync(ce, err);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment