Skip to content

Commit

Permalink
drm/i915/pmu: Stop averaging with the previous sample
Browse files Browse the repository at this point in the history
Averaging with the previous sample brings a small statistical improvement
to sampling counters, but can leek a little bit of state from a current
client to the next which mulls the border between past and present for
observing clients.

This is because on event enable clients record the current counter value
and use it as reference, but with rapid off-on event cycles, and due the
delayed nature of sampling timer self-disarm, previous sample value does
not get cleared under these circumstances.

Solution is to stop averaging with the previous sample. This has a small
downside of losing some precision with short and spiky signals, but the
alternatives look too complicated for the benefit.

Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Cc: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Sagar Arun Kamble <sagar.a.kamble@intel.com>
Reviewed-by: Chris Wilson <chris@chris-wilson.co.uk>
Tested-by: Chris Wilson <chris@chris-wilson.co.uk>
Link: https://patchwork.freedesktop.org/patch/msgid/20171124094959.10725-1-tvrtko.ursulin@linux.intel.com
  • Loading branch information
Tvrtko Ursulin committed Nov 24, 2017
1 parent 1b2b659 commit 8ee4f19
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 28 deletions.
29 changes: 2 additions & 27 deletions drivers/gpu/drm/i915/i915_pmu.c
Original file line number Diff line number Diff line change
Expand Up @@ -181,12 +181,7 @@ static bool grab_forcewake(struct drm_i915_private *i915, bool fw)
static void
update_sample(struct i915_pmu_sample *sample, u32 unit, u32 val)
{
/*
* Since we are doing stochastic sampling for these counters,
* average the delta with the previous value for better accuracy.
*/
sample->cur += div_u64(mul_u32_u32(sample->prev + val, unit), 2);
sample->prev = val;
sample->cur += mul_u32_u32(val, unit);
}

static void engines_sample(struct drm_i915_private *dev_priv)
Expand Down Expand Up @@ -262,31 +257,13 @@ static void frequency_sample(struct drm_i915_private *dev_priv)
}
}

static void pmu_init_previous_samples(struct drm_i915_private *i915)
{
struct intel_engine_cs *engine;
enum intel_engine_id id;
unsigned int i;

for_each_engine(engine, i915, id) {
for (i = 0; i < ARRAY_SIZE(engine->pmu.sample); i++)
engine->pmu.sample[i].prev = 0;
}

for (i = 0; i < ARRAY_SIZE(i915->pmu.sample); i++)
i915->pmu.sample[i].prev = i915->gt_pm.rps.idle_freq;
}

static enum hrtimer_restart i915_sample(struct hrtimer *hrtimer)
{
struct drm_i915_private *i915 =
container_of(hrtimer, struct drm_i915_private, pmu.timer);

if (!READ_ONCE(i915->pmu.timer_enabled)) {
pmu_init_previous_samples(i915);

if (!READ_ONCE(i915->pmu.timer_enabled))
return HRTIMER_NORESTART;
}

engines_sample(i915);
frequency_sample(i915);
Expand Down Expand Up @@ -857,8 +834,6 @@ void i915_pmu_register(struct drm_i915_private *i915)
hrtimer_init(&i915->pmu.timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
i915->pmu.timer.function = i915_sample;

pmu_init_previous_samples(i915);

for_each_engine(engine, i915, id)
INIT_DELAYED_WORK(&engine->pmu.disable_busy_stats,
__disable_busy_stats);
Expand Down
1 change: 0 additions & 1 deletion drivers/gpu/drm/i915/i915_pmu.h
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,6 @@ enum {

struct i915_pmu_sample {
u64 cur;
u32 prev;
};

struct i915_pmu {
Expand Down

0 comments on commit 8ee4f19

Please sign in to comment.