Commit 4ef10fe0 authored by Lionel Landwerlin

drm/i915/perf: add new open param to configure polling of OA buffer

This new parameter lets the application choose how often the OA
buffer should be checked on the CPU side for data availability. Longer
polling periods tend to reduce CPU overhead if the application does not
care about somewhat real-time data collection.

v2: Allow disabling polling completely with 0 value (Lionel)
v3: Version the new parameter (Joonas)
v4: Rebase (Umesh)
v5: Make poll delay value of 0 invalid (Umesh)
v6:
- Describe poll_oa_period (Ashutosh)
- Fix comment for new poll parameter (Lionel)
- Drop open_flags in read_properties_unlocked (Lionel)
- Rename uapi parameter (Ashutosh)
v7: Reword the comment in uapi (Ashutosh)
Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Signed-off-by: Umesh Nerlige Ramappa <umesh.nerlige.ramappa@intel.com>
Reviewed-by: Ashutosh Dixit <ashutosh.dixit@intel.com>
Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20200324185457.14635-4-umesh.nerlige.ramappa@intel.com
parent c51dbc6e
...@@ -248,11 +248,11 @@ ...@@ -248,11 +248,11 @@
#define OA_TAIL_MARGIN_NSEC 100000ULL #define OA_TAIL_MARGIN_NSEC 100000ULL
#define INVALID_TAIL_PTR 0xffffffff #define INVALID_TAIL_PTR 0xffffffff
/* frequency for checking whether the OA unit has written new reports to the /* The default frequency for checking whether the OA unit has written new
* circular OA buffer... * reports to the circular OA buffer...
*/ */
#define POLL_FREQUENCY 200 #define DEFAULT_POLL_FREQUENCY_HZ 200
#define POLL_PERIOD (NSEC_PER_SEC / POLL_FREQUENCY) #define DEFAULT_POLL_PERIOD_NS (NSEC_PER_SEC / DEFAULT_POLL_FREQUENCY_HZ)
/* for sysctl proc_dointvec_minmax of dev.i915.perf_stream_paranoid */ /* for sysctl proc_dointvec_minmax of dev.i915.perf_stream_paranoid */
static u32 i915_perf_stream_paranoid = true; static u32 i915_perf_stream_paranoid = true;
...@@ -339,6 +339,8 @@ static const struct i915_oa_format gen12_oa_formats[I915_OA_FORMAT_MAX] = { ...@@ -339,6 +339,8 @@ static const struct i915_oa_format gen12_oa_formats[I915_OA_FORMAT_MAX] = {
* @sseu: internal SSEU configuration computed either from the userspace * @sseu: internal SSEU configuration computed either from the userspace
* specified configuration in the opening parameters or a default value * specified configuration in the opening parameters or a default value
* (see get_default_sseu_config()) * (see get_default_sseu_config())
* @poll_oa_period: The period in nanoseconds at which the CPU will check for OA
* data availability
* *
* As read_properties_unlocked() enumerates and validates the properties given * As read_properties_unlocked() enumerates and validates the properties given
* to open a stream of metrics the configuration is built up in the structure * to open a stream of metrics the configuration is built up in the structure
...@@ -361,6 +363,8 @@ struct perf_open_properties { ...@@ -361,6 +363,8 @@ struct perf_open_properties {
bool has_sseu; bool has_sseu;
struct intel_sseu sseu; struct intel_sseu sseu;
u64 poll_oa_period;
}; };
struct i915_oa_config_bo { struct i915_oa_config_bo {
...@@ -2600,7 +2604,7 @@ static void i915_oa_stream_enable(struct i915_perf_stream *stream) ...@@ -2600,7 +2604,7 @@ static void i915_oa_stream_enable(struct i915_perf_stream *stream)
if (stream->periodic) if (stream->periodic)
hrtimer_start(&stream->poll_check_timer, hrtimer_start(&stream->poll_check_timer,
ns_to_ktime(POLL_PERIOD), ns_to_ktime(stream->poll_oa_period),
HRTIMER_MODE_REL_PINNED); HRTIMER_MODE_REL_PINNED);
} }
...@@ -3035,7 +3039,8 @@ static enum hrtimer_restart oa_poll_check_timer_cb(struct hrtimer *hrtimer) ...@@ -3035,7 +3039,8 @@ static enum hrtimer_restart oa_poll_check_timer_cb(struct hrtimer *hrtimer)
wake_up(&stream->poll_wq); wake_up(&stream->poll_wq);
} }
hrtimer_forward_now(hrtimer, ns_to_ktime(POLL_PERIOD)); hrtimer_forward_now(hrtimer,
ns_to_ktime(stream->poll_oa_period));
return HRTIMER_RESTART; return HRTIMER_RESTART;
} }
...@@ -3424,6 +3429,7 @@ i915_perf_open_ioctl_locked(struct i915_perf *perf, ...@@ -3424,6 +3429,7 @@ i915_perf_open_ioctl_locked(struct i915_perf *perf,
stream->perf = perf; stream->perf = perf;
stream->ctx = specific_ctx; stream->ctx = specific_ctx;
stream->poll_oa_period = props->poll_oa_period;
ret = i915_oa_stream_init(stream, param, props); ret = i915_oa_stream_init(stream, param, props);
if (ret) if (ret)
...@@ -3502,6 +3508,7 @@ static int read_properties_unlocked(struct i915_perf *perf, ...@@ -3502,6 +3508,7 @@ static int read_properties_unlocked(struct i915_perf *perf,
int ret; int ret;
memset(props, 0, sizeof(struct perf_open_properties)); memset(props, 0, sizeof(struct perf_open_properties));
props->poll_oa_period = DEFAULT_POLL_PERIOD_NS;
if (!n_props) { if (!n_props) {
DRM_DEBUG("No i915 perf properties given\n"); DRM_DEBUG("No i915 perf properties given\n");
...@@ -3634,6 +3641,14 @@ static int read_properties_unlocked(struct i915_perf *perf, ...@@ -3634,6 +3641,14 @@ static int read_properties_unlocked(struct i915_perf *perf,
props->has_sseu = true; props->has_sseu = true;
break; break;
} }
case DRM_I915_PERF_PROP_POLL_OA_PERIOD:
if (value < 100000 /* 100us */) {
DRM_DEBUG("OA availability timer too small (%lluns < 100us)\n",
value);
return -EINVAL;
}
props->poll_oa_period = value;
break;
case DRM_I915_PERF_PROP_MAX: case DRM_I915_PERF_PROP_MAX:
MISSING_CASE(id); MISSING_CASE(id);
return -EINVAL; return -EINVAL;
...@@ -4416,8 +4431,11 @@ int i915_perf_ioctl_version(void) ...@@ -4416,8 +4431,11 @@ int i915_perf_ioctl_version(void)
* 4: Add DRM_I915_PERF_PROP_ALLOWED_SSEU to limit what contexts can * 4: Add DRM_I915_PERF_PROP_ALLOWED_SSEU to limit what contexts can
* be run for the duration of the performance recording based on * be run for the duration of the performance recording based on
* their SSEU configuration. * their SSEU configuration.
*
* 5: Add DRM_I915_PERF_PROP_POLL_OA_PERIOD parameter that controls the
* interval for the hrtimer used to check for OA data.
*/ */
return 4; return 5;
} }
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST) #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
......
...@@ -304,6 +304,12 @@ struct i915_perf_stream { ...@@ -304,6 +304,12 @@ struct i915_perf_stream {
* reprogrammed. * reprogrammed.
*/ */
struct i915_vma *noa_wait; struct i915_vma *noa_wait;
/**
* @poll_oa_period: The period in nanoseconds at which the OA
* buffer should be checked for available data.
*/
u64 poll_oa_period;
}; };
/** /**
......
...@@ -1980,6 +1980,19 @@ enum drm_i915_perf_property_id { ...@@ -1980,6 +1980,19 @@ enum drm_i915_perf_property_id {
*/ */
DRM_I915_PERF_PROP_GLOBAL_SSEU, DRM_I915_PERF_PROP_GLOBAL_SSEU,
/**
* This optional parameter specifies the timer interval in nanoseconds
* at which the i915 driver will check the OA buffer for available data.
* Minimum allowed value is 100 microseconds. A default value is used by
* the driver if this parameter is not specified. Note that larger timer
* values will reduce cpu consumption during OA perf captures. However,
* excessively large values would potentially result in OA buffer
* overwrites as captures reach end of the OA buffer.
*
* This property is available in perf revision 5.
*/
DRM_I915_PERF_PROP_POLL_OA_PERIOD,
DRM_I915_PERF_PROP_MAX /* non-ABI */ DRM_I915_PERF_PROP_MAX /* non-ABI */
}; };
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment