Commit 5f284e9c authored by Umesh Nerlige Ramappa's avatar Umesh Nerlige Ramappa

drm/i915/perf: Group engines into respective OA groups

Now that we may have multiple OA units in a single GT as well as on
separate GTs, create an engine group that maps to a single OA unit.

v2: (Jani)
- Drop warning on ENOMEM
- Reorder patch in the series

v3: (Ashutosh)
- Remove unused members from perf structs
- Update comments
- Update engine_supports_oa check
- Just return 1 in num_perf_groups_per_gt for now
- Set engine->oa_group to NULL to begin with

v4: Use engine_supports_oa() check in oa_init_reg_state (Ashutosh)
v5: Rebase after dropping engine_supports_oa helper
Signed-off-by: default avatarUmesh Nerlige Ramappa <umesh.nerlige.ramappa@intel.com>
Reviewed-by: default avatarAshutosh Dixit <ashutosh.dixit@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20230323225901.3743681-5-umesh.nerlige.ramappa@intel.com
parent 9919d119
...@@ -53,6 +53,8 @@ struct intel_gt; ...@@ -53,6 +53,8 @@ struct intel_gt;
struct intel_ring; struct intel_ring;
struct intel_uncore; struct intel_uncore;
struct intel_breadcrumbs; struct intel_breadcrumbs;
struct intel_engine_cs;
struct i915_perf_group;
typedef u32 intel_engine_mask_t; typedef u32 intel_engine_mask_t;
#define ALL_ENGINES ((intel_engine_mask_t)~0ul) #define ALL_ENGINES ((intel_engine_mask_t)~0ul)
...@@ -617,6 +619,14 @@ struct intel_engine_cs { ...@@ -617,6 +619,14 @@ struct intel_engine_cs {
} props, defaults; } props, defaults;
I915_SELFTEST_DECLARE(struct fault_attr reset_timeout); I915_SELFTEST_DECLARE(struct fault_attr reset_timeout);
/*
* The perf group maps to one OA unit which controls one OA buffer. All
* reports corresponding to this engine will be reported to this OA
* buffer. An engine will map to a single OA unit, but a single OA unit
* can generate reports for multiple engines.
*/
struct i915_perf_group *oa_group;
}; };
static inline bool static inline bool
......
...@@ -6,6 +6,7 @@ ...@@ -6,6 +6,7 @@
#include <linux/string_helpers.h> #include <linux/string_helpers.h>
#include "i915_drv.h" #include "i915_drv.h"
#include "i915_perf_types.h"
#include "intel_engine_regs.h" #include "intel_engine_regs.h"
#include "intel_gt_regs.h" #include "intel_gt_regs.h"
#include "intel_sseu.h" #include "intel_sseu.h"
...@@ -677,7 +678,7 @@ u32 intel_sseu_make_rpcs(struct intel_gt *gt, ...@@ -677,7 +678,7 @@ u32 intel_sseu_make_rpcs(struct intel_gt *gt,
* If i915/perf is active, we want a stable powergating configuration * If i915/perf is active, we want a stable powergating configuration
* on the system. Use the configuration pinned by i915/perf. * on the system. Use the configuration pinned by i915/perf.
*/ */
if (gt->perf.exclusive_stream) if (gt->perf.group && gt->perf.group[PERF_GROUP_OAG].exclusive_stream)
req_sseu = &gt->perf.sseu; req_sseu = &gt->perf.sseu;
slices = hweight8(req_sseu->slice_mask); slices = hweight8(req_sseu->slice_mask);
......
...@@ -1570,12 +1570,18 @@ free_noa_wait(struct i915_perf_stream *stream) ...@@ -1570,12 +1570,18 @@ free_noa_wait(struct i915_perf_stream *stream)
i915_vma_unpin_and_release(&stream->noa_wait, 0); i915_vma_unpin_and_release(&stream->noa_wait, 0);
} }
static bool engine_supports_oa(const struct intel_engine_cs *engine)
{
return engine->oa_group;
}
static void i915_oa_stream_destroy(struct i915_perf_stream *stream) static void i915_oa_stream_destroy(struct i915_perf_stream *stream)
{ {
struct i915_perf *perf = stream->perf; struct i915_perf *perf = stream->perf;
struct intel_gt *gt = stream->engine->gt; struct intel_gt *gt = stream->engine->gt;
struct i915_perf_group *g = stream->engine->oa_group;
if (WARN_ON(stream != gt->perf.exclusive_stream)) if (WARN_ON(stream != g->exclusive_stream))
return; return;
/* /*
...@@ -1584,7 +1590,7 @@ static void i915_oa_stream_destroy(struct i915_perf_stream *stream) ...@@ -1584,7 +1590,7 @@ static void i915_oa_stream_destroy(struct i915_perf_stream *stream)
* *
* See i915_oa_init_reg_state() and lrc_configure_all_contexts() * See i915_oa_init_reg_state() and lrc_configure_all_contexts()
*/ */
WRITE_ONCE(gt->perf.exclusive_stream, NULL); WRITE_ONCE(g->exclusive_stream, NULL);
perf->ops.disable_metric_set(stream); perf->ops.disable_metric_set(stream);
free_oa_buffer(stream); free_oa_buffer(stream);
...@@ -3182,6 +3188,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream, ...@@ -3182,6 +3188,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream,
{ {
struct drm_i915_private *i915 = stream->perf->i915; struct drm_i915_private *i915 = stream->perf->i915;
struct i915_perf *perf = stream->perf; struct i915_perf *perf = stream->perf;
struct i915_perf_group *g;
struct intel_gt *gt; struct intel_gt *gt;
int ret; int ret;
...@@ -3191,6 +3198,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream, ...@@ -3191,6 +3198,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream,
return -EINVAL; return -EINVAL;
} }
gt = props->engine->gt; gt = props->engine->gt;
g = props->engine->oa_group;
/* /*
* If the sysfs metrics/ directory wasn't registered for some * If the sysfs metrics/ directory wasn't registered for some
...@@ -3221,7 +3229,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream, ...@@ -3221,7 +3229,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream,
* counter reports and marshal to the appropriate client * counter reports and marshal to the appropriate client
* we currently only allow exclusive access * we currently only allow exclusive access
*/ */
if (gt->perf.exclusive_stream) { if (g->exclusive_stream) {
drm_dbg(&stream->perf->i915->drm, drm_dbg(&stream->perf->i915->drm,
"OA unit already in use\n"); "OA unit already in use\n");
return -EBUSY; return -EBUSY;
...@@ -3316,7 +3324,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream, ...@@ -3316,7 +3324,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream,
stream->ops = &i915_oa_stream_ops; stream->ops = &i915_oa_stream_ops;
stream->engine->gt->perf.sseu = props->sseu; stream->engine->gt->perf.sseu = props->sseu;
WRITE_ONCE(gt->perf.exclusive_stream, stream); WRITE_ONCE(g->exclusive_stream, stream);
ret = i915_perf_stream_enable_sync(stream); ret = i915_perf_stream_enable_sync(stream);
if (ret) { if (ret) {
...@@ -3339,7 +3347,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream, ...@@ -3339,7 +3347,7 @@ static int i915_oa_stream_init(struct i915_perf_stream *stream,
return 0; return 0;
err_enable: err_enable:
WRITE_ONCE(gt->perf.exclusive_stream, NULL); WRITE_ONCE(g->exclusive_stream, NULL);
perf->ops.disable_metric_set(stream); perf->ops.disable_metric_set(stream);
free_oa_buffer(stream); free_oa_buffer(stream);
...@@ -3373,7 +3381,7 @@ void i915_oa_init_reg_state(const struct intel_context *ce, ...@@ -3373,7 +3381,7 @@ void i915_oa_init_reg_state(const struct intel_context *ce,
return; return;
/* perf.exclusive_stream serialised by lrc_configure_all_contexts() */ /* perf.exclusive_stream serialised by lrc_configure_all_contexts() */
stream = READ_ONCE(engine->gt->perf.exclusive_stream); stream = READ_ONCE(engine->oa_group->exclusive_stream);
if (stream && GRAPHICS_VER(stream->perf->i915) < 12) if (stream && GRAPHICS_VER(stream->perf->i915) < 12)
gen8_update_reg_state_unlocked(ce, stream); gen8_update_reg_state_unlocked(ce, stream);
} }
...@@ -3965,6 +3973,13 @@ static int read_properties_unlocked(struct i915_perf *perf, ...@@ -3965,6 +3973,13 @@ static int read_properties_unlocked(struct i915_perf *perf,
return -EINVAL; return -EINVAL;
} }
if (!engine_supports_oa(props->engine)) {
drm_dbg(&perf->i915->drm,
"Engine not supported by OA %d:%d\n",
I915_ENGINE_CLASS_RENDER, 0);
return -EINVAL;
}
/* Considering that ID = 0 is reserved and assuming that we don't /* Considering that ID = 0 is reserved and assuming that we don't
* (currently) expect any configurations to ever specify duplicate * (currently) expect any configurations to ever specify duplicate
* values for a particular property ID then the last _PROP_MAX value is * values for a particular property ID then the last _PROP_MAX value is
...@@ -4743,6 +4758,60 @@ static struct ctl_table oa_table[] = { ...@@ -4743,6 +4758,60 @@ static struct ctl_table oa_table[] = {
{} {}
}; };
static u32 num_perf_groups_per_gt(struct intel_gt *gt)
{
return 1;
}
static u32 __oa_engine_group(struct intel_engine_cs *engine)
{
if (engine->class == RENDER_CLASS)
return PERF_GROUP_OAG;
else
return PERF_GROUP_INVALID;
}
static int oa_init_gt(struct intel_gt *gt)
{
u32 num_groups = num_perf_groups_per_gt(gt);
struct intel_engine_cs *engine;
struct i915_perf_group *g;
intel_engine_mask_t tmp;
g = kcalloc(num_groups, sizeof(*g), GFP_KERNEL);
if (!g)
return -ENOMEM;
for_each_engine_masked(engine, gt, ALL_ENGINES, tmp) {
u32 index = __oa_engine_group(engine);
engine->oa_group = NULL;
if (index < num_groups) {
g[index].num_engines++;
engine->oa_group = &g[index];
}
}
gt->perf.num_perf_groups = num_groups;
gt->perf.group = g;
return 0;
}
static int oa_init_engine_groups(struct i915_perf *perf)
{
struct intel_gt *gt;
int i, ret;
for_each_gt(gt, perf->i915, i) {
ret = oa_init_gt(gt);
if (ret)
return ret;
}
return 0;
}
static void oa_init_supported_formats(struct i915_perf *perf) static void oa_init_supported_formats(struct i915_perf *perf)
{ {
struct drm_i915_private *i915 = perf->i915; struct drm_i915_private *i915 = perf->i915;
...@@ -4909,7 +4978,7 @@ void i915_perf_init(struct drm_i915_private *i915) ...@@ -4909,7 +4978,7 @@ void i915_perf_init(struct drm_i915_private *i915)
if (perf->ops.enable_metric_set) { if (perf->ops.enable_metric_set) {
struct intel_gt *gt; struct intel_gt *gt;
int i; int i, ret;
for_each_gt(gt, i915, i) for_each_gt(gt, i915, i)
mutex_init(&gt->perf.lock); mutex_init(&gt->perf.lock);
...@@ -4948,6 +5017,11 @@ void i915_perf_init(struct drm_i915_private *i915) ...@@ -4948,6 +5017,11 @@ void i915_perf_init(struct drm_i915_private *i915)
perf->i915 = i915; perf->i915 = i915;
ret = oa_init_engine_groups(perf);
if (ret)
drm_err(&i915->drm,
"OA initialization failed %d\n", ret);
oa_init_supported_formats(perf); oa_init_supported_formats(perf);
} }
} }
...@@ -4976,10 +5050,15 @@ void i915_perf_sysctl_unregister(void) ...@@ -4976,10 +5050,15 @@ void i915_perf_sysctl_unregister(void)
void i915_perf_fini(struct drm_i915_private *i915) void i915_perf_fini(struct drm_i915_private *i915)
{ {
struct i915_perf *perf = &i915->perf; struct i915_perf *perf = &i915->perf;
struct intel_gt *gt;
int i;
if (!perf->i915) if (!perf->i915)
return; return;
for_each_gt(gt, perf->i915, i)
kfree(gt->perf.group);
idr_for_each(&perf->metrics_idr, destroy_config, perf); idr_for_each(&perf->metrics_idr, destroy_config, perf);
idr_destroy(&perf->metrics_idr); idr_destroy(&perf->metrics_idr);
......
...@@ -17,6 +17,7 @@ ...@@ -17,6 +17,7 @@
#include <linux/wait.h> #include <linux/wait.h>
#include <uapi/drm/i915_drm.h> #include <uapi/drm/i915_drm.h>
#include "gt/intel_engine_types.h"
#include "gt/intel_sseu.h" #include "gt/intel_sseu.h"
#include "i915_reg_defs.h" #include "i915_reg_defs.h"
#include "intel_wakeref.h" #include "intel_wakeref.h"
...@@ -30,6 +31,13 @@ struct i915_vma; ...@@ -30,6 +31,13 @@ struct i915_vma;
struct intel_context; struct intel_context;
struct intel_engine_cs; struct intel_engine_cs;
enum {
PERF_GROUP_OAG = 0,
PERF_GROUP_MAX,
PERF_GROUP_INVALID = U32_MAX,
};
struct i915_oa_format { struct i915_oa_format {
u32 format; u32 format;
int size; int size;
...@@ -390,6 +398,20 @@ struct i915_oa_ops { ...@@ -390,6 +398,20 @@ struct i915_oa_ops {
u32 (*oa_hw_tail_read)(struct i915_perf_stream *stream); u32 (*oa_hw_tail_read)(struct i915_perf_stream *stream);
}; };
struct i915_perf_group {
/*
* @exclusive_stream: The stream currently using the OA unit. This is
* sometimes accessed outside a syscall associated to its file
* descriptor.
*/
struct i915_perf_stream *exclusive_stream;
/*
* @num_engines: The number of engines using this OA unit.
*/
u32 num_engines;
};
struct i915_perf_gt { struct i915_perf_gt {
/* /*
* Lock associated with anything below within this structure. * Lock associated with anything below within this structure.
...@@ -402,12 +424,15 @@ struct i915_perf_gt { ...@@ -402,12 +424,15 @@ struct i915_perf_gt {
*/ */
struct intel_sseu sseu; struct intel_sseu sseu;
/**
* @num_perf_groups: number of perf groups per gt.
*/
u32 num_perf_groups;
/* /*
* @exclusive_stream: The stream currently using the OA unit. This is * @group: list of OA groups - one for each OA buffer.
* sometimes accessed outside a syscall associated to its file
* descriptor.
*/ */
struct i915_perf_stream *exclusive_stream; struct i915_perf_group *group;
}; };
struct i915_perf { struct i915_perf {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment