Skip to content

Commit e9071d1

Browse files
committed
Add gpu work period support for i915
Signed-off-by: Aakash Sarkar <aakash.deep.sarkar@intel.com>
1 parent 568130a commit e9071d1

9 files changed

Lines changed: 381 additions & 0 deletions

drivers/gpu/drm/i915/Makefile

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -362,6 +362,8 @@ i915-y += \
362362

363363
i915-y += i915_perf.o
364364

365+
i915-y += i915_gpu_work.o
366+
365367
# Protected execution platform (PXP) support. Base support is required for HuC
366368
i915-y += \
367369
pxp/intel_pxp.o \

drivers/gpu/drm/i915/gt/intel_context_types.h

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -152,6 +152,7 @@ struct intel_context {
152152
struct ewma_runtime avg;
153153
u64 total;
154154
u32 last;
155+
u32 dt;
155156
I915_SELFTEST_DECLARE(u32 num_underflow);
156157
I915_SELFTEST_DECLARE(u32 max_underflow);
157158
} runtime;
@@ -173,6 +174,8 @@ struct intel_context {
173174
/** sseu: Control eu/slice partitioning */
174175
struct intel_sseu sseu;
175176

177+
u64 start_time_ns;
178+
176179
/**
177180
* pinned_contexts_link: List link for the engine's pinned contexts.
178181
* This is only used if this is a perma-pinned kernel context and

drivers/gpu/drm/i915/gt/intel_engine_cs.c

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1601,6 +1601,8 @@ int intel_engines_init(struct intel_gt *gt)
16011601
return err;
16021602

16031603
intel_engine_add_user(engine);
1604+
1605+
i915_gpu_work_stats_init(engine);
16041606
}
16051607

16061608
return 0;

drivers/gpu/drm/i915/gt/intel_engine_types.h

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@
2626
#include "intel_uncore.h"
2727
#include "intel_wakeref.h"
2828
#include "intel_workarounds_types.h"
29+
#include "i915_gpu_work.h"
2930

3031
/* HW Engine class + instance */
3132
#define RENDER_CLASS 0
@@ -169,6 +170,11 @@ struct intel_engine_execlists {
169170
*/
170171
struct timer_list preempt;
171172

173+
/**
174+
* @work_period_timer: emit the gpu work period stats event
175+
*/
176+
struct timer_list work_period_timer;
177+
172178
/**
173179
* @preempt_target: active request at the time of the preemption request
174180
*
@@ -487,6 +493,7 @@ struct intel_engine_cs {
487493
struct i915_pmu_sample sample[I915_ENGINE_SAMPLE_COUNT];
488494
} pmu;
489495

496+
struct i915_engine_work gpu_work;
490497
struct intel_hw_status_page status_page;
491498
struct i915_ctx_workarounds wa_ctx;
492499
struct i915_wa_list ctx_wa_list;

drivers/gpu/drm/i915/gt/intel_execlists_submission.c

Lines changed: 32 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1252,6 +1252,11 @@ static unsigned long active_preempt_timeout(struct intel_engine_cs *engine,
12521252
return READ_ONCE(engine->props.preempt_timeout_ms);
12531253
}
12541254

1255+
/*
 * Length of one gpu work period accounting window: the interval at which
 * work_period_timer re-arms and the accumulated stats are emitted.
 * Currently a fixed constant; @engine is accepted (mirroring
 * active_preempt_timeout()) but not consulted yet.
 */
static unsigned long work_period_timeslice(struct intel_engine_cs *engine)
{
	return GPU_WORK_PERIOD_EVENT_TIMEOUT;
}
1259+
12551260
static void set_preempt_timeout(struct intel_engine_cs *engine,
12561261
const struct i915_request *rq)
12571262
{
@@ -2040,6 +2045,8 @@ process_csb(struct intel_engine_cs *engine, struct i915_request **inactive)
20402045
if (active_ce)
20412046
lrc_runtime_start(active_ce);
20422047
}
2048+
if (active_ce)
2049+
active_ce->start_time_ns = ktime_get_raw_ns();
20432050
new_timeslice(execlists);
20442051
}
20452052

@@ -2423,6 +2430,13 @@ static bool preempt_timeout(const struct intel_engine_cs *const engine)
24232430
return engine->execlists.pending[0];
24242431
}
24252432

2433+
static bool work_period_expired(const struct intel_engine_cs *const engine)
2434+
{
2435+
const struct timer_list *t = &engine->execlists.work_period_timer;
2436+
2437+
return timer_expired(t);
2438+
}
2439+
24262440
/*
24272441
* Check the unread Context Status Buffers and manage the submission of new
24282442
* contexts to the ELSP accordingly.
@@ -2439,6 +2453,17 @@ static void execlists_submission_tasklet(struct tasklet_struct *t)
24392453
inactive = process_csb(engine, post);
24402454
GEM_BUG_ON(inactive - post > ARRAY_SIZE(post));
24412455

2456+
struct intel_context *ce = (*inactive)->context;
2457+
struct i915_engine_work *ew = &engine->gpu_work;
2458+
i915_gpu_work_process_ctx(ce, ew);
2459+
2460+
if (unlikely(work_period_expired(engine))) {
2461+
cancel_timer(&engine->execlists.work_period_timer);
2462+
schedule_work(&ew->event_work);
2463+
set_timer_ms(&engine->execlists.work_period_timer,
2464+
work_period_timeslice(engine));
2465+
}
2466+
24422467
if (unlikely(preempt_timeout(engine))) {
24432468
const struct i915_request *rq = *engine->execlists.active;
24442469

@@ -2547,6 +2572,11 @@ static void execlists_preempt(struct timer_list *timer)
25472572
execlists_kick(timer, preempt);
25482573
}
25492574

2575+
/*
 * Callback for execlists.work_period_timer. Follows the same pattern as
 * execlists_preempt()/execlists_timeslice() above: kick the engine via
 * execlists_kick() so the tasklet notices the expired timer.
 */
static void execlists_work_period(struct timer_list *timer)
{
	execlists_kick(timer, work_period_timer);
}
2579+
25502580
static void queue_request(struct intel_engine_cs *engine,
25512581
struct i915_request *rq)
25522582
{
@@ -3543,6 +3573,8 @@ int intel_execlists_submission_setup(struct intel_engine_cs *engine)
35433573
tasklet_setup(&engine->sched_engine->tasklet, execlists_submission_tasklet);
35443574
timer_setup(&engine->execlists.timer, execlists_timeslice, 0);
35453575
timer_setup(&engine->execlists.preempt, execlists_preempt, 0);
3576+
timer_setup(&engine->execlists.work_period_timer, execlists_work_period, 0);
3577+
35463578

35473579
logical_ring_default_vfuncs(engine);
35483580
logical_ring_default_irqs(engine);

drivers/gpu/drm/i915/gt/intel_lrc.c

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1946,6 +1946,7 @@ void lrc_update_runtime(struct intel_context *ce)
19461946

19471947
ewma_runtime_add(&stats->runtime.avg, dt);
19481948
stats->runtime.total += dt;
1949+
stats->runtime.dt = dt;
19491950
}
19501951

19511952
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
Lines changed: 234 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,234 @@
1+
#include "i915_gpu_work.h"
2+
#include <linux/pid.h>
3+
#include <linux/errno.h>
4+
5+
#include "gt/intel_context.h"
6+
#include "gt/intel_engine.h"
7+
#include "gem/i915_gem_context.h"
8+
9+
#define CREATE_TRACE_POINTS
10+
#include "intel_power_gpu_work_period_trace.h"
11+
12+
/*
 * Fetch the uid stored in slot @key. A uid of zero marks an empty slot.
 *
 * READ_ONCE() because not every caller holds stats_lock:
 * i915_gpu_work_process_ctx() peeks at the hashed slot before taking
 * the lock.
 */
static inline u32 get_stats_uid(s32 key, struct i915_work_stats *stats)
{
	return READ_ONCE(stats[key].uid);
}
18+
19+
static s32 get_uid_ctx(struct intel_context *ce)
20+
{
21+
struct i915_gem_context *ctx = NULL;
22+
struct task_struct *task = NULL;
23+
const struct cred *cred = NULL;
24+
s32 ret;
25+
26+
rcu_read_lock();
27+
ctx = rcu_dereference(ce->gem_context);
28+
/* ctx could be freed from right under our nose,
29+
* so check first if we are able to get a reference
30+
*/
31+
if (ctx && !kref_get_unless_zero(&ctx->ref))
32+
ctx = NULL;
33+
rcu_read_unlock();
34+
35+
if (!ctx) {
36+
ret = -EINVAL;
37+
goto out;
38+
}
39+
40+
// TODO: Error handling
41+
task = get_pid_task(ctx->pid, PIDTYPE_PID);
42+
cred = get_task_cred(task);
43+
const unsigned int uid = cred->euid.val;
44+
ret = (s32)uid;
45+
46+
put_cred(cred);
47+
put_task_struct(task);
48+
i915_gem_context_put(ctx);
49+
out:
50+
return ret;
51+
}
52+
53+
// TODO: Can this be called inside softirq?
54+
static void emit_work_period_event(struct i915_engine_work *ew)
55+
{
56+
struct i915_work_stats * const stats = &ew->stats[0];
57+
for (int itr = 0; itr < I915_ENGINE_WORK_STATS_COUNT; itr++) {
58+
struct i915_work_stats *stat = &stats[itr];
59+
if (!stat->uid)
60+
continue;
61+
62+
trace_gpu_work_period(0, stat->uid,
63+
stat->start_time_ns, stat->end_time_ns,
64+
stat->total_active_duration_ns);
65+
66+
// TODO: check concurrent accesses to num_entries
67+
if (!ew->num_entries--)
68+
break;
69+
}
70+
GEM_BUG_ON(ew->num_entries != 0);
71+
memset(stats, 0, sizeof(*stats) *
72+
I915_ENGINE_WORK_STATS_COUNT);
73+
smp_wmb();
74+
}
75+
76+
static void i915_work_period_event_worker(struct work_struct *work)
77+
{
78+
struct i915_engine_work *ew =
79+
container_of(work, typeof(*ew), event_work);
80+
spin_lock_bh(&ew->stats_lock);
81+
// TODO: Is it too expensive to be called inside softirq?
82+
emit_work_period_event(ew);
83+
spin_unlock_bh(&ew->stats_lock);
84+
}
85+
86+
static inline u32 get_cur_dt(struct intel_context* ce)
87+
{
88+
struct intel_context_stats *stats = &ce->stats;
89+
s32 dt = READ_ONCE(stats->runtime.dt);
90+
if (unlikely(dt < 0)) {
91+
return 0;
92+
}
93+
return dt;
94+
}
95+
96+
static u64 get_active_duration_ns(struct intel_context* ce)
97+
{
98+
u64 dur = get_cur_dt(ce);
99+
if (ce->ops->flags & COPS_RUNTIME_CYCLES)
100+
dur *= ce->engine->gt->clock_period_ns;
101+
return dur;
102+
}
103+
104+
/*
105+
* Hash collision is handled here the same way we handle the situation
106+
* when our favourite urinal is occupied in a crowded office restroom.
107+
* Sorry!
108+
*/
109+
static s32 handle_collision(s32 key, struct i915_engine_work *ew)
110+
{
111+
struct i915_work_stats * const stats = &ew->stats[0];
112+
u32 uid, count = 0;
113+
114+
spin_lock(&ew->stats_lock);
115+
while (uid = get_stats_uid(key, stats)) {
116+
if (unlikely(count >=
117+
I915_ENGINE_WORK_STATS_COUNT)) {
118+
spin_unlock(&ew->stats_lock);
119+
return -ENOMEM;
120+
}
121+
122+
if (key == I915_ENGINE_WORK_STATS_COUNT)
123+
key = 0;
124+
key++;
125+
count++;
126+
}
127+
spin_unlock(&ew->stats_lock);
128+
return key;
129+
}
130+
131+
void i915_gpu_work_process_ctx(struct intel_context *ce,
132+
struct i915_engine_work *ew)
133+
{
134+
struct i915_work_stats * const stats = &ew->stats[0];
135+
struct i915_work_stats *stat = NULL;
136+
s32 key = 0, uid = 0;
137+
138+
uid = get_uid_ctx(ce);
139+
// TODO: Handle this correctly
140+
if (uid < 0)
141+
return;
142+
143+
key = HASH_MAP(uid);
144+
145+
/* Hash collision. Find the next available key */
146+
if (get_stats_uid(key, stats) != uid)
147+
key = handle_collision(key, ew);
148+
149+
if (unlikely(KEY_INVALID(key))) {
150+
/*
151+
* This can only happen if all the slots in our stats
152+
* array are occupied. Emit the events now and empty
153+
* all the slots.
154+
*/
155+
spin_lock(&ew->stats_lock);
156+
emit_work_period_event(ew);
157+
spin_unlock(&ew->stats_lock);
158+
key = 0;
159+
}
160+
stat = &stats[key];
161+
162+
spin_lock(&ew->stats_lock);
163+
/*
164+
* If the uid at our hash index is empty (zero)
165+
* this implies that our ctx is processed first
166+
* time since we emitted the events last time
167+
* and subsequently evicted all the slots.
168+
*
169+
* So, we set the start time to the last time this
170+
* ctx was put into the active queue. We also set
171+
* the end time and the total active duration to
172+
* the current runtime of this ctx
173+
*/
174+
if (!stat->uid) {
175+
stat->uid = uid;
176+
stat->start_time_ns = READ_ONCE(ce->start_time_ns);
177+
stat->total_active_duration_ns =
178+
get_active_duration_ns(ce);
179+
stat->end_time_ns = get_active_duration_ns(ce);
180+
/* TODO: num_entries could be accessed concurrently
181+
* b/w two cpus (use atomic type?)
182+
*/
183+
ew->num_entries++;
184+
goto out;
185+
}
186+
187+
/*
188+
* Now we have the hash index but the slot
189+
* could be occupied by another uid that maps
190+
* to the same slot index.
191+
* So, we do a linear search from our index until
192+
* we find a slot with matching uid or we run
193+
* through all the slots.
194+
*/
195+
u32 count = 0;
196+
while (stat->uid != uid) {
197+
/* Is this if condition really reuqired? */
198+
if (unlikely(count >=
199+
I915_ENGINE_WORK_STATS_COUNT))
200+
goto out;
201+
202+
if (key == I915_ENGINE_WORK_STATS_COUNT)
203+
key = 0;
204+
205+
stat = &stats[++key];
206+
++count;
207+
}
208+
209+
/*
210+
* We set the endtime to the current time this ctx
211+
* is being processed and accumulate the current
212+
* runtime to the total active duration
213+
*/
214+
stat->end_time_ns = ktime_get_raw_ns();
215+
stat->total_active_duration_ns +=
216+
get_active_duration_ns(ce);
217+
218+
out:
219+
spin_unlock(&ew->stats_lock);
220+
}
221+
222+
void i915_gpu_work_stats_init(struct intel_engine_cs *engine)
223+
{
224+
struct i915_engine_work *ew = &engine->gpu_work;
225+
struct i915_work_stats * const stats = &ew->stats[0];
226+
227+
ew->enabled = false;
228+
ew->num_entries = 0;
229+
memset(stats, 0, sizeof(*stats) *
230+
I915_ENGINE_WORK_STATS_COUNT);
231+
232+
spin_lock_init(&ew->stats_lock);
233+
INIT_WORK(&ew->event_work, i915_work_period_event_worker);
234+
}

0 commit comments

Comments
 (0)