Re: [PATCH v2] drm/i915/guc: Decouple GuC engine id from ring id

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 




On 23/01/16 19:58, yu.dai@xxxxxxxxx wrote:
From: Alex Dai <yu.dai@xxxxxxxxx>

Previously GuC uses ring id as engine id because of same definition.
But this is not true since this commit:

commit de1add360522c876c25ef2bbbbab1c94bdb509ab
Author: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx>
Date:   Fri Jan 15 15:12:50 2016 +0000

     drm/i915: Decouple execbuf uAPI from internal implementation

Added GuC engine id into GuC interface to decouple it from ring id used
by driver.

v2: Keep ring name print out in debugfs; using for_each_ring() where
     possible to keep driver consistent. (Chris W.)

Signed-off-by: Alex Dai <yu.dai@xxxxxxxxx>
---
  drivers/gpu/drm/i915/i915_debugfs.c        | 12 +++++-----
  drivers/gpu/drm/i915/i915_guc_submission.c | 38 ++++++++++++++----------------
  drivers/gpu/drm/i915/intel_guc.h           |  6 ++---
  drivers/gpu/drm/i915/intel_guc_fwif.h      | 17 +++++++++----
  drivers/gpu/drm/i915/intel_lrc.c           |  5 ++++
  drivers/gpu/drm/i915/intel_ringbuffer.h    |  1 +
  6 files changed, 45 insertions(+), 34 deletions(-)

diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
index c5db235..cea1844 100644
--- a/drivers/gpu/drm/i915/i915_debugfs.c
+++ b/drivers/gpu/drm/i915/i915_debugfs.c
@@ -2463,9 +2463,9 @@ static void i915_guc_client_info(struct seq_file *m,

  	for_each_ring(ring, dev_priv, i) {
  		seq_printf(m, "\tSubmissions: %llu %s\n",
-				client->submissions[i],
+				client->submissions[ring->guc_id],
  				ring->name);
-		tot += client->submissions[i];
+		tot += client->submissions[ring->guc_id];
  	}
  	seq_printf(m, "\tTotal: %llu\n", tot);
  }
@@ -2502,10 +2502,10 @@ static int i915_guc_info(struct seq_file *m, void *data)

  	seq_printf(m, "\nGuC submissions:\n");
  	for_each_ring(ring, dev_priv, i) {
-		seq_printf(m, "\t%-24s: %10llu, last seqno 0x%08x %9d\n",
-			ring->name, guc.submissions[i],
-			guc.last_seqno[i], guc.last_seqno[i]);
-		total += guc.submissions[i];
+		seq_printf(m, "\t%-24s: %10llu, last seqno 0x%08x\n",
+			ring->name, guc.submissions[ring->guc_id],
+			guc.last_seqno[ring->guc_id]);
+		total += guc.submissions[ring->guc_id];
  	}
  	seq_printf(m, "\t%s: %llu\n", "Total", total);

diff --git a/drivers/gpu/drm/i915/i915_guc_submission.c b/drivers/gpu/drm/i915/i915_guc_submission.c
index 51ae5c1..b4da20f 100644
--- a/drivers/gpu/drm/i915/i915_guc_submission.c
+++ b/drivers/gpu/drm/i915/i915_guc_submission.c
@@ -376,6 +376,8 @@ static void guc_init_proc_desc(struct intel_guc *guc,
  static void guc_init_ctx_desc(struct intel_guc *guc,
  			      struct i915_guc_client *client)
  {
+	struct drm_i915_private *dev_priv = guc_to_i915(guc);
+	struct intel_engine_cs *ring;
  	struct intel_context *ctx = client->owner;
  	struct guc_context_desc desc;
  	struct sg_table *sg;
@@ -388,10 +390,8 @@ static void guc_init_ctx_desc(struct intel_guc *guc,
  	desc.priority = client->priority;
  	desc.db_id = client->doorbell_id;

-	for (i = 0; i < I915_NUM_RINGS; i++) {
-		struct guc_execlist_context *lrc = &desc.lrc[i];
-		struct intel_ringbuffer *ringbuf = ctx->engine[i].ringbuf;
-		struct intel_engine_cs *ring;
+	for_each_ring(ring, dev_priv, i) {
+		struct guc_execlist_context *lrc = &desc.lrc[ring->guc_id];
  		struct drm_i915_gem_object *obj;
  		uint64_t ctx_desc;

@@ -406,7 +406,6 @@ static void guc_init_ctx_desc(struct intel_guc *guc,
  		if (!obj)
  			break;	/* XXX: continue? */

-		ring = ringbuf->ring;
  		ctx_desc = intel_lr_context_descriptor(ctx, ring);
  		lrc->context_desc = (u32)ctx_desc;

@@ -414,16 +413,16 @@ static void guc_init_ctx_desc(struct intel_guc *guc,
  		lrc->ring_lcra = i915_gem_obj_ggtt_offset(obj) +
  				LRC_STATE_PN * PAGE_SIZE;
  		lrc->context_id = (client->ctx_index << GUC_ELC_CTXID_OFFSET) |
-				(ring->id << GUC_ELC_ENGINE_OFFSET);
+				(ring->guc_id << GUC_ELC_ENGINE_OFFSET);

-		obj = ringbuf->obj;
+		obj = ctx->engine[i].ringbuf->obj;

  		lrc->ring_begin = i915_gem_obj_ggtt_offset(obj);
  		lrc->ring_end = lrc->ring_begin + obj->base.size - 1;
  		lrc->ring_next_free_location = lrc->ring_begin;
  		lrc->ring_current_tail_pointer_value = 0;

-		desc.engines_used |= (1 << ring->id);
+		desc.engines_used |= (1 << ring->guc_id);
  	}

  	WARN_ON(desc.engines_used == 0);
@@ -510,7 +509,6 @@ int i915_guc_wq_check_space(struct i915_guc_client *gc)
  static int guc_add_workqueue_item(struct i915_guc_client *gc,
  				  struct drm_i915_gem_request *rq)
  {
-	enum intel_ring_id ring_id = rq->ring->id;
  	struct guc_wq_item *wqi;
  	void *base;
  	u32 tail, wq_len, wq_off, space;
@@ -544,7 +542,7 @@ static int guc_add_workqueue_item(struct i915_guc_client *gc,
  	wq_len = sizeof(struct guc_wq_item) / sizeof(u32) - 1;
  	wqi->header = WQ_TYPE_INORDER |
  			(wq_len << WQ_LEN_SHIFT) |
-			(ring_id << WQ_TARGET_SHIFT) |
+			(rq->ring->guc_id << WQ_TARGET_SHIFT) |
  			WQ_NO_WCFLUSH_WAIT;

  	/* The GuC wants only the low-order word of the context descriptor */
@@ -594,7 +592,7 @@ int i915_guc_submit(struct i915_guc_client *client,
  		    struct drm_i915_gem_request *rq)
  {
  	struct intel_guc *guc = client->guc;
-	enum intel_ring_id ring_id = rq->ring->id;
+	unsigned int engine_id = rq->ring->guc_id;
  	int q_ret, b_ret;

  	/* Need this because of the deferred pin ctx and ring */
@@ -605,7 +603,7 @@ int i915_guc_submit(struct i915_guc_client *client,
  	if (q_ret == 0)
  		b_ret = guc_ring_doorbell(client);

-	client->submissions[ring_id] += 1;
+	client->submissions[engine_id] += 1;
  	if (q_ret) {
  		client->q_fail += 1;
  		client->retcode = q_ret;
@@ -615,8 +613,8 @@ int i915_guc_submit(struct i915_guc_client *client,
  	} else {
  		client->retcode = 0;
  	}
-	guc->submissions[ring_id] += 1;
-	guc->last_seqno[ring_id] = rq->seqno;
+	guc->submissions[engine_id] += 1;
+	guc->last_seqno[engine_id] = rq->seqno;

  	return q_ret;
  }
@@ -848,7 +846,7 @@ static void init_guc_policies(struct guc_policies *policies)
  	policies->max_num_work_items = POLICY_MAX_NUM_WI;

  	for (p = 0; p < GUC_CTX_PRIORITY_NUM; p++) {
-		for (i = 0; i < I915_NUM_RINGS; i++) {
+		for (i = GUC_RENDER_ENGINE; i < GUC_MAX_ENGINES_NUM; i++) {
  			policy = &policies->policy[p][i];

  			policy->execution_quantum = 1000000;
@@ -900,7 +898,7 @@ static void guc_create_ads(struct intel_guc *guc)
  	ads->golden_context_lrca = ring->status_page.gfx_addr;

  	for_each_ring(ring, dev_priv, i)
-		ads->eng_state_size[i] = intel_lr_context_size(ring);
+		ads->eng_state_size[ring->guc_id] = intel_lr_context_size(ring);

  	/* GuC scheduling policies */
  	policies = (void *)ads + sizeof(struct guc_ads);
@@ -912,12 +910,12 @@ static void guc_create_ads(struct intel_guc *guc)
  	/* MMIO reg state */
  	reg_state = (void *)policies + sizeof(struct guc_policies);

-	for (i = 0; i < I915_NUM_RINGS; i++) {
-		reg_state->mmio_white_list[i].mmio_start =
-			dev_priv->ring[i].mmio_base + GUC_MMIO_WHITE_LIST_START;
+	for_each_ring(ring, dev_priv, i) {
+		reg_state->mmio_white_list[ring->guc_id].mmio_start =
+			ring->mmio_base + GUC_MMIO_WHITE_LIST_START;

  		/* Nothing to be saved or restored for now. */
-		reg_state->mmio_white_list[i].count = 0;
+		reg_state->mmio_white_list[ring->guc_id].count = 0;
  	}

  	ads->reg_state_addr = ads->scheduler_policies +
diff --git a/drivers/gpu/drm/i915/intel_guc.h b/drivers/gpu/drm/i915/intel_guc.h
index 045b149..73002e9 100644
--- a/drivers/gpu/drm/i915/intel_guc.h
+++ b/drivers/gpu/drm/i915/intel_guc.h
@@ -46,7 +46,7 @@ struct i915_guc_client {
  	uint32_t wq_head;

  	/* GuC submission statistics & status */
-	uint64_t submissions[I915_NUM_RINGS];
+	uint64_t submissions[GUC_MAX_ENGINES_NUM];
  	uint32_t q_fail;
  	uint32_t b_fail;
  	int retcode;
@@ -106,8 +106,8 @@ struct intel_guc {
  	uint32_t action_fail;		/* Total number of failures	*/
  	int32_t action_err;		/* Last error code		*/

-	uint64_t submissions[I915_NUM_RINGS];
-	uint32_t last_seqno[I915_NUM_RINGS];
+	uint64_t submissions[GUC_MAX_ENGINES_NUM];
+	uint32_t last_seqno[GUC_MAX_ENGINES_NUM];
  };

  /* intel_guc_loader.c */
diff --git a/drivers/gpu/drm/i915/intel_guc_fwif.h b/drivers/gpu/drm/i915/intel_guc_fwif.h
index 1856a47..2de57ff 100644
--- a/drivers/gpu/drm/i915/intel_guc_fwif.h
+++ b/drivers/gpu/drm/i915/intel_guc_fwif.h
@@ -44,6 +44,13 @@
  #define GUC_MAX_GPU_CONTEXTS		1024
  #define	GUC_INVALID_CTX_ID		GUC_MAX_GPU_CONTEXTS

+#define GUC_RENDER_ENGINE		0
+#define GUC_VIDEO_ENGINE		1
+#define GUC_BLITTER_ENGINE		2
+#define GUC_VIDEOENHANCE_ENGINE		3
+#define GUC_VIDEO_ENGINE2		4
+#define GUC_MAX_ENGINES_NUM		(GUC_VIDEO_ENGINE2 + 1)
+
  /* Work queue item header definitions */
  #define WQ_STATUS_ACTIVE		1
  #define WQ_STATUS_SUSPENDED		2
@@ -285,7 +292,7 @@ struct guc_context_desc {
  	u64 db_trigger_phy;
  	u16 db_id;

-	struct guc_execlist_context lrc[I915_NUM_RINGS];
+	struct guc_execlist_context lrc[GUC_MAX_ENGINES_NUM];

  	u8 attribute;

@@ -344,7 +351,7 @@ struct guc_policy {
  } __packed;

  struct guc_policies {
-	struct guc_policy policy[GUC_CTX_PRIORITY_NUM][I915_NUM_RINGS];
+	struct guc_policy policy[GUC_CTX_PRIORITY_NUM][GUC_MAX_ENGINES_NUM];

  	/* In micro seconds. How much time to allow before DPC processing is
  	 * called back via interrupt (to prevent DPC queue drain starving).
@@ -388,14 +395,14 @@ struct guc_mmio_regset {

  struct guc_mmio_reg_state {
  	struct guc_mmio_regset global_reg;
-	struct guc_mmio_regset engine_reg[I915_NUM_RINGS];
+	struct guc_mmio_regset engine_reg[GUC_MAX_ENGINES_NUM];

  	/* MMIO registers that are set as non privileged */
  	struct __packed {
  		u32 mmio_start;
  		u32 offsets[GUC_MMIO_WHITE_LIST_MAX];
  		u32 count;
-	} mmio_white_list[I915_NUM_RINGS];
+	} mmio_white_list[GUC_MAX_ENGINES_NUM];
  } __packed;

  /* GuC Additional Data Struct */
@@ -406,7 +413,7 @@ struct guc_ads {
  	u32 golden_context_lrca;
  	u32 scheduler_policies;
  	u32 reserved0[3];
-	u32 eng_state_size[I915_NUM_RINGS];
+	u32 eng_state_size[GUC_MAX_ENGINES_NUM];
  	u32 reserved2[4];
  } __packed;

diff --git a/drivers/gpu/drm/i915/intel_lrc.c b/drivers/gpu/drm/i915/intel_lrc.c
index 73d4347..efb91ad 100644
--- a/drivers/gpu/drm/i915/intel_lrc.c
+++ b/drivers/gpu/drm/i915/intel_lrc.c
@@ -2086,6 +2086,7 @@ static int logical_render_ring_init(struct drm_device *dev)
  	ring->name = "render ring";
  	ring->id = RCS;
  	ring->exec_id = I915_EXEC_RENDER;
+	ring->guc_id = GUC_RENDER_ENGINE;
  	ring->mmio_base = RENDER_RING_BASE;

  	logical_ring_default_irqs(ring, GEN8_RCS_IRQ_SHIFT);
@@ -2137,6 +2138,7 @@ static int logical_bsd_ring_init(struct drm_device *dev)
  	ring->name = "bsd ring";
  	ring->id = VCS;
  	ring->exec_id = I915_EXEC_BSD;
+	ring->guc_id = GUC_VIDEO_ENGINE;
  	ring->mmio_base = GEN6_BSD_RING_BASE;

  	logical_ring_default_irqs(ring, GEN8_VCS1_IRQ_SHIFT);
@@ -2153,6 +2155,7 @@ static int logical_bsd2_ring_init(struct drm_device *dev)
  	ring->name = "bsd2 ring";
  	ring->id = VCS2;
  	ring->exec_id = I915_EXEC_BSD;
+	ring->guc_id = GUC_VIDEO_ENGINE2;
  	ring->mmio_base = GEN8_BSD2_RING_BASE;

  	logical_ring_default_irqs(ring, GEN8_VCS2_IRQ_SHIFT);
@@ -2169,6 +2172,7 @@ static int logical_blt_ring_init(struct drm_device *dev)
  	ring->name = "blitter ring";
  	ring->id = BCS;
  	ring->exec_id = I915_EXEC_BLT;
+	ring->guc_id = GUC_BLITTER_ENGINE;
  	ring->mmio_base = BLT_RING_BASE;

  	logical_ring_default_irqs(ring, GEN8_BCS_IRQ_SHIFT);
@@ -2185,6 +2189,7 @@ static int logical_vebox_ring_init(struct drm_device *dev)
  	ring->name = "video enhancement ring";
  	ring->id = VECS;
  	ring->exec_id = I915_EXEC_VEBOX;
+	ring->guc_id = GUC_VIDEOENHANCE_ENGINE;
  	ring->mmio_base = VEBOX_RING_BASE;

  	logical_ring_default_irqs(ring, GEN8_VECS_IRQ_SHIFT);
diff --git a/drivers/gpu/drm/i915/intel_ringbuffer.h b/drivers/gpu/drm/i915/intel_ringbuffer.h
index b12f2aa..566b0ae 100644
--- a/drivers/gpu/drm/i915/intel_ringbuffer.h
+++ b/drivers/gpu/drm/i915/intel_ringbuffer.h
@@ -158,6 +158,7 @@ struct  intel_engine_cs {
  #define I915_NUM_RINGS 5
  #define _VCS(n) (VCS + (n))
  	unsigned int exec_id;
+	unsigned int guc_id;
  	u32		mmio_base;
  	struct		drm_device *dev;
  	struct intel_ringbuffer *buffer;


Looks OK to me, with a caveat that I don't know much about GuC. But obviously is needed to fix the fallout from my decoupling. And it sounds good to explicitly document this GuC dependency so:

Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx>

Regards,

Tvrtko
_______________________________________________
Intel-gfx mailing list
Intel-gfx@xxxxxxxxxxxxxxxxxxxxx
http://lists.freedesktop.org/mailman/listinfo/intel-gfx




[Index of Archives]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]
  Powered by Linux