diff mbox series

drm/i915/gt: Only disable powergating around rcs activity

Message ID 20191219164551.9402-1-chris@chris-wilson.co.uk (mailing list archive)
State New, archived
Headers show
Series drm/i915/gt: Only disable powergating around rcs activity | expand

Commit Message

Chris Wilson Dec. 19, 2019, 4:45 p.m. UTC
References: https://gitlab.freedesktop.org/drm/intel/issues/846
Cc: Imre Deak <imre.deak@intel.com>
Cc: Eero Tamminen <eero.t.tamminen@intel.com>
---
 drivers/gpu/drm/i915/gt/intel_engine_pm.c |  4 ++
 drivers/gpu/drm/i915/gt/intel_rc6.c       | 46 +++++++++++++++++++----
 drivers/gpu/drm/i915/gt/intel_rc6.h       |  3 ++
 drivers/gpu/drm/i915/gt/intel_rc6_types.h |  6 +++
 4 files changed, 52 insertions(+), 7 deletions(-)

Comments

Eero Tamminen Dec. 20, 2019, 4:30 p.m. UTC | #1
Hi,

According to quick testing I did, this clearly helps with low-power 
Media transcoding on BXT, and a bit on some other cases both on BXT & 
KBL GT3e.

However, it also seems to regress some cases.  They have too much 
variance to say for sure though (and because I can't build exactly same 
commit due to drm-tip getting rebased all the time).

Cases that may have regressed are similar to low-power ones, just using 
MediaSDK sample application and compute for encoding. For example:
sample_multi_transcode -i::h264 720x480p_30.00_4mb_h264_cabac_180s.264 
-o::h264 output.h264 -b 2000 -u 4 -n 4800 -async 4 -hw

(Chris, MediaSDK build installs sample_multi_transcode to 
share/mfx/samples/ directory.)


	- Eero

On 19.12.2019 18.45, Chris Wilson wrote:
> References: https://gitlab.freedesktop.org/drm/intel/issues/846
> Cc: Imre Deak <imre.deak@intel.com>
> Cc: Eero Tamminen <eero.t.tamminen@intel.com>
> ---
>   drivers/gpu/drm/i915/gt/intel_engine_pm.c |  4 ++
>   drivers/gpu/drm/i915/gt/intel_rc6.c       | 46 +++++++++++++++++++----
>   drivers/gpu/drm/i915/gt/intel_rc6.h       |  3 ++
>   drivers/gpu/drm/i915/gt/intel_rc6_types.h |  6 +++
>   4 files changed, 52 insertions(+), 7 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_pm.c b/drivers/gpu/drm/i915/gt/intel_engine_pm.c
> index 8fb7b34fc5a6..1886d604f1ad 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_pm.c
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_pm.c
> @@ -36,6 +36,8 @@ static int __engine_unpark(struct intel_wakeref *wf)
>   	if (engine->unpark)
>   		engine->unpark(engine);
>   
> +	intel_rc6_unpark_engine(&engine->gt->rc6, engine);
> +
>   	intel_engine_unpark_heartbeat(engine);
>   	return 0;
>   }
> @@ -232,6 +234,8 @@ static int __engine_park(struct intel_wakeref *wf)
>   	intel_engine_disarm_breadcrumbs(engine);
>   	intel_engine_pool_park(&engine->pool);
>   
> +	intel_rc6_park_engine(&engine->gt->rc6, engine);
> +
>   	/* Must be reset upon idling, or we may miss the busy wakeup. */
>   	GEM_BUG_ON(engine->execlists.queue_priority_hint != INT_MIN);
>   
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.c b/drivers/gpu/drm/i915/gt/intel_rc6.c
> index 9e303c29d6e3..7024c34917a2 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6.c
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6.c
> @@ -175,13 +175,7 @@ static void gen9_rc6_enable(struct intel_rc6 *rc6)
>   		GEN6_RC_CTL_RC6_ENABLE |
>   		rc6_mode;
>   
> -	/*
> -	 * WaRsDisableCoarsePowerGating:skl,cnl
> -	 *   - Render/Media PG need to be disabled with RC6.
> -	 */
> -	if (!NEEDS_WaRsDisableCoarsePowerGating(rc6_to_i915(rc6)))
> -		set(uncore, GEN9_PG_ENABLE,
> -		    GEN9_RENDER_PG_ENABLE | GEN9_MEDIA_PG_ENABLE);
> +	rc6->engines[RENDER_CLASS].pg_enable = GEN9_RENDER_PG_ENABLE | GEN9_MEDIA_PG_ENABLE;
>   }
>   
>   static void gen8_rc6_enable(struct intel_rc6 *rc6)
> @@ -601,6 +595,44 @@ void intel_rc6_unpark(struct intel_rc6 *rc6)
>   	set(uncore, GEN6_RC_CONTROL, rc6->ctl_enable);
>   }
>   
> +void intel_rc6_unpark_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine)
> +{
> +	struct intel_uncore *uncore = rc6_to_uncore(rc6);
> +	struct intel_pg_engine *e = &rc6->engines[engine->class];
> +
> +	if (!rc6->enabled)
> +		return;
> +
> +	if (!e->pg_enable)
> +		return;
> +
> +	spin_lock_irq(&uncore->lock);
> +	if (!e->active++) {
> +		rc6->pg_enable &= ~e->pg_enable;
> +		set(uncore, GEN9_PG_ENABLE, rc6->pg_enable);
> +	}
> +	spin_unlock_irq(&uncore->lock);
> +}
> +
> +void intel_rc6_park_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine)
> +{
> +	struct intel_uncore *uncore = rc6_to_uncore(rc6);
> +	struct intel_pg_engine *e = &rc6->engines[engine->class];
> +
> +	if (!rc6->enabled)
> +		return;
> +
> +	if (!e->pg_enable)
> +		return;
> +
> +	spin_lock_irq(&uncore->lock);
> +	if (e->active > 0 && !--e->active) {
> +		rc6->pg_enable |= e->pg_enable;
> +		set(uncore, GEN9_PG_ENABLE, rc6->pg_enable);
> +	}
> +	spin_unlock_irq(&uncore->lock);
> +}
> +
>   void intel_rc6_park(struct intel_rc6 *rc6)
>   {
>   	struct intel_uncore *uncore = rc6_to_uncore(rc6);
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.h b/drivers/gpu/drm/i915/gt/intel_rc6.h
> index 9f0f23fca8af..d4e422038866 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6.h
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6.h
> @@ -18,6 +18,9 @@ void intel_rc6_fini(struct intel_rc6 *rc6);
>   void intel_rc6_unpark(struct intel_rc6 *rc6);
>   void intel_rc6_park(struct intel_rc6 *rc6);
>   
> +void intel_rc6_unpark_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine);
> +void intel_rc6_park_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine);
> +
>   void intel_rc6_sanitize(struct intel_rc6 *rc6);
>   void intel_rc6_enable(struct intel_rc6 *rc6);
>   void intel_rc6_disable(struct intel_rc6 *rc6);
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6_types.h b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> index bfbb623f7a4f..e6fce9e7b34e 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> @@ -22,6 +22,12 @@ struct intel_rc6 {
>   
>   	struct drm_i915_gem_object *pctx;
>   
> +	u32 pg_enable;
> +	struct intel_pg_engine {
> +		unsigned int active;
> +		u32 pg_enable;
> +	} engines[4];
> +
>   	bool supported : 1;
>   	bool enabled : 1;
>   	bool manual : 1;
>
diff mbox series

Patch

diff --git a/drivers/gpu/drm/i915/gt/intel_engine_pm.c b/drivers/gpu/drm/i915/gt/intel_engine_pm.c
index 8fb7b34fc5a6..1886d604f1ad 100644
--- a/drivers/gpu/drm/i915/gt/intel_engine_pm.c
+++ b/drivers/gpu/drm/i915/gt/intel_engine_pm.c
@@ -36,6 +36,8 @@  static int __engine_unpark(struct intel_wakeref *wf)
 	if (engine->unpark)
 		engine->unpark(engine);
 
+	intel_rc6_unpark_engine(&engine->gt->rc6, engine);
+
 	intel_engine_unpark_heartbeat(engine);
 	return 0;
 }
@@ -232,6 +234,8 @@  static int __engine_park(struct intel_wakeref *wf)
 	intel_engine_disarm_breadcrumbs(engine);
 	intel_engine_pool_park(&engine->pool);
 
+	intel_rc6_park_engine(&engine->gt->rc6, engine);
+
 	/* Must be reset upon idling, or we may miss the busy wakeup. */
 	GEM_BUG_ON(engine->execlists.queue_priority_hint != INT_MIN);
 
diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.c b/drivers/gpu/drm/i915/gt/intel_rc6.c
index 9e303c29d6e3..7024c34917a2 100644
--- a/drivers/gpu/drm/i915/gt/intel_rc6.c
+++ b/drivers/gpu/drm/i915/gt/intel_rc6.c
@@ -175,13 +175,7 @@  static void gen9_rc6_enable(struct intel_rc6 *rc6)
 		GEN6_RC_CTL_RC6_ENABLE |
 		rc6_mode;
 
-	/*
-	 * WaRsDisableCoarsePowerGating:skl,cnl
-	 *   - Render/Media PG need to be disabled with RC6.
-	 */
-	if (!NEEDS_WaRsDisableCoarsePowerGating(rc6_to_i915(rc6)))
-		set(uncore, GEN9_PG_ENABLE,
-		    GEN9_RENDER_PG_ENABLE | GEN9_MEDIA_PG_ENABLE);
+	rc6->engines[RENDER_CLASS].pg_enable = GEN9_RENDER_PG_ENABLE | GEN9_MEDIA_PG_ENABLE;
 }
 
 static void gen8_rc6_enable(struct intel_rc6 *rc6)
@@ -601,6 +595,44 @@  void intel_rc6_unpark(struct intel_rc6 *rc6)
 	set(uncore, GEN6_RC_CONTROL, rc6->ctl_enable);
 }
 
+void intel_rc6_unpark_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine)
+{
+	struct intel_uncore *uncore = rc6_to_uncore(rc6);
+	struct intel_pg_engine *e = &rc6->engines[engine->class];
+
+	if (!rc6->enabled)
+		return;
+
+	if (!e->pg_enable)
+		return;
+
+	spin_lock_irq(&uncore->lock);
+	if (!e->active++) {
+		rc6->pg_enable &= ~e->pg_enable;
+		set(uncore, GEN9_PG_ENABLE, rc6->pg_enable);
+	}
+	spin_unlock_irq(&uncore->lock);
+}
+
+void intel_rc6_park_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine)
+{
+	struct intel_uncore *uncore = rc6_to_uncore(rc6);
+	struct intel_pg_engine *e = &rc6->engines[engine->class];
+
+	if (!rc6->enabled)
+		return;
+
+	if (!e->pg_enable)
+		return;
+
+	spin_lock_irq(&uncore->lock);
+	if (e->active > 0 && !--e->active) {
+		rc6->pg_enable |= e->pg_enable;
+		set(uncore, GEN9_PG_ENABLE, rc6->pg_enable);
+	}
+	spin_unlock_irq(&uncore->lock);
+}
+
 void intel_rc6_park(struct intel_rc6 *rc6)
 {
 	struct intel_uncore *uncore = rc6_to_uncore(rc6);
diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.h b/drivers/gpu/drm/i915/gt/intel_rc6.h
index 9f0f23fca8af..d4e422038866 100644
--- a/drivers/gpu/drm/i915/gt/intel_rc6.h
+++ b/drivers/gpu/drm/i915/gt/intel_rc6.h
@@ -18,6 +18,9 @@  void intel_rc6_fini(struct intel_rc6 *rc6);
 void intel_rc6_unpark(struct intel_rc6 *rc6);
 void intel_rc6_park(struct intel_rc6 *rc6);
 
+void intel_rc6_unpark_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine);
+void intel_rc6_park_engine(struct intel_rc6 *rc6, struct intel_engine_cs *engine);
+
 void intel_rc6_sanitize(struct intel_rc6 *rc6);
 void intel_rc6_enable(struct intel_rc6 *rc6);
 void intel_rc6_disable(struct intel_rc6 *rc6);
diff --git a/drivers/gpu/drm/i915/gt/intel_rc6_types.h b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
index bfbb623f7a4f..e6fce9e7b34e 100644
--- a/drivers/gpu/drm/i915/gt/intel_rc6_types.h
+++ b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
@@ -22,6 +22,12 @@  struct intel_rc6 {
 
 	struct drm_i915_gem_object *pctx;
 
+	u32 pg_enable;
+	struct intel_pg_engine {
+		unsigned int active;
+		u32 pg_enable;
+	} engines[4];
+
 	bool supported : 1;
 	bool enabled : 1;
 	bool manual : 1;