[PATCHv2.99,02/11] drm/i915: Adjust PM QoS scaling response frequency based on GPU load.

Message ID	20200428032258.2518-3-currojerez@riseup.net (mailing list archive)
State	New, archived
Headers:
  Return-Path: <SRS0=pxfJ=6M=lists.freedesktop.org=intel-gfx-bounces@kernel.org>
  DMARC-Filter: OpenDMARC Filter v1.3.2 mail.kernel.org 065FD2073C
  From: Francisco Jerez <currojerez@riseup.net>
  To: "Rafael J. Wysocki" <rjw@rjwysocki.net>, "Pandruvada\, Srinivas" <srinivas.pandruvada@intel.com>
  Date: Mon, 27 Apr 2020 20:22:49 -0700
  Message-Id: <20200428032258.2518-3-currojerez@riseup.net>
  In-Reply-To: <20200428032258.2518-1-currojerez@riseup.net>
  References: <20200428032258.2518-1-currojerez@riseup.net>
  MIME-Version: 1.0
  Subject: [Intel-gfx] [PATCHv2.99 02/11] drm/i915: Adjust PM QoS scaling response frequency based on GPU load.
  Precedence: list
  Cc: Peter Zijlstra <peterz@infradead.org>, intel-gfx@lists.freedesktop.org, chris.p.wilson@intel.com, linux-pm@vger.kernel.org
  Content-Type: text/plain; charset="us-ascii"
  Content-Transfer-Encoding: 7bit
  Errors-To: intel-gfx-bounces@lists.freedesktop.org
  Sender: "Intel-gfx" <intel-gfx-bounces@lists.freedesktop.org>
Series	[PATCHv2.99,01/11] PM: QoS: Add CPU_SCALING_RESPONSE global PM QoS limit.
Patches in this series:
  [PATCHv2.99,01/11] PM: QoS: Add CPU_SCALING_RESPONSE global PM QoS limit.
  [PATCHv2.99,02/11] drm/i915: Adjust PM QoS scaling response frequency based on GPU load.
  [PATCHv2.99,03/11] OPTIONAL: drm/i915: Expose PM QoS control parameters via debugfs.
  [PATCHv2.99,04/11] cpufreq: Define ADAPTIVE frequency governor policy.
  [PATCHv2.99,05/11] cpufreq: intel_pstate: Reorder intel_pstate_clear_update_util_hook() and intel_p…
  [PATCHv2.99,06/11] cpufreq: intel_pstate: Call intel_pstate_set_update_util_hook() once from the se…
  [PATCHv2.99,07/11] cpufreq: intel_pstate: Implement VLP controller statistics and target range calc…
  [PATCHv2.99,08/11] cpufreq: intel_pstate: Implement VLP controller for HWP parts.
  [PATCHv2.99,09/11] cpufreq: intel_pstate: Enable VLP controller based on ACPI FADT profile and CPUI…
  [PATCHv2.99,10/11] OPTIONAL: cpufreq: intel_pstate: Add tracing of VLP controller status.
  [PATCHv2.99,11/11] OPTIONAL: cpufreq: intel_pstate: Expose VLP controller parameters via debugfs.

diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c b/drivers/gpu/drm/i915/gt/intel_engine_cs.c index b1f8527f02c8..6b08a9ad2de1 100644 --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c @@ -517,6 +517,7 @@ void intel_engine_init_execlists(struct intel_engine_cs *engine) execlists->queue_priority_hint = INT_MIN; execlists->queue = RB_ROOT_CACHED; + atomic_set(&execlists->overload, 0); } static void cleanup_status_page(struct intel_engine_cs *engine) diff --git a/drivers/gpu/drm/i915/gt/intel_engine_types.h b/drivers/gpu/drm/i915/gt/intel_engine_types.h index bf395227c99f..9bdb3958dbb7 100644 --- a/drivers/gpu/drm/i915/gt/intel_engine_types.h +++ b/drivers/gpu/drm/i915/gt/intel_engine_types.h @@ -275,6 +275,17 @@ struct intel_engine_execlists { */ u8 csb_head; + /** + * @overload: whether at least two execlist ports are + * currently submitted to the hardware, indicating that CPU + * latency isn't critical in order to maintain the GPU busy. + * We use that to trigger a more energy-efficient response + * mode of CPU power management, since performance degradation + * is unlikely under those conditions, and GPU throughput may + * benefit from the increased TDP budget. + */ + atomic_t overload; + I915_SELFTEST_DECLARE(struct st_preempt_hang preempt_hang;) }; diff --git a/drivers/gpu/drm/i915/gt/intel_gt_pm.c b/drivers/gpu/drm/i915/gt/intel_gt_pm.c index 6bdb74892a1e..0d44ef3a07ad 100644 --- a/drivers/gpu/drm/i915/gt/intel_gt_pm.c +++ b/drivers/gpu/drm/i915/gt/intel_gt_pm.c @@ -107,6 +107,102 @@ void intel_gt_pm_init_early(struct intel_gt *gt) intel_wakeref_init(&gt->wakeref, gt->uncore->rpm, &wf_ops); } +/** + * Time increment until the most immediate PM QoS scaling response + * frequency update. + * + * May be in the future (return value > 0) if the GPU is currently + * active but we haven't updated the PM QoS request to reflect a + * bottleneck yet. 
May be in the past (return value < 0) if the GPU + * isn't fully utilized and we've already reset the PM QoS request to + * the default value. May be zero if a PM QoS request update is due. + * + * The time increment returned by this function decreases linearly + * with time until it reaches either zero or a configurable limit. + */ +static int32_t time_to_sf_qos_update_ns(struct intel_gt *gt) +{ + const uint64_t t1 = ktime_get_ns(); + const uint64_t dt1 = gt->sf_qos.delay_max_ns; + + if (atomic_read_acquire(&gt->sf_qos.active_count)) { + const uint64_t t0 = atomic64_read(&gt->sf_qos.time_set_ns); + + return min(dt1, t0 <= t1 ? 0 : t0 - t1); + } else { + const uint64_t t0 = atomic64_read(&gt->sf_qos.time_clear_ns); + const unsigned int shift = gt->sf_qos.delay_slope_shift; + + return -(int32_t)(t1 <= t0 ? 1 : + min(dt1, (t1 - t0) << shift)); + } +} + +/** + * Perform a delayed PM QoS scaling response frequency update. + */ +static void intel_gt_sf_qos_update(struct intel_gt *gt) +{ + const uint32_t dt = max(0, time_to_sf_qos_update_ns(gt)); + + timer_reduce(&gt->sf_qos.timer, jiffies + nsecs_to_jiffies(dt)); +} + +/** + * Timer that fires once the delay used to switch the PM QoS scaling + * response frequency request has elapsed. + */ +static void intel_gt_sf_qos_timeout(struct timer_list *timer) +{ + struct intel_gt *gt = container_of(timer, struct intel_gt, + sf_qos.timer); + const int32_t dt = time_to_sf_qos_update_ns(gt); + + if (dt == 0) + cpu_scaling_response_qos_update_request( + &gt->sf_qos.req, gt->sf_qos.target_hz); + else + cpu_scaling_response_qos_update_request( + &gt->sf_qos.req, PM_QOS_DEFAULT_VALUE); + + if (dt > 0) + intel_gt_sf_qos_update(gt); +} + +/** + * Report the beginning of a period of GPU utilization to PM. 
+ * + * May trigger a more energy-efficient response mode in CPU PM, but + * only after a certain delay has elapsed so we don't have a negative + * impact on the CPU ramp-up latency except after the GPU has been + * continuously utilized for a long enough period of time. + */ +void intel_gt_pm_active_begin(struct intel_gt *gt) +{ + const uint32_t dt = abs(time_to_sf_qos_update_ns(gt)); + + atomic64_set(&gt->sf_qos.time_set_ns, ktime_get_ns() + dt); + + if (!atomic_fetch_inc_release(&gt->sf_qos.active_count)) + intel_gt_sf_qos_update(gt); +} + +/** + * Report the end of a period of GPU utilization to PM. + * + * Must be called once after each call to intel_gt_pm_active_begin(). + */ +void intel_gt_pm_active_end(struct intel_gt *gt) +{ + const uint32_t dt = abs(time_to_sf_qos_update_ns(gt)); + const unsigned int shift = gt->sf_qos.delay_slope_shift; + + atomic64_set(&gt->sf_qos.time_clear_ns, ktime_get_ns() - (dt >> shift)); + + if (!atomic_dec_return_release(&gt->sf_qos.active_count)) + intel_gt_sf_qos_update(gt); +} + void intel_gt_pm_init(struct intel_gt *gt) { /* @@ -116,6 +212,14 @@ void intel_gt_pm_init(struct intel_gt *gt) */ intel_rc6_init(&gt->rc6); intel_rps_init(&gt->rps); + + cpu_scaling_response_qos_add_request(&gt->sf_qos.req, + PM_QOS_DEFAULT_VALUE); + + gt->sf_qos.delay_max_ns = 10000000; + gt->sf_qos.delay_slope_shift = 1; + gt->sf_qos.target_hz = 2; + timer_setup(&gt->sf_qos.timer, intel_gt_sf_qos_timeout, 0); } static bool reset_engines(struct intel_gt *gt) @@ -174,6 +278,9 @@ static void gt_sanitize(struct intel_gt *gt, bool force) void intel_gt_pm_fini(struct intel_gt *gt) { + del_timer_sync(&gt->sf_qos.timer); + cpu_scaling_response_qos_remove_request(&gt->sf_qos.req); + intel_rc6_fini(&gt->rc6); } diff --git a/drivers/gpu/drm/i915/gt/intel_gt_pm.h b/drivers/gpu/drm/i915/gt/intel_gt_pm.h index 60f0e2fbe55c..43f1d45fb0db 100644 --- a/drivers/gpu/drm/i915/gt/intel_gt_pm.h +++ b/drivers/gpu/drm/i915/gt/intel_gt_pm.h @@ -58,6 +58,9 @@ int 
intel_gt_resume(struct intel_gt *gt); void intel_gt_runtime_suspend(struct intel_gt *gt); int intel_gt_runtime_resume(struct intel_gt *gt); +void intel_gt_pm_active_begin(struct intel_gt *gt); +void intel_gt_pm_active_end(struct intel_gt *gt); + static inline bool is_mock_gt(const struct intel_gt *gt) { return I915_SELFTEST_ONLY(gt->awake == -ENODEV); diff --git a/drivers/gpu/drm/i915/gt/intel_gt_types.h b/drivers/gpu/drm/i915/gt/intel_gt_types.h index 96890dd12b5f..8aaeb2450d05 100644 --- a/drivers/gpu/drm/i915/gt/intel_gt_types.h +++ b/drivers/gpu/drm/i915/gt/intel_gt_types.h @@ -10,6 +10,7 @@ #include <linux/list.h> #include <linux/mutex.h> #include <linux/notifier.h> +#include <linux/pm_qos.h> #include <linux/spinlock.h> #include <linux/types.h> @@ -97,6 +98,54 @@ struct intel_gt { * Reserved for exclusive use by the kernel. */ struct i915_address_space *vm; + + /** + * CPU response frequency QoS tracking. + */ + struct { + /** PM QoS request of this device. */ + struct pm_qos_request req; + + /** Timer used for delayed update of the PM QoS request. */ + struct timer_list timer; + + /** Response frequency target to use in GPU-bound conditions. */ + uint32_t target_hz; + + /** + * Maximum delay before the PM QoS request is updated + * after we become GPU-bound. + */ + uint32_t delay_max_ns; + + /** + * Exponent of delay slope used when the workload + * becomes non-GPU-bound, used to provide greater + * sensitivity to periods of GPU inactivity which may + * indicate that the workload is latency-bound. + */ + uint32_t delay_slope_shift; + + /** + * Last time intel_gt_pm_active_begin() was called to + * indicate that the GPU is a bottleneck. + */ + atomic64_t time_set_ns; + + /** + * Last time intel_gt_pm_active_end() was called to + * indicate that the GPU is no longer a bottleneck. + */ + atomic64_t time_clear_ns; + + /** + * Number of times intel_gt_pm_active_begin() was + * called without a matching intel_gt_pm_active_end(). 
+ * Will be greater than zero if the GPU is currently + * considered to be a bottleneck. + */ + atomic_t active_count; + } sf_qos; }; enum intel_gt_scratch_field { diff --git a/drivers/gpu/drm/i915/gt/intel_lrc.c b/drivers/gpu/drm/i915/gt/intel_lrc.c index be5d6b71b6b0..767fa88f4d20 100644 --- a/drivers/gpu/drm/i915/gt/intel_lrc.c +++ b/drivers/gpu/drm/i915/gt/intel_lrc.c @@ -2365,6 +2365,12 @@ cancel_port_requests(struct intel_engine_execlists * const execlists) smp_wmb(); /* complete the seqlock for execlists_active() */ WRITE_ONCE(execlists->active, execlists->inflight); + + if (atomic_xchg(&execlists->overload, 0)) { + struct intel_engine_cs *engine = + container_of(execlists, typeof(*engine), execlists); + intel_gt_pm_active_end(engine->gt); + } } static inline void @@ -2533,12 +2539,23 @@ static void process_csb(struct intel_engine_cs *engine) WRITE_ONCE(execlists->active, execlists->inflight); WRITE_ONCE(execlists->pending[0], NULL); + + if (execlists->inflight[1]) { + if (!atomic_xchg(&execlists->overload, 1)) + intel_gt_pm_active_begin(engine->gt); + } else { + if (atomic_xchg(&execlists->overload, 0)) + intel_gt_pm_active_end(engine->gt); + } } else { GEM_BUG_ON(!*execlists->active); /* port0 completed, advanced to port1 */ trace_ports(execlists, "completed", execlists->active); + if (atomic_xchg(&execlists->overload, 0)) + intel_gt_pm_active_end(engine->gt); + /* * We rely on the hardware being strongly * ordered, that the breadcrumb write is

[PATCHv2.99,02/11] drm/i915: Adjust PM QoS scaling response frequency based on GPU load.

Commit Message

Patch