[v3] drm/i915: Prevent waiting inside ring construction for critical sections

Message ID	20210203150012.11322-1-chris@chris-wilson.co.uk (mailing list archive)
State	New, archived
Headers	show Return-Path: <SRS0=vatO=HF=lists.freedesktop.org=intel-gfx-bounces@kernel.org> DMARC-Filter: OpenDMARC Filter v1.3.2 mail.kernel.org 78C1664F7C From: Chris Wilson <chris@chris-wilson.co.uk> To: intel-gfx@lists.freedesktop.org Date: Wed, 3 Feb 2021 15:00:12 +0000 Message-Id: <20210203150012.11322-1-chris@chris-wilson.co.uk> In-Reply-To: <20210203124740.9354-1-chris@chris-wilson.co.uk> References: <20210203124740.9354-1-chris@chris-wilson.co.uk> MIME-Version: 1.0 Subject: [Intel-gfx] [PATCH v3] drm/i915: Prevent waiting inside ring construction for critical sections Precedence: list Cc: Chris Wilson <chris@chris-wilson.co.uk> Content-Type: text/plain; charset="us-ascii" Content-Transfer-Encoding: 7bit Errors-To: intel-gfx-bounces@lists.freedesktop.org Sender: "Intel-gfx" <intel-gfx-bounces@lists.freedesktop.org>
Series	[v3] drm/i915: Prevent waiting inside ring construction for critical sections \| expand [v3] drm/i915: Prevent waiting inside ring construction for critical sections

diff --git a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c index fe170186dd42..d2dc9f093119 100644 --- a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c +++ b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c @@ -1256,6 +1256,20 @@ static int reloc_move_to_gpu(struct i915_request *rq, struct i915_vma *vma) return err; } +static struct i915_request * +eb_request_create(struct i915_execbuffer *eb, struct intel_context *ce) +{ + gfp_t gfp = GFP_KERNEL | __GFP_NOWARN; + unsigned long flags= 0; + + if (eb->file->filp->f_flags & O_NONBLOCK) { + flags = BIT(I915_FENCE_FLAG_NOWAIT); + gfp |= __GFP_RETRY_MAYFAIL; + } + + return __i915_request_create(ce, flags, gfp); +} + static int __reloc_gpu_alloc(struct i915_execbuffer *eb, struct intel_engine_cs *engine, struct i915_vma *vma, @@ -1301,7 +1315,7 @@ static int __reloc_gpu_alloc(struct i915_execbuffer *eb, goto err_unmap; if (engine == eb->context->engine) { - rq = i915_request_create(eb->context); + rq = eb_request_create(eb, eb->context); } else { struct intel_context *ce = eb->reloc_context; @@ -1321,7 +1335,7 @@ static int __reloc_gpu_alloc(struct i915_execbuffer *eb, if (err) goto err_unpin; - rq = i915_request_create(ce); + rq = eb_request_create(eb, ce); intel_context_unpin(ce); } if (IS_ERR(rq)) { @@ -3283,7 +3297,7 @@ i915_gem_do_execbuffer(struct drm_device *dev, GEM_BUG_ON(eb.reloc_cache.rq); /* Allocate a request for this batch buffer nice and early. 
*/ - eb.request = i915_request_create(eb.context); + eb.request = eb_request_create(&eb, eb.context); if (IS_ERR(eb.request)) { err = PTR_ERR(eb.request); goto err_vma; diff --git a/drivers/gpu/drm/i915/gt/intel_engine_heartbeat.c b/drivers/gpu/drm/i915/gt/intel_engine_heartbeat.c index 778bcae5ef2c..12b58ba5bcd8 100644 --- a/drivers/gpu/drm/i915/gt/intel_engine_heartbeat.c +++ b/drivers/gpu/drm/i915/gt/intel_engine_heartbeat.c @@ -40,9 +40,14 @@ static struct i915_request * heartbeat_create(struct intel_context *ce, gfp_t gfp) { struct i915_request *rq; + unsigned long flags; + + flags = 0; + if ((gfp & __GFP_RECLAIM) == 0) + flags = BIT(I915_FENCE_FLAG_NOWAIT); intel_context_enter(ce); - rq = __i915_request_create(ce, gfp); + rq = __i915_request_create_locked(ce, flags, gfp); intel_context_exit(ce); return rq; diff --git a/drivers/gpu/drm/i915/gt/intel_engine_pm.c b/drivers/gpu/drm/i915/gt/intel_engine_pm.c index 6372d7826bc9..d9bed542136a 100644 --- a/drivers/gpu/drm/i915/gt/intel_engine_pm.c +++ b/drivers/gpu/drm/i915/gt/intel_engine_pm.c @@ -200,7 +200,7 @@ static bool switch_to_kernel_context(struct intel_engine_cs *engine) flags = __timeline_mark_lock(ce); GEM_BUG_ON(atomic_read(&ce->timeline->active_count) < 0); - rq = __i915_request_create(ce, GFP_NOWAIT); + rq = __i915_request_create_locked(ce, BIT(I915_FENCE_FLAG_NOWAIT), GFP_NOWAIT); if (IS_ERR(rq)) /* Context switch failed, hope for the best! Maybe reset? 
*/ goto out_unlock; diff --git a/drivers/gpu/drm/i915/gt/intel_ring.c b/drivers/gpu/drm/i915/gt/intel_ring.c index aee0a77c77e0..9f149fdc8416 100644 --- a/drivers/gpu/drm/i915/gt/intel_ring.c +++ b/drivers/gpu/drm/i915/gt/intel_ring.c @@ -184,9 +184,10 @@ void intel_ring_free(struct kref *ref) static noinline int wait_for_space(struct intel_ring *ring, - struct intel_timeline *tl, + struct i915_request *rq, unsigned int bytes) { + struct intel_timeline *tl = i915_request_timeline(rq); struct i915_request *target; long timeout; @@ -207,11 +208,13 @@ wait_for_space(struct intel_ring *ring, if (GEM_WARN_ON(&target->link == &tl->requests)) return -ENOSPC; - timeout = i915_request_wait(target, - I915_WAIT_INTERRUPTIBLE, - MAX_SCHEDULE_TIMEOUT); - if (timeout < 0) - return timeout; + timeout = MAX_SCHEDULE_TIMEOUT; + if (i915_request_nowait(rq)) + timeout = 0; + + timeout = i915_request_wait(target, I915_WAIT_INTERRUPTIBLE, timeout); + if (unlikely(timeout < 0)) + return i915_request_nowait(rq) ? 
-EWOULDBLOCK : timeout; i915_request_retire_upto(target); @@ -271,9 +274,7 @@ u32 *intel_ring_begin(struct i915_request *rq, unsigned int num_dwords) */ GEM_BUG_ON(!rq->reserved_space); - ret = wait_for_space(ring, - i915_request_timeline(rq), - total_bytes); + ret = wait_for_space(ring, rq, total_bytes); if (unlikely(ret)) return ERR_PTR(ret); } diff --git a/drivers/gpu/drm/i915/i915_request.c b/drivers/gpu/drm/i915/i915_request.c index a336d6c40d8b..04ca4fe54633 100644 --- a/drivers/gpu/drm/i915/i915_request.c +++ b/drivers/gpu/drm/i915/i915_request.c @@ -799,7 +799,7 @@ static void __i915_request_ctor(void *arg) } struct i915_request * -__i915_request_create(struct intel_context *ce, gfp_t gfp) +__i915_request_create_locked(struct intel_context *ce, unsigned long flags, gfp_t gfp) { struct intel_timeline *tl = ce->timeline; struct i915_request *rq; @@ -856,7 +856,7 @@ __i915_request_create(struct intel_context *ce, gfp_t gfp) rq->execution_mask = ce->engine->mask; kref_init(&rq->fence.refcount); - rq->fence.flags = 0; + rq->fence.flags = flags; rq->fence.error = 0; INIT_LIST_HEAD(&rq->fence.cb_list); @@ -934,7 +934,7 @@ __i915_request_create(struct intel_context *ce, gfp_t gfp) } struct i915_request * -i915_request_create(struct intel_context *ce) +__i915_request_create(struct intel_context *ce, unsigned long flags, gfp_t gfp) { struct i915_request *rq; struct intel_timeline *tl; @@ -949,7 +949,7 @@ i915_request_create(struct intel_context *ce) i915_request_retire(rq); intel_context_enter(ce); - rq = __i915_request_create(ce, GFP_KERNEL); + rq = __i915_request_create_locked(ce, flags, gfp); intel_context_exit(ce); /* active reference transferred to request */ if (IS_ERR(rq)) goto err_unlock; diff --git a/drivers/gpu/drm/i915/i915_request.h b/drivers/gpu/drm/i915/i915_request.h index c0bd4cb8786a..43230037f469 100644 --- a/drivers/gpu/drm/i915/i915_request.h +++ b/drivers/gpu/drm/i915/i915_request.h @@ -137,6 +137,18 @@ enum { * the GPU. 
Here we track such boost requests on a per-request basis. */ I915_FENCE_FLAG_BOOST, + + /* + * I915_FENCE_FLAG_NOWAIT - avoid waits while constructing the request + * + * We may wish to construct a request from some contexts where + * we do not want to wait, and sometimes the client would prefer + * to have a nonblocking interface. We may have to wait in a few places + * during request construction (e.g. waiting for space in the + * ringbuffer); this flag allows us to opt out of those waits and + * return -EAGAIN instead. + */ + I915_FENCE_FLAG_NOWAIT, }; /** @@ -305,9 +317,16 @@ static inline bool dma_fence_is_i915(const struct dma_fence *fence) struct kmem_cache *i915_request_slab_cache(void); struct i915_request * __must_check -__i915_request_create(struct intel_context *ce, gfp_t gfp); +__i915_request_create_locked(struct intel_context *ce, + unsigned long flags, gfp_t gfp); struct i915_request * __must_check -i915_request_create(struct intel_context *ce); +__i915_request_create(struct intel_context *ce, + unsigned long flags, gfp_t gfp); +static inline struct i915_request * +i915_request_create(struct intel_context *ce) +{ + return __i915_request_create(ce, 0, GFP_KERNEL); +} void __i915_request_skip(struct i915_request *rq); void i915_request_set_error_once(struct i915_request *rq, int error); @@ -558,6 +577,11 @@ static inline void i915_request_mark_complete(struct i915_request *rq) (u32 *)&rq->fence.seqno); } +static inline bool i915_request_nowait(const struct i915_request *rq) +{ + return test_bit(I915_FENCE_FLAG_NOWAIT, &rq->fence.flags); +} + static inline bool i915_request_has_waitboost(const struct i915_request *rq) { return test_bit(I915_FENCE_FLAG_BOOST, &rq->fence.flags);

[v3] drm/i915: Prevent waiting inside ring construction for critical sections

Commit Message

Patch