[RFC] amdgpu: Add a context flag to disable implicit sync

Message ID 20240807153941.3668940-1-faith.ekstrand@collabora.com (mailing list archive)
State New, archived
Series [RFC] amdgpu: Add a context flag to disable implicit sync

Commit Message

Faith Ekstrand Aug. 7, 2024, 3:39 p.m. UTC
Previously, AMDGPU_GEM_CREATE_EXPLICIT_SYNC was used to disable implicit
synchronization on BOs when explicit synchronization can be used.  The
problem is that this flag is per-BO and affects all amdgpu users in the
system, not just the usermode driver which sets it.  This can lead to
some unintended consequences for userspace if not used carefully.

Since the introduction of DMA_BUF_IOCTL_EXPORT_SYNC_FILE and
DMA_BUF_IOCTL_IMPORT_SYNC_FILE, many userspace window system components
have grown the ability to convert between the Vulkan explicit sync model
and the legacy implicit sync model used by X11 and Wayland in the past.
This allows both old and new components to exist simultaneously and talk
to each other.  In particular, XWayland is able to convert between the
two to let Vulkan apps work seamlessly with older X11 compositors that
aren't aware of explicit synchronization.  This is rapidly becoming the
backbone of synchronization in the Linux window system space.
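
For illustration, a minimal userspace sketch of this conversion (the
structs, flags, and ioctls are the existing UAPI from <linux/dma-buf.h>;
the helper names are only illustrative):

#include <linux/dma-buf.h>
#include <sys/ioctl.h>

/* Pull the BO's current implicit fences out as a sync_file fd.
 * DMA_BUF_SYNC_WRITE asks for all fences, as if we were about to write;
 * DMA_BUF_SYNC_READ would ask only for the write fences. */
static int export_implicit_fences(int dmabuf_fd)
{
        struct dma_buf_export_sync_file args = {
                .flags = DMA_BUF_SYNC_WRITE,
                .fd = -1,
        };

        if (ioctl(dmabuf_fd, DMA_BUF_IOCTL_EXPORT_SYNC_FILE, &args) < 0)
                return -1;

        return args.fd;
}

/* Install an explicit sync_file as an implicit write fence on the BO so
 * that implicit-sync consumers (e.g. an old X11 compositor) wait on it. */
static int import_explicit_fence(int dmabuf_fd, int sync_file_fd)
{
        struct dma_buf_import_sync_file args = {
                .flags = DMA_BUF_SYNC_WRITE,
                .fd = sync_file_fd,
        };

        return ioctl(dmabuf_fd, DMA_BUF_IOCTL_IMPORT_SYNC_FILE, &args);
}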

Unfortunately, AMDGPU_GEM_CREATE_EXPLICIT_SYNC breaks this because it
disables all implicit synchronization on the given BO, regardless of
which userspace driver is rendering with it and regardless of the
assumptions made by the client application.  In particular, this is
causing issues with RADV and radeonsi.  RADV sets the flag to disable
implicit sync on window system buffers so that it can safely have them
resident at all times without causing internal over-synchronization.
The BO is then handed off to a compositor which composites using
radeonsi.  If the compositor uses the EGL_ANDROID_native_fence_sync
extension to pass explicit sync files through to radeonsi, then
everything is fine.  However, if that buffer ever gets handed to an
instance of radeonsi with any assumption of implicit synchronization,
radeonsi won't be able to sync on the BO because RADV disabled implicit sync
on that BO system-wide.  It doesn't matter whether some window system
component used DMA_BUF_IOCTL_IMPORT_SYNC_FILE to set the appropriate
fence on the BO, amdgpu will ignore it.

This new flag disables implicit sync on the context rather than the BO.
This way RADV can disable implicit sync (which is what RADV has always
wanted) without affecting other components in the system.  If RADV (or
some other driver) wants implicit sync on some BO, it can use
DMA_BUF_IOCTL_EXPORT_SYNC_FILE and DMA_BUF_IOCTL_IMPORT_SYNC_FILE to
manually synchronize with other implicit-sync components.  This is the
approach we've taken with NVK/nouveau and ANV/xe, and it is similar to
the approach taken by ANV/i915; it works well for those drivers.
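
For reference, a minimal sketch of how a usermode driver could allocate
such a context through libdrm (AMDGPU_CTX_ALLOC_FLAGS_EXPLICIT_SYNC is
the flag added by this patch; the helper name is only illustrative):

#include <stdint.h>
#include <xf86drm.h>
#include <amdgpu_drm.h>

static int alloc_explicit_sync_ctx(int drm_fd, uint32_t *ctx_id)
{
        union drm_amdgpu_ctx args = {0};

        args.in.op = AMDGPU_CTX_OP_ALLOC_CTX;
        args.in.priority = AMDGPU_CTX_PRIORITY_NORMAL;
        /* New in this patch: all sync for this context is explicit. */
        args.in.flags = AMDGPU_CTX_ALLOC_FLAGS_EXPLICIT_SYNC;

        if (drmIoctl(drm_fd, DRM_IOCTL_AMDGPU_CTX, &args))
                return -1;

        *ctx_id = args.out.alloc.ctx_id;
        return 0;
}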

Ideally, I would like to see something like this back-ported to at least
the kernel where DMA_BUF_IOCTL_IMPORT/EXPORT_SYNC_FILE were introduced
so that we don't have to wait another year for the fix to reach users.
However, I understand that back-porting UAPI is problematic and I'll
leave that decision up to the amdgpu maintainers.  Michel suggested that
a new CTX_OP would make more sense if we want to back-port it, but the
create flag made more sense to me from an API design PoV.

Signed-off-by: Faith Ekstrand <faith.ekstrand@collabora.com>
Cc: Alex Deucher <alexander.deucher@amd.com>
Cc: Christian König <christian.koenig@amd.com>
Cc: David Airlie <airlied@gmail.com>
Cc: Michel Dänzer <mdaenzer@redhat.com>
Cc: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
---
 drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c  |  3 ++-
 drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c | 12 ++++++++----
 drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.h |  7 +++++++
 include/uapi/drm/amdgpu_drm.h           | 12 +++++++++++-
 4 files changed, 28 insertions(+), 6 deletions(-)

Comments

Joshua Ashton Aug. 7, 2024, 7:23 p.m. UTC | #1
I was thinking about this more recently. I was initially considering "maybe this should be a per-BO import," but I couldn't think of anything in the GL model that would actually benefit, given it's not "true" bindless and there's no update-after-bind there.

Worth others more familiar with GL asking that question to themselves also. I am definitely not totally up on what's possible there.

Overall, I think I am OK with this approach, even though I think mixing implicit and explicit sync is gross, and I want the pain that is implicit sync to just go away forever. :-)

- Joshie 
Faith Ekstrand Aug. 7, 2024, 8:25 p.m. UTC | #2
On Wed, Aug 7, 2024 at 2:23 PM Joshua Ashton <joshua@froggi.es> wrote:

> I was thinking about this more recently. I was initially considering
> "maybe this should be a per-BO import," but I couldn't think of anything in
> the GL model that would actually benefit, given it's not "true" bindless and
> there's no update-after-bind there.
>

That's also an option and it's the way it works on i915. However, then you
have to pass lists of things to the kernel and that's kinda gross. If we
need it, we can do that. Otherwise, I think a more global thing is fine.  I
think Bas is currently investigating a per-submit approach which is a tad
different from either but should also work okay.


> Worth others more familiar with GL asking that question to themselves
> also. I am definitely not totally up on what's possible there.
>
> Overall, I think I am OK with this approach, even though I think mixing
> implicit and explicit sync is gross, and I want the pain that is implicit
> sync to just go away forever. :-)
>

So say we all...

~Faith



> - Joshie 
Bas Nieuwenhuizen Aug. 7, 2024, 8:33 p.m. UTC | #3
On Wed, Aug 7, 2024 at 10:25 PM Faith Ekstrand <faith@gfxstrand.net> wrote:

> On Wed, Aug 7, 2024 at 2:23 PM Joshua Ashton <joshua@froggi.es> wrote:
>
>> I was thinking about this more recently. I was initially considering
>> "maybe this should be a per-BO import," but I couldn't think of anything in
>> the GL model that would actually benefit, given it's not "true" bindless and
>> there's no update-after-bind there.
>>
>
> That's also an option and it's the way it works on i915. However, then you
> have to pass lists of things to the kernel and that's kinda gross. If we
> need it, we can do that. Otherwise, I think a more global thing is fine.  I
> think Bas is currently investigating a per-submit approach which is a tad
> different from either but should also work okay.
>
>

Yeah, I'm working on a per-submit thing (also using BOOKKEEP fences instead
of using the EXPLICIT wait mode to ensure we also don't add implicit
fences).

We do have a per-BO list on submission already, so we could add things
there; it is just very annoying to implement because, at the point where
we currently do the fence wait/signal, we have lost the association with
the BO list. Given that I don't see a use case anytime soon (there are
some theoretical ones, like radeonsi starting to do READ usage instead
of RW usage with extra tracking), I feel it isn't worth the added
implementation complexity.


>> Worth others more familiar with GL asking that question to themselves also.
>> I am definitely not totally up on what's possible there.
>>
>> Overall, I think I am OK with this approach, even though I think mixing
>> implicit and explicit sync is gross, and I want the pain that is implicit
>> sync to just go away forever. :-)
>>
>
> So say we all...
>
> ~Faith
>
>
>
>> - Joshie 
Michel Dänzer Aug. 8, 2024, 7:57 a.m. UTC | #4
On 2024-08-07 21:23, Joshua Ashton wrote:
> I was thinking about this more recently. I was initially considering "maybe this should be a per-BO import," but I couldn't think of anything in the GL model that would actually benefit, given it's not "true" bindless and there's no update-after-bind there.
> 
> Worth others more familiar with GL asking that question to themselves also. I am definitely not totally up on what's possible there.
> 
> Overall, I think I am OK with this approach, even though I think mixing implicit and explicit sync is gross, and I want the pain that is implicit sync to just go away forever. :-)

It can never go away, at least not in the drivers which have ever supported it. We can never break compatibility.
Christian König Aug. 19, 2024, 2:51 p.m. UTC | #5
On 07.08.24 at 22:33, Bas Nieuwenhuizen wrote:
> On Wed, Aug 7, 2024 at 10:25 PM Faith Ekstrand <faith@gfxstrand.net> 
> wrote:
>
>     On Wed, Aug 7, 2024 at 2:23 PM Joshua Ashton <joshua@froggi.es> wrote:
>
>         I was thinking about this more recently. I was initially
>         considering "maybe this should be a per-BO import," but I
>         couldn't think of anything in the GL model that would actually
>         benefit, given it's not "true" bindless and there's no
>         update-after-bind there.
>
>
>     That's also an option and it's the way it works on i915. However,
>     then you have to pass lists of things to the kernel and that's
>     kinda gross. If we need it, we can do that. Otherwise, I think a
>     more global thing is fine.  I think Bas is currently investigating
>     a per-submit approach which is a tad different from either but
>     should also work okay.
>
>
> Yeah, I'm working on a per-submit thing (also using BOOKKEEP fences 
> instead of using the EXPLICIT wait mode to ensure we also don't add 
> implicit fences).

Yeah, agreed. Your implementation with the per-submission flag and using
BOOKKEEP actually sounds like the right thing to do to me as well.

We need to keep in mind that synchronization goes in both ways, e.g. 
explicit->implicit as well as implicit->explicit.

I would rather like to keep the implicit->explicit handling (which this
patch here completely disables) and only allow the explicit->implicit
handling (which is achieved by using BOOKKEEP fences).

This way it is possible that we still over-synchronize, for example when
a double-buffered BO is re-used by an explicit client and an implicit
display server, but that's probably not something we should optimize in
the first place.

Regards,
Christian.

>
> We do have a per-BO list on submission already, so we could add things
> there; it is just very annoying to implement because, at the point where
> we currently do the fence wait/signal, we have lost the association with
> the BO list. Given that I don't see a use case anytime soon (there are
> some theoretical ones, like radeonsi starting to do READ usage instead
> of RW usage with extra tracking), I feel it isn't worth the added
> implementation complexity.
>
>
>         Worth others more familiar with GL asking that question to
>         themselves also. I am definitely not totally up on what's
>         possible there.
>
>         Overall, I think I am OK with this approach, even though I
>         think mixing implicit and explicit sync is gross, and I want
>         the pain that is implicit sync to just go away forever. :-)
>
>
>     So say we all...
>
>     ~Faith
>
>         - Joshie 
Bas Nieuwenhuizen Aug. 19, 2024, 2:59 p.m. UTC | #6
On Mon, Aug 19, 2024 at 4:51 PM Christian König <
ckoenig.leichtzumerken@gmail.com> wrote:

> On 07.08.24 at 22:33, Bas Nieuwenhuizen wrote:
>
> On Wed, Aug 7, 2024 at 10:25 PM Faith Ekstrand <faith@gfxstrand.net>
> wrote:
>
>> On Wed, Aug 7, 2024 at 2:23 PM Joshua Ashton <joshua@froggi.es> wrote:
>>
>>> I was thinking about this more recently. I was initially considering
>>> "maybe this should be a per-BO import," but I couldn't think of anything in
>>> the GL model that would actually benefit, given it's not "true" bindless and
>>> there's no update-after-bind there.
>>>
>>
>> That's also an option and it's the way it works on i915. However, then
>> you have to pass lists of things to the kernel and that's kinda gross. If
>> we need it, we can do that. Otherwise, I think a more global thing is
>> fine.  I think Bas is currently investigating a per-submit approach which
>> is a tad different from either but should also work okay.
>>
>>
>
> Yeah, I'm working on a per-submit thing (also using BOOKKEEP fences
> instead of using the EXPLICIT wait mode to ensure we also don't add
> implicit fences).
>
>
> Yeah, agreed. Your implementation with the per-submission flag and using
> BOOKKEEP actually sounds like the right thing to do to me as well.
>
> We need to keep in mind that synchronization goes in both ways, e.g.
> explicit->implicit as well as implicit->explicit.
>
> I would rather like to keep the implicit->explicit handling (which this
> patch here completely disables) and only allow the explicit->implicit
> handling (which is achieved by using BOOKKEEP fences).
>
> This way it is possible that we still over-synchronize, for example when
> a double-buffered BO is re-used by an explicit client and an implicit
> display server, but that's probably not something we should optimize in
> the first place.
>

This over-synchronization actually happens easily, as in bindless Vulkan
we have to mark all buffers as "used". We have some hacks to avoid the
worst of it, but it can be pretty meh.

In my series on the ML[1] I think I actually got both sides by waiting on
KERNEL fences only and setting BOOKKEEP fences. (Yeah it actually ends up
kinda orthogonal on the sync mode but it is what it is ...).

- Bas

[1] https://patchwork.freedesktop.org/series/137014/
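
For illustration, roughly what the wait/signal sides of that approach
look like in dma_resv terms (a hedged sketch, not the code from the
series; it assumes the BO's reservation lock is held and a fence slot was
reserved with dma_resv_reserve_fences()):

#include <linux/dma-resv.h>
#include <linux/dma-fence.h>

static int sketch_explicit_sync_submit(struct dma_resv *resv,
                                       struct dma_fence *job_fence)
{
        struct dma_resv_iter cursor;
        struct dma_fence *fence;
        long r;

        /* Wait side: only KERNEL-usage fences (mandatory kernel work such
         * as buffer moves), never other clients' implicit fences. */
        dma_resv_for_each_fence(&cursor, resv, DMA_RESV_USAGE_KERNEL, fence) {
                r = dma_fence_wait(fence, true);
                if (r)
                        return r;
        }

        /* Signal side: a BOOKKEEP fence is invisible to implicit sync, so
         * this submission never becomes an implicit dependency. */
        dma_resv_add_fence(resv, job_fence, DMA_RESV_USAGE_BOOKKEEP);
        return 0;
}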


> Regards,
> Christian.
>
>
> We do have a per-BO list on submission already, so we could add things
> there; it is just very annoying to implement because, at the point where
> we currently do the fence wait/signal, we have lost the association with
> the BO list. Given that I don't see a use case anytime soon (there are
> some theoretical ones, like radeonsi starting to do READ usage instead
> of RW usage with extra tracking), I feel it isn't worth the added
> implementation complexity.
>
>
>>> Worth others more familiar with GL asking that question to themselves
>>> also. I am definitely not totally up on what's possible there.
>>>
>>> Overall, I think I am OK with this approach, even though I think mixing
>>> implicit and explicit sync is gross, and I want the pain that is implicit
>>> sync to just go away forever. :-)
>>>
>>
>> So say we all...
>>
>> ~Faith
>>
>>
>>
>>> - Joshie 
Faith Ekstrand Aug. 19, 2024, 4 p.m. UTC | #7
On Mon, Aug 19, 2024 at 10:00 AM Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
wrote:

>
>
> On Mon, Aug 19, 2024 at 4:51 PM Christian König <
> ckoenig.leichtzumerken@gmail.com> wrote:
>
>> On 07.08.24 at 22:33, Bas Nieuwenhuizen wrote:
>>
>> On Wed, Aug 7, 2024 at 10:25 PM Faith Ekstrand <faith@gfxstrand.net>
>> wrote:
>>
>>> On Wed, Aug 7, 2024 at 2:23 PM Joshua Ashton <joshua@froggi.es> wrote:
>>>
>>>> I was thinking about this more recently. I was initially considering
>>>> "maybe this should be a per-BO import," but I couldn't think of anything in
>>>> the GL model that would actually benefit, given it's not "true" bindless and
>>>> there's no update-after-bind there.
>>>>
>>>
>>> That's also an option and it's the way it works on i915. However, then
>>> you have to pass lists of things to the kernel and that's kinda gross. If
>>> we need it, we can do that. Otherwise, I think a more global thing is
>>> fine.  I think Bas is currently investigating a per-submit approach which
>>> is a tad different from either but should also work okay.
>>>
>>>
>>
>> Yeah, I'm working on a per-submit thing (also using BOOKKEEP fences
>> instead of using the EXPLICIT wait mode to ensure we also don't add
>> implicit fences).
>>
>>
>> Yeah, agreed. Your implementation with the per-submission flag and using
>> BOOKKEEP actually sounds like the right thing to do to me as well.
>>
>> We need to keep in mind that synchronization goes in both ways, e.g.
>> explicit->implicit as well as implicit->explicit.
>>
>> I would rather like to keep the implicit->explicit handling (which this
>> patch here completely disables) and only allow the explicit->implicit
>> handling (which is achieved by using BOOKKEEP fences).
>>
>> This way it is possible that we still over-synchronize, for example when
>> a double-buffered BO is re-used by an explicit client and an implicit
>> display server, but that's probably not something we should optimize in
>> the first place.
>>
>
> This over-synchronization actually happens easily, as in bindless Vulkan
> we have to mark all buffers as "used". We have some hacks to avoid the
> worst of it, but it can be pretty meh.
>

Yeah, this case is actually really important. When I initially did the
dma-buf fence import/export work on Intel, it was a massive speed-up in
DOOM 2016, precisely from removing this bit of over-sync.

~Faith



> In my series on the ML[1] I think I actually got both sides by waiting on
> KERNEL fences only and setting BOOKKEEP fences. (Yeah it actually ends up
> kinda orthogonal on the sync mode but it is what it is ...).
>
> - Bas
>
> [1] https://patchwork.freedesktop.org/series/137014/
>
>
>> Regards,
>> Christian.
>>
>>
>> We do have a per-BO list on submission already, so we could add things
>> there; it is just very annoying to implement because, at the point where
>> we currently do the fence wait/signal, we have lost the association with
>> the BO list. Given that I don't see a use case anytime soon (there are
>> some theoretical ones, like radeonsi starting to do READ usage instead
>> of RW usage with extra tracking), I feel it isn't worth the added
>> implementation complexity.
>>
>>
>>>> Worth others more familiar with GL asking that question to themselves
>>>> also. I am definitely not totally up on what's possible there.
>>>>
>>>> Overall, I think I am OK with this approach, even though I think mixing
>>>> implicit and explicit sync is gross, and I want the pain that is implicit
>>>> sync to just go away forever. :-)
>>>>
>>>
>>> So say we all...
>>>
>>> ~Faith
>>>
>>>
>>>
>>>> - Joshie 

Patch

diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
index ec888fc6ead8..8410b4426541 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
@@ -1196,7 +1196,8 @@  static int amdgpu_cs_sync_rings(struct amdgpu_cs_parser *p)
 		struct dma_resv *resv = bo->tbo.base.resv;
 		enum amdgpu_sync_mode sync_mode;
 
-		sync_mode = amdgpu_bo_explicit_sync(bo) ?
+		sync_mode = (amdgpu_ctx_explicit_sync(p->ctx) ||
+			     amdgpu_bo_explicit_sync(bo)) ?
 			AMDGPU_SYNC_EXPLICIT : AMDGPU_SYNC_NE_OWNER;
 		r = amdgpu_sync_resv(p->adev, &p->sync, resv, sync_mode,
 				     &fpriv->vm);
diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
index 5cb33ac99f70..a304740ccedf 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
@@ -318,7 +318,8 @@  static int amdgpu_ctx_get_stable_pstate(struct amdgpu_ctx *ctx,
 }
 
 static int amdgpu_ctx_init(struct amdgpu_ctx_mgr *mgr, int32_t priority,
-			   struct drm_file *filp, struct amdgpu_ctx *ctx)
+			   uint32_t flags, struct drm_file *filp,
+			   struct amdgpu_ctx *ctx)
 {
 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
 	u32 current_stable_pstate;
@@ -334,6 +335,7 @@  static int amdgpu_ctx_init(struct amdgpu_ctx_mgr *mgr, int32_t priority,
 	ctx->mgr = mgr;
 	spin_lock_init(&ctx->ring_lock);
 
+	ctx->flags = flags;
 	ctx->reset_counter = atomic_read(&mgr->adev->gpu_reset_counter);
 	ctx->reset_counter_query = ctx->reset_counter;
 	ctx->generation = amdgpu_vm_generation(mgr->adev, &fpriv->vm);
@@ -474,6 +476,7 @@  static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
 			    struct amdgpu_fpriv *fpriv,
 			    struct drm_file *filp,
 			    int32_t priority,
+			    uint32_t flags,
 			    uint32_t *id)
 {
 	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
@@ -493,7 +496,7 @@  static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
 	}
 
 	*id = (uint32_t)r;
-	r = amdgpu_ctx_init(mgr, priority, filp, ctx);
+	r = amdgpu_ctx_init(mgr, priority, flags, filp, ctx);
 	if (r) {
 		idr_remove(&mgr->ctx_handles, *id);
 		*id = 0;
@@ -666,7 +669,7 @@  int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
 		     struct drm_file *filp)
 {
 	int r;
-	uint32_t id, stable_pstate;
+	uint32_t id, stable_pstate, flags;
 	int32_t priority;
 
 	union drm_amdgpu_ctx *args = data;
@@ -675,6 +678,7 @@  int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
 
 	id = args->in.ctx_id;
 	priority = args->in.priority;
+	flags = args->in.flags;
 
 	/* For backwards compatibility, we need to accept ioctls with garbage
 	 * in the priority field. Garbage values in the priority field, result
@@ -685,7 +689,7 @@  int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
 
 	switch (args->in.op) {
 	case AMDGPU_CTX_OP_ALLOC_CTX:
-		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
+		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, flags, &id);
 		args->out.alloc.ctx_id = id;
 		break;
 	case AMDGPU_CTX_OP_FREE_CTX:
diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.h b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.h
index 85376baaa92f..9431c8d2ea59 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.h
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.h
@@ -45,6 +45,7 @@  struct amdgpu_ctx_entity {
 struct amdgpu_ctx {
 	struct kref			refcount;
 	struct amdgpu_ctx_mgr		*mgr;
+	uint32_t			flags;
 	unsigned			reset_counter;
 	unsigned			reset_counter_query;
 	uint64_t			generation;
@@ -84,6 +85,12 @@  struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
 bool amdgpu_ctx_priority_is_valid(int32_t ctx_prio);
 void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx, int32_t ctx_prio);
 
+static inline bool
+amdgpu_ctx_explicit_sync(struct amdgpu_ctx *ctx)
+{
+	return ctx->flags & AMDGPU_CTX_ALLOC_FLAGS_EXPLICIT_SYNC;
+}
+
 int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
 		     struct drm_file *filp);
 
diff --git a/include/uapi/drm/amdgpu_drm.h b/include/uapi/drm/amdgpu_drm.h
index 96e32dafd4f0..e9d87a6e3d86 100644
--- a/include/uapi/drm/amdgpu_drm.h
+++ b/include/uapi/drm/amdgpu_drm.h
@@ -125,7 +125,14 @@  extern "C" {
 #define AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS	(1 << 5)
 /* Flag that BO is always valid in this VM */
 #define AMDGPU_GEM_CREATE_VM_ALWAYS_VALID	(1 << 6)
-/* Flag that BO sharing will be explicitly synchronized */
+/* Flag that BO sharing will be explicitly synchronized
+ *
+ * This flag should not be used unless the client can guarantee that no
+ * other driver which ever touches this BO will ever want to use implicit
+ * synchronization as it disables implicit sync on this BO system-wide.
+ * Instead, drivers which use an explicit synchronization model should
+ * prefer AMDGPU_CTX_ALLOC_FLAGS_EXPLICIT_SYNC.
+ */
 #define AMDGPU_GEM_CREATE_EXPLICIT_SYNC		(1 << 7)
 /* Flag that indicates allocating MQD gart on GFX9, where the mtype
  * for the second page onward should be set to NC. It should never
@@ -240,6 +247,9 @@  union drm_amdgpu_bo_list {
 #define AMDGPU_CTX_OP_GET_STABLE_PSTATE	5
 #define AMDGPU_CTX_OP_SET_STABLE_PSTATE	6
 
+/* indicate that all synchronization will be explicit */
+#define AMDGPU_CTX_ALLOC_FLAGS_EXPLICIT_SYNC (1<<0)
+
 /* GPU reset status */
 #define AMDGPU_CTX_NO_RESET		0
 /* this the context caused it */