
[5/5,RFC] xfs: make CIL busy extent lists per-cpu

Message ID 20200512092811.1846252-6-david@fromorbit.com (mailing list archive)
State Deferred, archived
Series xfs: fix a couple of performance issues

Commit Message

Dave Chinner May 12, 2020, 9:28 a.m. UTC
From: Dave Chinner <dchinner@redhat.com>

We use the same percpu list trick with the busy extents as we do
with the CIL lists, and this gets rid of the last use of the
xc_cil_lock in the commit fast path.
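
For context, the core of the trick is sketched below. This is an
illustrative, simplified fragment only (the struct and function names
are made up for the example); the real implementation is the
struct xfs_cil_pcpu and pcp_* helpers added by this patch, and it
relies on the xc_ctx_lock serialisation rules set up earlier in the
series rather than on anything shown here.

/*
 * Sketch of the per-cpu list pattern, assuming the standard kernel
 * percpu API (alloc_percpu, this_cpu_ptr, per_cpu_ptr). Preemption
 * and CPU hotplug handling are elided, as in the RFC itself.
 */
struct example_pcpu {
	struct list_head	items;	/* per-cpu CIL items */
	struct list_head	busy;	/* per-cpu busy extents */
};

static struct example_pcpu __percpu *pcp;

/* commit fast path: touch only this CPU's lists, no shared lock */
static void example_insert(struct list_head *busy_extents)
{
	list_splice_tail_init(busy_extents, &this_cpu_ptr(pcp)->busy);
}

/* push path: gather every CPU's lists onto the checkpoint context */
static void example_gather(struct list_head *ctx_busy)
{
	int cpu;

	for_each_online_cpu(cpu)
		list_splice_tail_init(&per_cpu_ptr(pcp, cpu)->busy,
				      ctx_busy);
}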

As noted in the previous patch, it looked like we were approaching
another bottleneck, and that is borne out here: performance does not
increase substantially even though there is now no lock contention
in the commit path. The transaction rate only increases slightly,
to 1.12M/sec.

Using a 32-way concurrent create/unlink on a 32p/16GB virtual
machine:

	     create time     rate            unlink time
unpatched       1m49s      523k/s+/-14k/s      2m00s
patched         1m48s      535k/s+/-24k/s      1m51s

So variance went back up, and performance improved slightly.
Profiling at this point indicates spinlock contention at the VFS
level (inode_sb_list_add() and dentry cache pathwalking), so
significant further gains will require VFS surgery.

Signed-off-by: Dave Chinner <dchinner@redhat.com>
---
 fs/xfs/xfs_log_cil.c  | 35 ++++++++++++++++++-----------------
 fs/xfs/xfs_log_priv.h | 12 +++++++++++-
 2 files changed, 29 insertions(+), 18 deletions(-)

Patch

diff --git a/fs/xfs/xfs_log_cil.c b/fs/xfs/xfs_log_cil.c
index af444bc69a7cd..d3a5f8478d64a 100644
--- a/fs/xfs/xfs_log_cil.c
+++ b/fs/xfs/xfs_log_cil.c
@@ -461,13 +461,9 @@  xlog_cil_insert_items(
 	percpu_counter_add_batch(&cil->xc_curr_res, split_res, 1000 * 1000);
 	percpu_counter_add_batch(&cil->xc_space_used, len, 1000 * 1000);
 
-	spin_lock(&cil->xc_cil_lock);
-
 	/* attach the transaction to the CIL if it has any busy extents */
 	if (!list_empty(&tp->t_busy))
-		list_splice_init(&tp->t_busy, &ctx->busy_extents);
-
-	spin_unlock(&cil->xc_cil_lock);
+		list_splice_tail_init(&tp->t_busy, pcp_busy(cil));
 
 	/*
 	 * Now (re-)position everything modified at the tail of the CIL.
@@ -486,7 +482,7 @@  xlog_cil_insert_items(
 		 */
 		if (!list_empty(&lip->li_cil))
 			continue;
-		list_add_tail(&lip->li_cil, this_cpu_ptr(cil->xc_cil));
+		list_add_tail(&lip->li_cil, pcp_cil(cil));
 	}
 
 	if (tp->t_ticket->t_curr_res < 0)
@@ -733,10 +729,14 @@  xlog_cil_push_work(
 	 * Remove the items from the per-cpu CIL lists and then pull all the
 	 * log vectors off the items. We hold the xc_ctx_lock exclusively here,
 	 * so nothing can be adding or removing from the per-cpu lists here.
+	 *
+	 * Also splice the busy extents onto the context while we are walking
+	 * the percpu structure.
 	 */
 	/* XXX: hotplug! */
 	for_each_online_cpu(cpu) {
-		list_splice_tail_init(per_cpu_ptr(cil->xc_cil, cpu), &cil_items);
+		list_splice_tail_init(pcp_cil_cpu(cil, cpu), &cil_items);
+		list_splice_tail_init(pcp_busy_cpu(cil, cpu), &ctx->busy_extents);
 	}
 
 	lv = NULL;
@@ -933,7 +933,7 @@  xlog_cil_push_background(
 	 * The cil won't be empty because we are called while holding the
 	 * context lock so whatever we added to the CIL will still be there
 	 */
-	ASSERT(space_used != 0);
+	ASSERT(percpu_counter_read(&cil->xc_curr_res) != 0);
 
 	/*
 	 * don't do a background push if we haven't used up all the
@@ -1241,17 +1241,18 @@  xlog_cil_init(
 		goto out_free_cil;
 
 	/* XXX: CPU hotplug!!! */
-	cil->xc_cil = alloc_percpu_gfp(struct list_head, GFP_KERNEL);
-	if (!cil->xc_cil)
+	cil->xc_pcp = alloc_percpu_gfp(struct xfs_cil_pcpu, GFP_KERNEL);
+	if (!cil->xc_pcp)
 		goto out_free_ctx;
 
 	for_each_possible_cpu(cpu) {
-		INIT_LIST_HEAD(per_cpu_ptr(cil->xc_cil, cpu));
+		INIT_LIST_HEAD(pcp_cil_cpu(cil, cpu));
+		INIT_LIST_HEAD(pcp_busy_cpu(cil, cpu));
 	}
 
 	error = percpu_counter_init(&cil->xc_space_used, 0, GFP_KERNEL);
 	if (error)
-		goto out_free_pcp_cil;
+		goto out_free_pcp;
 
 	error = percpu_counter_init(&cil->xc_curr_res, 0, GFP_KERNEL);
 	if (error)
@@ -1259,7 +1260,6 @@  xlog_cil_init(
 
 	INIT_WORK(&cil->xc_push_work, xlog_cil_push_work);
 	INIT_LIST_HEAD(&cil->xc_committing);
-	spin_lock_init(&cil->xc_cil_lock);
 	spin_lock_init(&cil->xc_push_lock);
 	init_rwsem(&cil->xc_ctx_lock);
 	init_waitqueue_head(&cil->xc_commit_wait);
@@ -1278,8 +1278,8 @@  xlog_cil_init(
 
 out_free_space:
 	percpu_counter_destroy(&cil->xc_space_used);
-out_free_pcp_cil:
-	free_percpu(cil->xc_cil);
+out_free_pcp:
+	free_percpu(cil->xc_pcp);
 out_free_ctx:
 	kmem_free(ctx);
 out_free_cil:
@@ -1303,9 +1303,10 @@  xlog_cil_destroy(
 	percpu_counter_destroy(&cil->xc_curr_res);
 
 	for_each_possible_cpu(cpu) {
-		ASSERT(list_empty(per_cpu_ptr(cil->xc_cil, cpu)));
+		ASSERT(list_empty(pcp_cil_cpu(cil, cpu)));
+		ASSERT(list_empty(pcp_busy_cpu(cil, cpu)));
 	}
-	free_percpu(cil->xc_cil);
+	free_percpu(cil->xc_pcp);
 	kmem_free(cil);
 }
 
diff --git a/fs/xfs/xfs_log_priv.h b/fs/xfs/xfs_log_priv.h
index 0bb982920d070..cfc22c9482ea4 100644
--- a/fs/xfs/xfs_log_priv.h
+++ b/fs/xfs/xfs_log_priv.h
@@ -260,11 +260,16 @@  struct xfs_cil_ctx {
  * the commit LSN to be determined as well. This should make synchronous
  * operations almost as efficient as the old logging methods.
  */
+struct xfs_cil_pcpu {
+	struct list_head	p_cil;
+	struct list_head	p_busy_extents;
+};
+
 struct xfs_cil {
 	struct xlog		*xc_log;
 	struct percpu_counter	xc_space_used;
 	struct percpu_counter	xc_curr_res;
-	struct list_head __percpu *xc_cil;
+	struct xfs_cil_pcpu __percpu *xc_pcp;
 	spinlock_t		xc_cil_lock;
 
 	struct rw_semaphore	xc_ctx_lock ____cacheline_aligned_in_smp;
@@ -278,6 +283,11 @@  struct xfs_cil {
 	struct work_struct	xc_push_work;
 } ____cacheline_aligned_in_smp;
 
+#define pcp_cil(cil)		&(this_cpu_ptr(cil->xc_pcp)->p_cil)
+#define pcp_cil_cpu(cil, cpu)	&(per_cpu_ptr(cil->xc_pcp, cpu)->p_cil)
+#define pcp_busy(cil)		&(this_cpu_ptr(cil->xc_pcp)->p_busy_extents)
+#define pcp_busy_cpu(cil, cpu)	&(per_cpu_ptr(cil->xc_pcp, cpu)->p_busy_extents)
+
 /*
  * The amount of log space we allow the CIL to aggregate is difficult to size.
  * Whatever we choose, we have to make sure we can get a reservation for the