[07/40] lustre: ldlm: send the cancel RPC asap

Message ID 1681042400-15491-8-git-send-email-jsimmons@infradead.org (mailing list archive)
State New, archived
Series lustre: backport OpenSFS changes from March XX, 2023

Commit Message

James Simmons April 9, 2023, 12:12 p.m. UTC
From: Yang Sheng <ys@whamcloud.com>

This patch sends the cancel RPC as soon as possible when a
bl_ast is received from the server. The existing problem is
that the lock could already have been added to the regular
cancel queue for some other reason before the bl_ast arrived,
which prevents the lock from being canceled in a timely
manner. The other problem is that we collect many locks in
one RPC to save network traffic, and this batching can take
a long time while dirty pages are being flushed.

- Process the lock cancel even if the lock was already added
  to the bl queue when the bl_ast arrived, unless the cancel
  RPC has already been sent.
- Send the cancel RPC immediately for a bl_ast lock; don't
  try to pack more locks into it in that case (see the sketch
  below).
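For illustration only, and not part of the patch: a minimal
userspace sketch of the new decision logic, using hypothetical
stand-in types rather than the real ldlm structures. It shows
the two behaviors above: a bl_ast lock is sent in its own
cancel RPC right away, and the ast_sent flag keeps a second
cancel attempt from packing the same lock twice.

#include <stdbool.h>
#include <stdio.h>

/* Hypothetical stand-in for the real struct ldlm_lock. */
struct lock {
	bool bl_ast;   /* server sent a blocking AST for this lock */
	bool ast_sent; /* lock already packed into a cancel RPC */
};

/* Mirrors the new ldlm_cli_cancel() decision (simplified). */
static void cancel_lock(struct lock *lk)
{
	if (lk->bl_ast) {
		if (lk->ast_sent)
			return; /* cancel RPC already on the wire */
		lk->ast_sent = true;
		printf("send one-lock cancel RPC immediately\n");
		return;
	}
	printf("batch with other LRU locks in one cancel RPC\n");
}

int main(void)
{
	struct lock lk = { .bl_ast = true };

	cancel_lock(&lk); /* sends the RPC right away */
	cancel_lock(&lk); /* no-op: ast_sent is already set */
	return 0;
}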

WC-bug-id: https://jira.whamcloud.com/browse/LU-16285
Lustre-commit: b65374d96b2027213 ("LU-16285 ldlm: send the cancel RPC asap")
Signed-off-by: Yang Sheng <ys@whamcloud.com>
Reviewed-on: https://review.whamcloud.com/c/fs/lustre-release/+/49527
Reviewed-by: Andreas Dilger <adilger@whamcloud.com>
Reviewed-by: Qian Yingjin <qian@ddn.com>
Reviewed-by: Oleg Drokin <green@whamcloud.com>
Signed-off-by: James Simmons <jsimmons@infradead.org>
---
 fs/lustre/include/lustre_dlm.h |   1 +
 fs/lustre/ldlm/ldlm_lockd.c    |   9 ++--
 fs/lustre/ldlm/ldlm_request.c  | 100 ++++++++++++++++++++++++++++-------------
 3 files changed, 75 insertions(+), 35 deletions(-)

Patch

diff --git a/fs/lustre/include/lustre_dlm.h b/fs/lustre/include/lustre_dlm.h
index d08c48f..3a4f152 100644
--- a/fs/lustre/include/lustre_dlm.h
+++ b/fs/lustre/include/lustre_dlm.h
@@ -593,6 +593,7 @@  enum ldlm_cancel_flags {
 	LCF_BL_AST     = 0x4, /* Cancel locks marked as LDLM_FL_BL_AST
 			       * in the same RPC
 			       */
+	LCF_ONE_LOCK	= 0x8,	/* Pack only one lock in the cancel RPC. */
 };
 
 struct ldlm_flock {
diff --git a/fs/lustre/ldlm/ldlm_lockd.c b/fs/lustre/ldlm/ldlm_lockd.c
index 0ff4e3a..3a085db 100644
--- a/fs/lustre/ldlm/ldlm_lockd.c
+++ b/fs/lustre/ldlm/ldlm_lockd.c
@@ -700,8 +700,7 @@  static int ldlm_callback_handler(struct ptlrpc_request *req)
 		 * we can tell the server we have no lock. Otherwise, we
 		 * should send cancel after dropping the cache.
 		 */
-		if ((ldlm_is_canceling(lock) && ldlm_is_bl_done(lock)) ||
-		    ldlm_is_failed(lock)) {
+		if (ldlm_is_ast_sent(lock) || ldlm_is_failed(lock)) {
 			LDLM_DEBUG(lock,
 				   "callback on lock %#llx - lock disappeared",
 				   dlm_req->lock_handle[0].cookie);
@@ -736,7 +735,7 @@  static int ldlm_callback_handler(struct ptlrpc_request *req)
 
 	switch (lustre_msg_get_opc(req->rq_reqmsg)) {
 	case LDLM_BL_CALLBACK:
-		CDEBUG(D_INODE, "blocking ast\n");
+		LDLM_DEBUG(lock, "blocking ast\n");
 		req_capsule_extend(&req->rq_pill, &RQF_LDLM_BL_CALLBACK);
 		if (!ldlm_is_cancel_on_block(lock)) {
 			rc = ldlm_callback_reply(req, 0);
@@ -748,14 +747,14 @@  static int ldlm_callback_handler(struct ptlrpc_request *req)
 			ldlm_handle_bl_callback(ns, &dlm_req->lock_desc, lock);
 		break;
 	case LDLM_CP_CALLBACK:
-		CDEBUG(D_INODE, "completion ast\n");
+		LDLM_DEBUG(lock, "completion ast\n");
 		req_capsule_extend(&req->rq_pill, &RQF_LDLM_CP_CALLBACK);
 		rc = ldlm_handle_cp_callback(req, ns, dlm_req, lock);
 		if (!OBD_FAIL_CHECK(OBD_FAIL_LDLM_CANCEL_BL_CB_RACE))
 			ldlm_callback_reply(req, rc);
 		break;
 	case LDLM_GL_CALLBACK:
-		CDEBUG(D_INODE, "glimpse ast\n");
+		LDLM_DEBUG(lock, "glimpse ast\n");
 		req_capsule_extend(&req->rq_pill, &RQF_LDLM_GL_CALLBACK);
 		ldlm_handle_gl_callback(req, ns, dlm_req, lock);
 		break;
diff --git a/fs/lustre/ldlm/ldlm_request.c b/fs/lustre/ldlm/ldlm_request.c
index 8b244d7..ef3ad28 100644
--- a/fs/lustre/ldlm/ldlm_request.c
+++ b/fs/lustre/ldlm/ldlm_request.c
@@ -994,14 +994,34 @@  static u64 ldlm_cli_cancel_local(struct ldlm_lock *lock)
 	return rc;
 }
 
+static inline int __ldlm_pack_lock(struct ldlm_lock *lock,
+				   struct ldlm_request *dlm)
+{
+	LASSERT(lock->l_conn_export);
+	lock_res_and_lock(lock);
+	if (ldlm_is_ast_sent(lock)) {
+		unlock_res_and_lock(lock);
+		return 0;
+	}
+	ldlm_set_ast_sent(lock);
+	unlock_res_and_lock(lock);
+
+	/* Pack the lock handle to the given request buffer. */
+	LDLM_DEBUG(lock, "packing");
+	dlm->lock_handle[dlm->lock_count++] = lock->l_remote_handle;
+
+	return 1;
+}
+#define ldlm_cancel_pack(req, head, count) \
+		_ldlm_cancel_pack(req, NULL, head, count)
+
 /**
  * Pack @count locks in @head into ldlm_request buffer of request @req.
  */
-static void ldlm_cancel_pack(struct ptlrpc_request *req,
+static int _ldlm_cancel_pack(struct ptlrpc_request *req, struct ldlm_lock *lock,
 			     struct list_head *head, int count)
 {
 	struct ldlm_request *dlm;
-	struct ldlm_lock *lock;
 	int max, packed = 0;
 
 	dlm = req_capsule_client_get(&req->rq_pill, &RMF_DLM_REQ);
@@ -1019,24 +1039,23 @@  static void ldlm_cancel_pack(struct ptlrpc_request *req,
 	 * so that the server cancel would call filter_lvbo_update() less
 	 * frequently.
 	 */
-	list_for_each_entry(lock, head, l_bl_ast) {
-		if (!count--)
-			break;
-		LASSERT(lock->l_conn_export);
-		/* Pack the lock handle to the given request buffer. */
-		LDLM_DEBUG(lock, "packing");
-		dlm->lock_handle[dlm->lock_count++] = lock->l_remote_handle;
-		packed++;
+	if (lock) { /* only pack one lock */
+		packed = __ldlm_pack_lock(lock, dlm);
+	} else {
+		list_for_each_entry(lock, head, l_bl_ast) {
+			if (!count--)
+				break;
+			packed += __ldlm_pack_lock(lock, dlm);
+		}
 	}
-	CDEBUG(D_DLMTRACE, "%d locks packed\n", packed);
+	return packed;
 }
 
 /**
  * Prepare and send a batched cancel RPC. It will include @count lock
  * handles of locks given in @cancels list.
  */
-static int ldlm_cli_cancel_req(struct obd_export *exp,
-			       struct list_head *cancels,
+static int ldlm_cli_cancel_req(struct obd_export *exp, void *ptr,
 			       int count, enum ldlm_cancel_flags flags)
 {
 	struct ptlrpc_request *req = NULL;
@@ -1085,7 +1104,15 @@  static int ldlm_cli_cancel_req(struct obd_export *exp,
 		req->rq_reply_portal = LDLM_CANCEL_REPLY_PORTAL;
 		ptlrpc_at_set_req_timeout(req);
 
-		ldlm_cancel_pack(req, cancels, count);
+		if (flags & LCF_ONE_LOCK)
+			rc = _ldlm_cancel_pack(req, ptr, NULL, count);
+		else
+			rc = _ldlm_cancel_pack(req, NULL, ptr, count);
+		if (rc == 0) {
+			ptlrpc_req_finished(req);
+			sent = count;
+			goto out;
+		}
 
 		ptlrpc_request_set_replen(req);
 		if (flags & LCF_ASYNC) {
@@ -1235,10 +1262,10 @@  int ldlm_cli_convert(struct ldlm_lock *lock,
  * Lock must not have any readers or writers by this time.
  */
 int ldlm_cli_cancel(const struct lustre_handle *lockh,
-		    enum ldlm_cancel_flags cancel_flags)
+		    enum ldlm_cancel_flags flags)
 {
 	struct obd_export *exp;
-	int avail, count = 1;
+	int avail, count = 1, bl_ast = 0;
 	u64 rc = 0;
 	struct ldlm_namespace *ns;
 	struct ldlm_lock *lock;
@@ -1253,11 +1280,17 @@  int ldlm_cli_cancel(const struct lustre_handle *lockh,
 	lock_res_and_lock(lock);
 	LASSERT(!ldlm_is_converting(lock));
 
-	/* Lock is being canceled and the caller doesn't want to wait */
-	if (ldlm_is_canceling(lock)) {
+	if (ldlm_is_bl_ast(lock)) {
+		if (ldlm_is_ast_sent(lock)) {
+			unlock_res_and_lock(lock);
+			LDLM_LOCK_RELEASE(lock);
+			return 0;
+		}
+		bl_ast = 1;
+	} else if (ldlm_is_canceling(lock)) {
+		/* Lock is being canceled and the caller doesn't want to wait */
 		unlock_res_and_lock(lock);
-
-		if (!(cancel_flags & LCF_ASYNC))
+		if (!(flags & LCF_ASYNC))
 			wait_event_idle(lock->l_waitq, is_bl_done(lock));
 
 		LDLM_LOCK_RELEASE(lock);
@@ -1267,24 +1300,30 @@  int ldlm_cli_cancel(const struct lustre_handle *lockh,
 	ldlm_set_canceling(lock);
 	unlock_res_and_lock(lock);
 
-	if (cancel_flags & LCF_LOCAL)
+	if (flags & LCF_LOCAL)
 		OBD_FAIL_TIMEOUT(OBD_FAIL_LDLM_LOCAL_CANCEL_PAUSE,
 				 cfs_fail_val);
 
 	rc = ldlm_cli_cancel_local(lock);
-	if (rc == LDLM_FL_LOCAL_ONLY || cancel_flags & LCF_LOCAL) {
+	if (rc == LDLM_FL_LOCAL_ONLY || flags & LCF_LOCAL) {
 		LDLM_LOCK_RELEASE(lock);
 		return 0;
 	}
-	/*
-	 * Even if the lock is marked as LDLM_FL_BL_AST, this is a LDLM_CANCEL
-	 * RPC which goes to canceld portal, so we can cancel other LRU locks
-	 * here and send them all as one LDLM_CANCEL RPC.
-	 */
-	LASSERT(list_empty(&lock->l_bl_ast));
-	list_add(&lock->l_bl_ast, &cancels);
 
 	exp = lock->l_conn_export;
+	if (bl_ast) { /* Send RPC immediately for LDLM_FL_BL_AST */
+		ldlm_cli_cancel_req(exp, lock, count, flags | LCF_ONE_LOCK);
+		LDLM_LOCK_RELEASE(lock);
+		return 0;
+	}
+
+	LASSERT(list_empty(&lock->l_bl_ast));
+	list_add(&lock->l_bl_ast, &cancels);
+	/*
+	 * This is a LDLM_CANCEL RPC which goes to canceld portal,
+	 * so we can cancel other LRU locks here and send them all
+	 * as one LDLM_CANCEL RPC.
+	 */
 	if (exp_connect_cancelset(exp)) {
 		avail = ldlm_format_handles_avail(class_exp2cliimp(exp),
 						  &RQF_LDLM_CANCEL,
@@ -1295,7 +1334,8 @@  int ldlm_cli_cancel(const struct lustre_handle *lockh,
 		count += ldlm_cancel_lru_local(ns, &cancels, 0, avail - 1,
 					       LCF_BL_AST, 0);
 	}
-	ldlm_cli_cancel_list(&cancels, count, NULL, cancel_flags);
+	ldlm_cli_cancel_list(&cancels, count, NULL, flags);
+
 	return 0;
 }
 EXPORT_SYMBOL(ldlm_cli_cancel);