[RFC,10/21] unpack-trees: add basic support for parallel checkout

Message ID	1b39a4099a69f2c42211d46d615055c783703fea.1597093021.git.matheus.bernardino@usp.br (mailing list archive)
State	New, archived
Headers	show Return-Path: <SRS0=S9iH=BU=vger.kernel.org=git-owner@kernel.org> From: Matheus Tavares <matheus.bernardino@usp.br> To: git@vger.kernel.org Cc: stolee@gmail.com, jeffhost@microsoft.com, =?utf-8?b?Tmd1eeG7hW4gVGjDoWkg?= =?utf-8?b?Tmfhu41jIER1eQ==?= <pclouds@gmail.com>, Jonathan Tan <jonathantanmy@google.com>, =?utf-8?q?Ren=C3=A9_Scharfe?= <l.s.r@web.de>, Christian Couder <chriscool@tuxfamily.org>, Stefan Beller <stefanbeller@gmail.com>, Junio C Hamano <gitster@pobox.com>, Lars Schneider <larsxschneider@gmail.com> Subject: [RFC PATCH 10/21] unpack-trees: add basic support for parallel checkout Date: Mon, 10 Aug 2020 18:33:18 -0300 Message-Id: <1b39a4099a69f2c42211d46d615055c783703fea.1597093021.git.matheus.bernardino@usp.br> In-Reply-To: <cover.1597093021.git.matheus.bernardino@usp.br> References: <cover.1597093021.git.matheus.bernardino@usp.br> MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Sender: git-owner@vger.kernel.org Precedence: bulk
Series	Parallel checkout \| expand [RFC,00/21,RFC] Parallel checkout [RFC,01/21] convert: make convert_attrs() and convert structs public [RFC,02/21] convert: add [async_]convert_to_working_tree_ca() variants [RFC,03/21] convert: add get_stream_filter_ca() variant [RFC,04/21] convert: add conv_attrs classification [RFC,05/21] entry: extract a header file for entry.c functions [RFC,06/21] entry: make fstat_output() and read_blob_entry() public [RFC,07/21] entry: extract cache_entry update from write_entry() [RFC,08/21] entry: move conv_attrs lookup up to checkout_entry() [RFC,09/21] entry: add checkout_entry_ca() which takes preloaded conv_attrs [RFC,10/21] unpack-trees: add basic support for parallel checkout [RFC,11/21] parallel-checkout: make it truly parallel [RFC,12/21] parallel-checkout: add configuration options [RFC,13/21] parallel-checkout: support progress displaying [RFC,14/21] make_transient_cache_entry(): optionally alloc from mem_pool [RFC,15/21] builtin/checkout.c: complete parallel checkout support [RFC,16/21] checkout-index: add parallel checkout support [RFC,17/21] parallel-checkout: avoid stat() calls in workers [RFC,18/21] entry: use is_dir_sep() when checking leading dirs [RFC,19/21] symlinks: make has_dirs_only_path() track FL_NOENT [RFC,20/21] parallel-checkout: create leading dirs in workers [RFC,21/21] parallel-checkout: skip checking the working tree on clone

diff --git a/Makefile b/Makefile
index 65f8cfb236..caab8e6401 100644
--- a/Makefile
+++ b/Makefile
@@ -933,6 +933,7 @@ LIB_OBJS += pack-revindex.o
 LIB_OBJS += pack-write.o
 LIB_OBJS += packfile.o
 LIB_OBJS += pager.o
+LIB_OBJS += parallel-checkout.o
 LIB_OBJS += parse-options-cb.o
 LIB_OBJS += parse-options.o
 LIB_OBJS += patch-delta.o
diff --git a/entry.c b/entry.c
index f9835afba3..47c2c20d5a 100644
--- a/entry.c
+++ b/entry.c
@@ -7,6 +7,7 @@
 #include "progress.h"
 #include "fsmonitor.h"
 #include "entry.h"
+#include "parallel-checkout.h"
 
 static void create_directories(const char *path, int path_len,
 			       const struct checkout *state)
@@ -538,6 +539,9 @@ int checkout_entry_ca(struct cache_entry *ce, struct conv_attrs *ca,
 		ca = &ca_buf;
 	}
 
+	if (!enqueue_checkout(ce, ca))
+		return 0;
+
 	return write_entry(ce, path.buf, ca, state, 0);
 }
 
diff --git a/parallel-checkout.c b/parallel-checkout.c
new file mode 100644
index 0000000000..e3b44eeb34
--- /dev/null
+++ b/parallel-checkout.c
@@ -0,0 +1,340 @@
+#include "cache.h"
+#include "entry.h"
+#include "parallel-checkout.h"
+#include "streaming.h"
+
+enum ci_status {
+	CI_PENDING = 0,
+	CI_SUCCESS,
+	CI_RETRY,
+	CI_FAILED,
+};
+
+struct checkout_item {
+	/* pointer to an istate->cache[] entry. Not owned by us. */
+	struct cache_entry *ce;
+	struct conv_attrs ca;
+	struct stat st;
+	enum ci_status status;
+};
+
+struct parallel_checkout {
+	struct checkout_item *items;
+	size_t nr, alloc;
+};
+
+static struct parallel_checkout *parallel_checkout = NULL;
+
+enum pc_status {
+	PC_UNINITIALIZED = 0,
+	PC_ACCEPTING_ENTRIES,
+	PC_RUNNING,
+	PC_HANDLING_RESULTS,
+};
+
+static enum pc_status pc_status = PC_UNINITIALIZED;
+
+void init_parallel_checkout(void)
+{
+	if (parallel_checkout)
+		BUG("parallel checkout already initialized");
+
+	parallel_checkout = xcalloc(1, sizeof(*parallel_checkout));
+	pc_status = PC_ACCEPTING_ENTRIES;
+}
+
+static void finish_parallel_checkout(void)
+{
+	if (!parallel_checkout)
+		BUG("cannot finish parallel checkout: not initialized yet");
+
+	free(parallel_checkout->items);
+	FREE_AND_NULL(parallel_checkout);
+	pc_status = PC_UNINITIALIZED;
+}
+
+static int is_eligible_for_parallel_checkout(const struct cache_entry *ce,
+					     const struct conv_attrs *ca)
+{
+	enum conv_attrs_classification c;
+
+	if (!S_ISREG(ce->ce_mode))
+		return 0;
+
+	c = classify_conv_attrs(ca);
+	switch (c) {
+	case CA_CLASS_INCORE:
+		return 1;
+
+	case CA_CLASS_INCORE_FILTER:
+		/*
+		 * It would be safe to allow concurrent instances of
+		 * single-file smudge filters, like rot13, but we should not
+		 * assume that all filters are parallel-process safe. So we
+		 * don't allow this.
+		 */
+		return 0;
+
+	case CA_CLASS_INCORE_PROCESS:
+		/*
+		 * The parallel queue and the delayed queue are not compatible,
+		 * so they must be kept completely separated. And we can't tell
+		 * if a long-running process will delay its response without
+		 * actually asking it to perform the filtering. Therefore, this
+		 * type of filter is not allowed in parallel checkout.
+		 *
+		 * Furthermore, there should only be one instance of the
+		 * long-running process filter as we don't know how it is
+		 * managing its own concurrency. So, spreading the entries that
+		 * require such a filter among the parallel workers would
+		 * require a lot more inter-process communication. We would
+		 * probably have to designate a single process to interact with
+		 * the filter and send all the necessary data to it, for each
+		 * entry.
+		 */
+		return 0;
+
+	case CA_CLASS_STREAMABLE:
+		return 1;
+
+	default:
+		BUG("unsupported conv_attrs classification '%d'", c);
+	}
+}
+
+int enqueue_checkout(struct cache_entry *ce, struct conv_attrs *ca)
+{
+	struct checkout_item *ci;
+
+	if (!parallel_checkout || pc_status != PC_ACCEPTING_ENTRIES ||
+	    !is_eligible_for_parallel_checkout(ce, ca))
+		return -1;
+
+	ALLOC_GROW(parallel_checkout->items, parallel_checkout->nr + 1,
+		   parallel_checkout->alloc);
+
+	ci = &parallel_checkout->items[parallel_checkout->nr++];
+	ci->ce = ce;
+	memcpy(&ci->ca, ca, sizeof(ci->ca));
+
+	return 0;
+}
+
+static int handle_results(struct checkout *state)
+{
+	int ret = 0;
+	size_t i;
+
+	pc_status = PC_HANDLING_RESULTS;
+
+	for (i = 0; i < parallel_checkout->nr; ++i) {
+		struct checkout_item *ci = &parallel_checkout->items[i];
+		struct stat *st = &ci->st;
+
+		switch(ci->status) {
+		case CI_SUCCESS:
+			update_ce_after_write(state, ci->ce, st);
+			break;
+		case CI_RETRY:
+			/*
+			 * The failures for which we set CI_RETRY are the ones
+			 * that might have been caused by a path collision. So
+			 * we let checkout_entry_ca() retry writing, as it will
+			 * properly handle collisions and the creation of
+			 * leading dirs in the entry's path.
+			 */
+			ret |= checkout_entry_ca(ci->ce, &ci->ca, state, NULL, NULL);
+			break;
+		case CI_FAILED:
+			ret = -1;
+			break;
+		case CI_PENDING:
+			BUG("parallel checkout finished with pending entries");
+		default:
+			BUG("unknown checkout item status in parallel checkout");
+		}
+	}
+
+	return ret;
+}
+
+static int reset_fd(int fd, const char *path)
+{
+	if (lseek(fd, 0, SEEK_SET) != 0)
+		return error_errno("failed to rewind descriptor of %s", path);
+	if (ftruncate(fd, 0))
+		return error_errno("failed to truncate file %s", path);
+	return 0;
+}
+
+static int write_checkout_item_to_fd(int fd, struct checkout *state,
+				     struct checkout_item *ci, const char *path)
+{
+	int ret;
+	struct stream_filter *filter;
+	struct strbuf buf = STRBUF_INIT;
+	char *new_blob;
+	unsigned long size;
+	size_t newsize = 0;
+	ssize_t wrote;
+
+	/* Sanity check */
+	assert(is_eligible_for_parallel_checkout(ci->ce, &ci->ca));
+
+	filter = get_stream_filter_ca(&ci->ca, &ci->ce->oid);
+	if (filter) {
+		if (stream_blob_to_fd(fd, &ci->ce->oid, filter, 1)) {
+			/* On error, reset fd to try writing without streaming */
+			if (reset_fd(fd, path))
+				return -1;
+		} else {
+			return 0;
+		}
+	}
+
+	new_blob = read_blob_entry(ci->ce, &size);
+	if (!new_blob)
+		return error("unable to read sha1 file of %s (%s)", path,
+			     oid_to_hex(&ci->ce->oid));
+
+	/*
+	 * Checkout metadata is used to give context for external process
+	 * filters. Files requiring such filters are not eligible for parallel
+	 * checkout, so pass NULL.
+	 */
+	ret = convert_to_working_tree_ca(&ci->ca, ci->ce->name, new_blob, size,
+					 &buf, NULL);
+
+	if (ret) {
+		free(new_blob);
+		new_blob = strbuf_detach(&buf, &newsize);
+		size = newsize;
+	}
+
+	wrote = write_in_full(fd, new_blob, size);
+	free(new_blob);
+	if (wrote < 0)
+		return error("unable to write file %s", path);
+
+	return 0;
+}
+
+static int close_and_clear(int *fd)
+{
+	int ret = 0;
+
+	if (*fd >= 0) {
+		ret = close(*fd);
+		*fd = -1;
+	}
+
+	return ret;
+}
+
+static int check_leading_dirs(const char *path, int len, int prefix_len)
+{
+	const char *slash = path + len;
+
+	while (slash > path && *slash != '/')
+		slash--;
+
+	return has_dirs_only_path(path, slash - path, prefix_len);
+}
+
+static void write_checkout_item(struct checkout *state, struct checkout_item *ci)
+{
+	unsigned int mode = (ci->ce->ce_mode & 0100) ? 0777 : 0666;
+	int fd = -1, fstat_done = 0;
+	struct strbuf path = STRBUF_INIT;
+
+	strbuf_add(&path, state->base_dir, state->base_dir_len);
+	strbuf_add(&path, ci->ce->name, ce_namelen(ci->ce));
+
+	/*
+	 * At this point, leading dirs should have already been created. But if
+	 * a symlink being checked out has collided with one of the dirs, due to
+	 * file system folding rules, it's possible that the dirs are no longer
+	 * present. So we have to check again, and report any path collisions.
+	 */
+	if (!check_leading_dirs(path.buf, path.len, state->base_dir_len)) {
+		ci->status = CI_RETRY;
+		goto out;
+	}
+
+	fd = open(path.buf, O_WRONLY | O_CREAT | O_EXCL, mode);
+
+	if (fd < 0) {
+		if (errno == EEXIST || errno == EISDIR) {
+			/*
+			 * Errors which probably represent a path collision.
+			 * Suppress the error message and mark the ci to be
+			 * retried later, sequentially. ENOTDIR and ENOENT are
+			 * also interesting, but check_leading_dirs() should
+			 * have already caught these cases.
+			 */
+			ci->status = CI_RETRY;
+		} else {
+			error_errno("failed to open file %s", path.buf);
+			ci->status = CI_FAILED;
+		}
+		goto out;
+	}
+
+	if (write_checkout_item_to_fd(fd, state, ci, path.buf)) {
+		/* Error was already reported. */
+		ci->status = CI_FAILED;
+		goto out;
+	}
+
+	fstat_done = fstat_checkout_output(fd, state, &ci->st);
+
+	if (close_and_clear(&fd)) {
+		error_errno("unable to close file %s", path.buf);
+		ci->status = CI_FAILED;
+		goto out;
+	}
+
+	if (state->refresh_cache && !fstat_done && lstat(path.buf, &ci->st) < 0) {
+		error_errno("unable to stat just-written file %s", path.buf);
+		ci->status = CI_FAILED;
+		goto out;
+	}
+
+	ci->status = CI_SUCCESS;
+
+out:
+	/*
+	 * No need to check close() return. At this point, either fd is already
+	 * closed, or we are on an error path that has already been reported.
+	 */
+	close_and_clear(&fd);
+	strbuf_release(&path);
+}
+
+static int run_checkout_sequentially(struct checkout *state)
+{
+	size_t i;
+
+	for (i = 0; i < parallel_checkout->nr; ++i) {
+		struct checkout_item *ci = &parallel_checkout->items[i];
+		write_checkout_item(state, ci);
+	}
+
+	return handle_results(state);
+}
+
+
+int run_parallel_checkout(struct checkout *state)
+{
+	int ret;
+
+	if (!parallel_checkout)
+		BUG("cannot run parallel checkout: not initialized yet");
+
+	pc_status = PC_RUNNING;
+
+	ret = run_checkout_sequentially(state);
+
+	finish_parallel_checkout();
+	return ret;
+}
diff --git a/parallel-checkout.h b/parallel-checkout.h
new file mode 100644
index 0000000000..8eef59ffcd
--- /dev/null
+++ b/parallel-checkout.h
@@ -0,0 +1,20 @@
+#ifndef PARALLEL_CHECKOUT_H
+#define PARALLEL_CHECKOUT_H
+
+struct cache_entry;
+struct checkout;
+struct conv_attrs;
+
+void init_parallel_checkout(void);
+
+/*
+ * Return -1 if parallel checkout is currently not enabled or if the entry is
+ * not eligible for parallel checkout. Otherwise, enqueue the entry for later
+ * write and return 0.
+ */
+int enqueue_checkout(struct cache_entry *ce, struct conv_attrs *ca);
+
+/* Write all the queued entries, returning 0 on success. */
+int run_parallel_checkout(struct checkout *state);
+
+#endif /* PARALLEL_CHECKOUT_H */
diff --git a/unpack-trees.c b/unpack-trees.c
index a511fadd89..1b1da7485a 100644
--- a/unpack-trees.c
+++ b/unpack-trees.c
@@ -17,6 +17,7 @@
 #include "object-store.h"
 #include "promisor-remote.h"
 #include "entry.h"
+#include "parallel-checkout.h"
 
 /*
  * Error messages expected by scripts out of plumbing commands such as
@@ -438,7 +439,6 @@ static int check_updates(struct unpack_trees_options *o,
 	if (should_update_submodules())
 		load_gitmodules_file(index, &state);
 
-	enable_delayed_checkout(&state);
 	if (has_promisor_remote()) {
 		/*
 		 * Prefetch the objects that are to be checked out in the loop
@@ -461,6 +461,9 @@ static int check_updates(struct unpack_trees_options *o,
 					   to_fetch.oid, to_fetch.nr);
 		oid_array_clear(&to_fetch);
 	}
+
+	enable_delayed_checkout(&state);
+	init_parallel_checkout();
 	for (i = 0; i < index->cache_nr; i++) {
 		struct cache_entry *ce = index->cache[i];
 
@@ -474,6 +477,7 @@ static int check_updates(struct unpack_trees_options *o,
 		}
 	}
 	stop_progress(&progress);
+	errs |= run_parallel_checkout(&state);
 	errs |= finish_delayed_checkout(&state, NULL);
 
 	git_attr_set_direction(GIT_ATTR_CHECKIN);
 

[RFC,10/21] unpack-trees: add basic support for parallel checkout

Commit Message

Patch