
[v5,1/8] Btrfs: introduce a tree for items that map UUIDs to something

Message ID ef484aa41751485fc6301ce78b5e3cddaa3f9a52.1371749051.git.sbehrens@giantdisaster.de (mailing list archive)
State Superseded, archived

Commit Message

Stefan Behrens June 20, 2013, 5:45 p.m. UTC
Mapping UUIDs to subvolume IDs is an expensive operation today. The
current algorithm even has quadratic complexity (in the number of
existing subvolumes), which means that it takes minutes to send/receive
a single subvolume if 10,000 subvolumes exist. But even linear effort
would be too much, since it is wasted work: the data structures that
allow mapping UUIDs to subvolume IDs are rebuilt every time a btrfs
send/receive instance is started.

It is much more efficient to maintain a searchable, persistent data
structure in the filesystem, one that is updated whenever a
subvolume/snapshot is created or deleted, and whenever the received
subvolume UUID is set by the btrfs-receive tool.

Therefore this commit adds kernel code that maintains data structures
in the filesystem which allow quickly searching for a given UUID and
retrieving the data assigned to it, such as the subvolume ID that is
related to that UUID.

This commit adds a new tree to hold UUID-to-data mapping items. The
key of these items is the full UUID plus the key type BTRFS_UUID_KEY.
Multiple data blocks can be stored for a given UUID; a
type/length/value scheme is used.

Now follows the lengthy justification for why a new tree was added
instead of using the existing root tree:

The first approach was to not create another tree to hold UUID items,
but to put the items into the top root tree instead. Unfortunately this
confused the algorithm that assigns the objectid of subvolumes and
snapshots. The reason is that btrfs_find_free_objectid() calls
btrfs_find_highest_objectid() for the first subvolume or snapshot
created after mounting a filesystem, and this function simply searches
for the largest used objectid among the root tree keys to pick the next
objectid to assign. Of course, the UUID keys were always the ones with
the highest offset value, and the next assigned subvolume ID was
wastefully huge.

Using any other existing tree did not look proper. Applying a
workaround, such as setting the objectid to zero in the UUID item key
and implementing collision handling, would either add limitations (in
the case of a btrfs_extend_item() approach to handling the collisions)
or a lot of complexity and source code (in the case of looking up a
key that is free of collisions). Adding new code that introduces
limitations is not good, and adding code that is complex and lengthy
for no good reason is also not good. That is the justification for
introducing a completely new tree.

Signed-off-by: Stefan Behrens <sbehrens@giantdisaster.de>
---
 fs/btrfs/Makefile    |   3 +-
 fs/btrfs/ctree.h     |  50 ++++++
 fs/btrfs/uuid-tree.c | 480 +++++++++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 532 insertions(+), 1 deletion(-)

Comments

Zach Brown June 20, 2013, 7:47 p.m. UTC | #1
> +/* for items that use the BTRFS_UUID_KEY */
> +#define BTRFS_UUID_ITEM_TYPE_SUBVOL	0 /* for UUIDs assigned to subvols */
> +#define BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL	1 /* for UUIDs assigned to
> +						   * received subvols */
> +
> +/* a sequence of such items is stored under the BTRFS_UUID_KEY */
> +struct btrfs_uuid_item {
> +	__le16 type;	/* refer to BTRFS_UUID_ITEM_TYPE* defines above */
> +	__le32 len;	/* number of following 64bit values */
> +	__le64 subid[0];	/* sequence of subids */
> +} __attribute__ ((__packed__));
> +

[...]

>  /*
> + * Stores items that allow to quickly map UUIDs to something else.
> + * These items are part of the filesystem UUID tree.
> + * The key is built like this:
> + * (UUID_upper_64_bits, BTRFS_UUID_KEY, UUID_lower_64_bits).
> + */
> +#if BTRFS_UUID_SIZE != 16
> +#error "UUID items require BTRFS_UUID_SIZE == 16!"
> +#endif
> +#define BTRFS_UUID_KEY	251

Why do we need this btrfs_uuid_item structure?  Why not set the key type
to either _SUBVOL or _RECEIVED_SUBVOL instead of embedding structs with
those types under items with the constant BTRFS_UUID_KEY.  Then use the
item size to determine the number of u64 subids.  Then the item has a
simple array of u64s in the data which will be a lot easier to work
with.

> +/* btrfs_uuid_item */
> +BTRFS_SETGET_FUNCS(uuid_type, struct btrfs_uuid_item, type, 16);
> +BTRFS_SETGET_FUNCS(uuid_len, struct btrfs_uuid_item, len, 32);
> +BTRFS_SETGET_STACK_FUNCS(stack_uuid_type, struct btrfs_uuid_item, type, 16);
> +BTRFS_SETGET_STACK_FUNCS(stack_uuid_len, struct btrfs_uuid_item, len, 32);

This would all go away.

> +/*
> + * One key is used to store a sequence of btrfs_uuid_item items.
> + * Each item in the sequence contains a type information and a sequence of
> + * ids (together with the information about the size of the sequence of ids).
> + * {[btrfs_uuid_item type0 {id0, id1, ..., idN}],
> + *  ...,
> + *  [btrfs_uuid_item typeZ {id0, id1, ..., idN}]}
> + *
> + * It is forbidden to put multiple items with the same type under the same key.
> + * Instead the sequence of ids is extended and used to store any additional
> + * ids for the same item type.

This constraint, and the cost of ensuring it and repairing violations,
would go away.

> +static struct btrfs_uuid_item *btrfs_match_uuid_item_type(
> +		struct btrfs_path *path, u16 type)
> +{
> +	struct extent_buffer *eb;
> +	int slot;
> +	struct btrfs_uuid_item *ptr;
> +	u32 item_size;
> +
> +	eb = path->nodes[0];
> +	slot = path->slots[0];
> +	ptr = btrfs_item_ptr(eb, slot, struct btrfs_uuid_item);
> +	item_size = btrfs_item_size_nr(eb, slot);
> +	do {
> +		u16 sub_item_type;
> +		u64 sub_item_len;
> +
> +		if (item_size < sizeof(*ptr)) {
> +			pr_warn("btrfs: uuid item too short (%lu < %d)!\n",
> +				(unsigned long)item_size, (int)sizeof(*ptr));
> +			return NULL;
> +		}
> +		item_size -= sizeof(*ptr);
> +		sub_item_type = btrfs_uuid_type(eb, ptr);
> +		sub_item_len = btrfs_uuid_len(eb, ptr);
> +		if (sub_item_len * sizeof(u64) > item_size) {
> +			pr_warn("btrfs: uuid item too short (%llu > %lu)!\n",
> +				(unsigned long long)(sub_item_len *
> +						     sizeof(u64)),
> +				(unsigned long)item_size);
> +			return NULL;
> +		}
> +		if (sub_item_type == type)
> +			return ptr;
> +		item_size -= sub_item_len * sizeof(u64);
> +		ptr = 1 + (struct btrfs_uuid_item *)
> +			(((char *)ptr) + (sub_item_len * sizeof(u64)));
> +	} while (item_size);
>
> +static int btrfs_uuid_tree_lookup_prepare(struct btrfs_root *uuid_root,
> +					  u8 *uuid, u16 type,
> +					  struct btrfs_path *path,
> +					  struct btrfs_uuid_item **ptr)
> +{
> +	int ret;
> +	struct btrfs_key key;
> +
> +	if (!uuid_root) {
> +		WARN_ON_ONCE(1);
> +		ret = -ENOENT;
> +		goto out;
> +	}
> +
> +	btrfs_uuid_to_key(uuid, &key);
> +
> +	ret = btrfs_search_slot(NULL, uuid_root, &key, path, 0, 0);
> +	if (ret < 0)
> +		goto out;
> +	if (ret > 0) {
> +		ret = -ENOENT;
> +		goto out;
> +	}
> +
> +	*ptr = btrfs_match_uuid_item_type(path, type);
> +	if (!*ptr) {
> +		ret = -ENOENT;
> +		goto out;
> +	}
> +
> +	ret = 0;
> +
> +out:
> +	return ret;
> +}

All of this is replaced with the simple search_slot in the caller.

> +	offset = (unsigned long)ptr;
> +	while (sub_item_len > 0) {
> +		u64 data;
> +
> +		read_extent_buffer(eb, &data, offset, sizeof(data));
> +		data = le64_to_cpu(data);
> +		if (data == subid) {
> +			ret = 0;
> +			break;
> +		}
> +		offset += sizeof(data);
> +		sub_item_len--;
> +	}

This could be cleaned up a bit by comparing an on-stack little-endian
input subid with each little-endian subid in the item with
memcmp_extent_buffer().

> +	ret = btrfs_insert_empty_item(trans, uuid_root, path, &key,
> +				      sizeof(*ptr) + sizeof(subid));
> +	if (ret == -EEXIST) {
> +		ptr = btrfs_match_uuid_item_type(path, type);
> +		if (ptr) {
[...]
> +			btrfs_extend_item(uuid_root, path, sizeof(subid));

How does this extension avoid the BUG when the leaf containing the item
doesn't have room for the new subid?

- z
--
To unsubscribe from this list: send the line "unsubscribe linux-btrfs" in
the body of a message to majordomo@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Stefan Behrens June 21, 2013, 8:47 a.m. UTC | #2
On Thu, 20 Jun 2013 12:47:04 -0700, Zach Brown wrote:
> 
>> +/* for items that use the BTRFS_UUID_KEY */
>> +#define BTRFS_UUID_ITEM_TYPE_SUBVOL	0 /* for UUIDs assigned to subvols */
>> +#define BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL	1 /* for UUIDs assigned to
>> +						   * received subvols */
>> +
>> +/* a sequence of such items is stored under the BTRFS_UUID_KEY */
>> +struct btrfs_uuid_item {
>> +	__le16 type;	/* refer to BTRFS_UUID_ITEM_TYPE* defines above */
>> +	__le32 len;	/* number of following 64bit values */
>> +	__le64 subid[0];	/* sequence of subids */
>> +} __attribute__ ((__packed__));
>> +
> 
> [...]
> 
>>  /*
>> + * Stores items that allow to quickly map UUIDs to something else.
>> + * These items are part of the filesystem UUID tree.
>> + * The key is built like this:
>> + * (UUID_upper_64_bits, BTRFS_UUID_KEY, UUID_lower_64_bits).
>> + */
>> +#if BTRFS_UUID_SIZE != 16
>> +#error "UUID items require BTRFS_UUID_SIZE == 16!"
>> +#endif
>> +#define BTRFS_UUID_KEY	251
> 
> Why do we need this btrfs_uuid_item structure?  Why not set the key type
> to either _SUBVOL or _RECEIVED_SUBVOL instead of embedding structs with
> those types under items with the constant BTRFS_UUID_KEY.  Then use the
> item size to determine the number of u64 subids.  Then the item has a
> simple array of u64s in the data which will be a lot easier to work
> with.

Maintaining a 16 bit uuid_type field inside the item avoids consuming
type values in the key. The type field in the key is only 8 bits wide,
and 34 type values are already defined in ctree.h.

As long as such items live in separate trees, their key type value
could be reused in the future once the 8 bit type field is exhausted.

There was some discussion about this topic in #btrfs on 2013-04-26.
There are pros and cons. The uuid_type field in the item allows the
uuid items to be used generically outside of the uuid tree, since they
occupy only one value in the key's 8 bit type field. On the other
hand, if the 8 bit type field in the key is ever exhausted, a common
way to expand this field would save lines of code and avoid the
complexity of implementing multiplexing layers in multiple places,
although possibly with some added performance penalty.

Anybody else with an opinion on this topic?


>> +/* btrfs_uuid_item */
>> +BTRFS_SETGET_FUNCS(uuid_type, struct btrfs_uuid_item, type, 16);
>> +BTRFS_SETGET_FUNCS(uuid_len, struct btrfs_uuid_item, len, 32);
>> +BTRFS_SETGET_STACK_FUNCS(stack_uuid_type, struct btrfs_uuid_item, type, 16);
>> +BTRFS_SETGET_STACK_FUNCS(stack_uuid_len, struct btrfs_uuid_item, len, 32);
> 
> This would all go away.
> 
>> +/*
>> + * One key is used to store a sequence of btrfs_uuid_item items.
>> + * Each item in the sequence contains a type information and a sequence of
>> + * ids (together with the information about the size of the sequence of ids).
>> + * {[btrfs_uuid_item type0 {id0, id1, ..., idN}],
>> + *  ...,
>> + *  [btrfs_uuid_item typeZ {id0, id1, ..., idN}]}
>> + *
>> + * It is forbidden to put multiple items with the same type under the same key.
>> + * Instead the sequence of ids is extended and used to store any additional
>> + * ids for the same item type.
> 
> This constraint, and the cost of ensuring it and repairing violations,
> would go away.
> 
>> +static struct btrfs_uuid_item *btrfs_match_uuid_item_type(
>> +		struct btrfs_path *path, u16 type)
>> +{
>> +	struct extent_buffer *eb;
>> +	int slot;
>> +	struct btrfs_uuid_item *ptr;
>> +	u32 item_size;
>> +
>> +	eb = path->nodes[0];
>> +	slot = path->slots[0];
>> +	ptr = btrfs_item_ptr(eb, slot, struct btrfs_uuid_item);
>> +	item_size = btrfs_item_size_nr(eb, slot);
>> +	do {
>> +		u16 sub_item_type;
>> +		u64 sub_item_len;
>> +
>> +		if (item_size < sizeof(*ptr)) {
>> +			pr_warn("btrfs: uuid item too short (%lu < %d)!\n",
>> +				(unsigned long)item_size, (int)sizeof(*ptr));
>> +			return NULL;
>> +		}
>> +		item_size -= sizeof(*ptr);
>> +		sub_item_type = btrfs_uuid_type(eb, ptr);
>> +		sub_item_len = btrfs_uuid_len(eb, ptr);
>> +		if (sub_item_len * sizeof(u64) > item_size) {
>> +			pr_warn("btrfs: uuid item too short (%llu > %lu)!\n",
>> +				(unsigned long long)(sub_item_len *
>> +						     sizeof(u64)),
>> +				(unsigned long)item_size);
>> +			return NULL;
>> +		}
>> +		if (sub_item_type == type)
>> +			return ptr;
>> +		item_size -= sub_item_len * sizeof(u64);
>> +		ptr = 1 + (struct btrfs_uuid_item *)
>> +			(((char *)ptr) + (sub_item_len * sizeof(u64)));
>> +	} while (item_size);
>>
>> +static int btrfs_uuid_tree_lookup_prepare(struct btrfs_root *uuid_root,
>> +					  u8 *uuid, u16 type,
>> +					  struct btrfs_path *path,
>> +					  struct btrfs_uuid_item **ptr)
>> +{
>> +	int ret;
>> +	struct btrfs_key key;
>> +
>> +	if (!uuid_root) {
>> +		WARN_ON_ONCE(1);
>> +		ret = -ENOENT;
>> +		goto out;
>> +	}
>> +
>> +	btrfs_uuid_to_key(uuid, &key);
>> +
>> +	ret = btrfs_search_slot(NULL, uuid_root, &key, path, 0, 0);
>> +	if (ret < 0)
>> +		goto out;
>> +	if (ret > 0) {
>> +		ret = -ENOENT;
>> +		goto out;
>> +	}
>> +
>> +	*ptr = btrfs_match_uuid_item_type(path, type);
>> +	if (!*ptr) {
>> +		ret = -ENOENT;
>> +		goto out;
>> +	}
>> +
>> +	ret = 0;
>> +
>> +out:
>> +	return ret;
>> +}
> 
> All of this is replaced with the simple search_slot in the caller.
> 
>> +	offset = (unsigned long)ptr;
>> +	while (sub_item_len > 0) {
>> +		u64 data;
>> +
>> +		read_extent_buffer(eb, &data, offset, sizeof(data));
>> +		data = le64_to_cpu(data);
>> +		if (data == subid) {
>> +			ret = 0;
>> +			break;
>> +		}
>> +		offset += sizeof(data);
>> +		sub_item_len--;
>> +	}
> 
> This could be cleaned up a bit by comparing an on-stack little-endian
> input subid with each little-endian subid in the item with
> memcmp_extent_buffer().

This would save some CPU cycles for the repeated le64_to_cpu() and for
the memcpy(). The number of lines of code is equal either way. The
read_extent_buffer() way is more straightforward and readable, IMO.


>> +	ret = btrfs_insert_empty_item(trans, uuid_root, path, &key,
>> +				      sizeof(*ptr) + sizeof(subid));
>> +	if (ret == -EEXIST) {
>> +		ptr = btrfs_match_uuid_item_type(path, type);
>> +		if (ptr) {
> [...]
>> +			btrfs_extend_item(uuid_root, path, sizeof(subid));
> 
> How does this extension avoid the BUG when the leaf containing the item
> doesn't have room for the new subid?

btrfs_extend_item() does not BUG() when btrfs_search_slot() has been
called beforehand with ins_len > 0.

btrfs_search_slot() calls split_leaf(), and split_leaf() checks whether
the requested additional data will fit and returns -EOVERFLOW if it
does not.

The call chain is:
btrfs_insert_empty_item() -> btrfs_search_slot() -> split_leaf()

Thanks for your review comments.

Zach Brown June 21, 2013, 4:11 p.m. UTC | #3
> > Why do we need this btrfs_uuid_item structure?  Why not set the key type
> > to either _SUBVOL or _RECEIVED_SUBVOL instead of embedding structs with
> > those types under items with the constant BTRFS_UUID_KEY.  Then use the
> > item size to determine the number of u64 subids.  Then the item has a
> > simple array of u64s in the data which will be a lot easier to work
> > with.
> 
> Maintaining a 16 bit uuid_type field inside the item is done in order to
> avoid wasting type values for the key. The type field in the key has a
> width of 8 bits, so far 34 type values are defined in ctree.h.
> 
> As long as such items are in separated trees, their type value could be
> reused in the future when the 8 bit type field is exhausted.
> 
> There was some discussion in #btrfs about this topic on 2013-04-26.
> There are pros and cons. The uuid_type field in the item allows to use
> the uuid items generically outside of the uuid tree since it occupies
> only one type value in the 8 bit type field. On the other hand, if the 8
> bit type field in the key is exhausted, it saves lines of codes and
> avoids complexity to implement a common way to expand this field instead
> of implementing multiplexing layers at multiple places, although maybe
> with some added performance penalty.
> 
> Anybody else with an opinion for this topic?

Perhaps obviously, I'm strongly in favour of not rolling another layer
of indirection inside the items, especially when the code to implement
it is full of fragile pointer math.

> >> +	offset = (unsigned long)ptr;
> >> +	while (sub_item_len > 0) {
> >> +		u64 data;
> >> +
> >> +		read_extent_buffer(eb, &data, offset, sizeof(data));
> >> +		data = le64_to_cpu(data);
> >> +		if (data == subid) {
> >> +			ret = 0;
> >> +			break;
> >> +		}
> >> +		offset += sizeof(data);
> >> +		sub_item_len--;
> >> +	}
> > 
> > This could be cleaned up a bit by comparing an on-stack little-endian
> > input subid with each little-endian subid in the item with
> > memcmp_extent_buffer().
> 
> This would save some CPU cycles for the repeated le64_to_cpu() and for
> the memcpy(). The number of lines of code is equal for both ways.

Hmm?  It would be many fewer lines of code.

> read_extent_buffer() way is more straight forward and readable IMO.

> > How does this extension avoid the BUG when the leaf containing the item
> > doesn't have room for the new subid?
> 
> btrfs_extend_item() does not BUG() when you have called
> btrfs_search_slot() before with ins_len > 0.

Ah, got it.  Thanks.

- z
Chris Mason June 21, 2013, 4:20 p.m. UTC | #4
Quoting Stefan Behrens (2013-06-21 04:47:20)
> On Thu, 20 Jun 2013 12:47:04 -0700, Zach Brown wrote:
> > 
> >> +/* for items that use the BTRFS_UUID_KEY */
> >> +#define BTRFS_UUID_ITEM_TYPE_SUBVOL 0 /* for UUIDs assigned to subvols */
> >> +#define BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL        1 /* for UUIDs assigned to
> >> +                                               * received subvols */
> >> +
> >> +/* a sequence of such items is stored under the BTRFS_UUID_KEY */
> >> +struct btrfs_uuid_item {
> >> +    __le16 type;    /* refer to BTRFS_UUID_ITEM_TYPE* defines above */
> >> +    __le32 len;     /* number of following 64bit values */
> >> +    __le64 subid[0];        /* sequence of subids */
> >> +} __attribute__ ((__packed__));
> >> +
> > 
> > [...]
> > 
> >>  /*
> >> + * Stores items that allow to quickly map UUIDs to something else.
> >> + * These items are part of the filesystem UUID tree.
> >> + * The key is built like this:
> >> + * (UUID_upper_64_bits, BTRFS_UUID_KEY, UUID_lower_64_bits).
> >> + */
> >> +#if BTRFS_UUID_SIZE != 16
> >> +#error "UUID items require BTRFS_UUID_SIZE == 16!"
> >> +#endif
> >> +#define BTRFS_UUID_KEY      251
> > 
> > Why do we need this btrfs_uuid_item structure?  Why not set the key type
> > to either _SUBVOL or _RECEIVED_SUBVOL instead of embedding structs with
> > those types under items with the constant BTRFS_UUID_KEY.  Then use the
> > item size to determine the number of u64 subids.  Then the item has a
> > simple array of u64s in the data which will be a lot easier to work
> > with.
> 
> Maintaining a 16 bit uuid_type field inside the item is done in order to
> avoid wasting type values for the key. The type field in the key has a
> width of 8 bits, so far 34 type values are defined in ctree.h.
> 
> As long as such items are in separated trees, their type value could be
> reused in the future when the 8 bit type field is exhausted.
> 
> There was some discussion in #btrfs about this topic on 2013-04-26.
> There are pros and cons. The uuid_type field in the item allows to use
> the uuid items generically outside of the uuid tree since it occupies
> only one type value in the 8 bit type field. On the other hand, if the 8
> bit type field in the key is exhausted, it saves lines of codes and
> avoids complexity to implement a common way to expand this field instead
> of implementing multiplexing layers at multiple places, although maybe
> with some added performance penalty.
> 
> Anybody else with an opinion for this topic?

I've been thinking about this, and while I clearly did not have this use
of uuids in mind originally, they have become a key part of the FS.  They
deserve their own bits in the type field.

I know this is not an easy thing to redo, but long term it really looks
worth it to me.

-chris
Stefan Behrens June 24, 2013, 4:42 p.m. UTC | #5
On Fri, 21 Jun 2013 09:11:38 -0700, Zach Brown wrote:
>>>> +	offset = (unsigned long)ptr;
>>>> +	while (sub_item_len > 0) {
>>>> +		u64 data;
>>>> +
>>>> +		read_extent_buffer(eb, &data, offset, sizeof(data));
>>>> +		data = le64_to_cpu(data);
>>>> +		if (data == subid) {
>>>> +			ret = 0;
>>>> +			break;
>>>> +		}
>>>> +		offset += sizeof(data);
>>>> +		sub_item_len--;
>>>> +	}
>>>
>>> This could be cleaned up a bit by comparing an on-stack little-endian
>>> input subid with each little-endian subid in the item with
>>> memcmp_extent_buffer().
>>
>> This would save some CPU cycles for the repeated le64_to_cpu() and for
>> the memcpy(). The number of lines of code is equal for both ways.
> 
> Hmm?  It would be many fewer lines of code.

Are you thinking of something shorter than the following?

offset = (unsigned long)ptr;
subid = cpu_to_le64(subid);
while (sub_item_len > 0) {
	if (memcmp_extent_buffer(eb, &subid, offset,
				 sizeof(subid)) == 0) {
		ret = 0;
		break;
	}
	offset += sizeof(subid);
	sub_item_len--;
}

Zach Brown June 24, 2013, 6:10 p.m. UTC | #6
> >> This would save some CPU cycles for the repeated le64_to_cpu() and for
> >> the memcpy(). The number of lines of code is equal for both ways.
> > 
> > Hmm?  It would be many fewer lines of code.
> 
> Are you thinking of something shorter than the following?

That's better, yeah, but there's still some room left to go.  Almost all
of the remaining code is boiler-plate iteration that could be done with
a for(;;).

This could be a mini OCC contest! :)

> offset = (unsigned long)ptr;
> subid = cpu_to_le64(subid);

> while (sub_item_len > 0) {
> 	if (memcmp_extent_buffer(eb, &subid, offset,
> 				 sizeof(subid)) == 0) {
> 		ret = 0;
> 		break;
> 	}
> 	offset += sizeof(subid);
> 	sub_item_len--;
> }

roughly:

unsigned long end = offset + sub_item_len * sizeof(subid);

for (ret = 1; offset < end && ret; offset += sizeof(subid))
	ret = !!memcmp_extent_buffer(eb, &subid, offset,
				     sizeof(subid));

- z

Patch

diff --git a/fs/btrfs/Makefile b/fs/btrfs/Makefile
index 3932224..a550dfc 100644
--- a/fs/btrfs/Makefile
+++ b/fs/btrfs/Makefile
@@ -8,7 +8,8 @@  btrfs-y += super.o ctree.o extent-tree.o print-tree.o root-tree.o dir-item.o \
 	   extent_io.o volumes.o async-thread.o ioctl.o locking.o orphan.o \
 	   export.o tree-log.o free-space-cache.o zlib.o lzo.o \
 	   compression.o delayed-ref.o relocation.o delayed-inode.o scrub.o \
-	   reada.o backref.o ulist.o qgroup.o send.o dev-replace.o raid56.o
+	   reada.o backref.o ulist.o qgroup.o send.o dev-replace.o raid56.o \
+	   uuid-tree.o
 
 btrfs-$(CONFIG_BTRFS_FS_POSIX_ACL) += acl.o
 btrfs-$(CONFIG_BTRFS_FS_CHECK_INTEGRITY) += check-integrity.o
diff --git a/fs/btrfs/ctree.h b/fs/btrfs/ctree.h
index 76e4983..04447b6 100644
--- a/fs/btrfs/ctree.h
+++ b/fs/btrfs/ctree.h
@@ -91,6 +91,9 @@  struct btrfs_ordered_sum;
 /* holds quota configuration and tracking */
 #define BTRFS_QUOTA_TREE_OBJECTID 8ULL
 
+/* for storing items that use the BTRFS_UUID_KEY */
+#define BTRFS_UUID_TREE_OBJECTID 9ULL
+
 /* for storing balance parameters in the root tree */
 #define BTRFS_BALANCE_OBJECTID -4ULL
 
@@ -953,6 +956,18 @@  struct btrfs_dev_replace_item {
 	__le64 num_uncorrectable_read_errors;
 } __attribute__ ((__packed__));
 
+/* for items that use the BTRFS_UUID_KEY */
+#define BTRFS_UUID_ITEM_TYPE_SUBVOL	0 /* for UUIDs assigned to subvols */
+#define BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL	1 /* for UUIDs assigned to
+						   * received subvols */
+
+/* a sequence of such items is stored under the BTRFS_UUID_KEY */
+struct btrfs_uuid_item {
+	__le16 type;	/* refer to BTRFS_UUID_ITEM_TYPE* defines above */
+	__le32 len;	/* number of following 64bit values */
+	__le64 subid[0];	/* sequence of subids */
+} __attribute__ ((__packed__));
+
 /* different types of block groups (and chunks) */
 #define BTRFS_BLOCK_GROUP_DATA		(1ULL << 0)
 #define BTRFS_BLOCK_GROUP_SYSTEM	(1ULL << 1)
@@ -1922,6 +1937,17 @@  struct btrfs_ioctl_defrag_range_args {
 #define BTRFS_DEV_REPLACE_KEY	250
 
 /*
+ * Stores items that allow to quickly map UUIDs to something else.
+ * These items are part of the filesystem UUID tree.
+ * The key is built like this:
+ * (UUID_upper_64_bits, BTRFS_UUID_KEY, UUID_lower_64_bits).
+ */
+#if BTRFS_UUID_SIZE != 16
+#error "UUID items require BTRFS_UUID_SIZE == 16!"
+#endif
+#define BTRFS_UUID_KEY	251
+
+/*
  * string items are for debugging.  They just store a short string of
  * data in the FS
  */
@@ -2979,6 +3005,12 @@  BTRFS_SETGET_FUNCS(dev_replace_cursor_left, struct btrfs_dev_replace_item,
 BTRFS_SETGET_FUNCS(dev_replace_cursor_right, struct btrfs_dev_replace_item,
 		   cursor_right, 64);
 
+/* btrfs_uuid_item */
+BTRFS_SETGET_FUNCS(uuid_type, struct btrfs_uuid_item, type, 16);
+BTRFS_SETGET_FUNCS(uuid_len, struct btrfs_uuid_item, len, 32);
+BTRFS_SETGET_STACK_FUNCS(stack_uuid_type, struct btrfs_uuid_item, type, 16);
+BTRFS_SETGET_STACK_FUNCS(stack_uuid_len, struct btrfs_uuid_item, len, 32);
+
 BTRFS_SETGET_STACK_FUNCS(stack_dev_replace_src_devid,
 			 struct btrfs_dev_replace_item, src_devid, 64);
 BTRFS_SETGET_STACK_FUNCS(stack_dev_replace_cont_reading_from_srcdev_mode,
@@ -3414,6 +3446,24 @@  void btrfs_check_and_init_root_item(struct btrfs_root_item *item);
 void btrfs_update_root_times(struct btrfs_trans_handle *trans,
 			     struct btrfs_root *root);
 
+/* uuid-tree.c */
+int btrfs_lookup_uuid_subvol_item(struct btrfs_root *uuid_root, u8 *uuid,
+				  u64 *subvol_id);
+int btrfs_insert_uuid_subvol_item(struct btrfs_trans_handle *trans,
+				  struct btrfs_root *uuid_root, u8 *uuid,
+				  u64 subvol_id);
+int btrfs_del_uuid_subvol_item(struct btrfs_trans_handle *trans,
+			       struct btrfs_root *uuid_root, u8 *uuid,
+			       u64 subvol_id);
+int btrfs_lookup_uuid_received_subvol_item(struct btrfs_root *uuid_root,
+					   u8 *uuid, u64 *subvol_id);
+int btrfs_insert_uuid_received_subvol_item(struct btrfs_trans_handle *trans,
+					   struct btrfs_root *uuid_root,
+					   u8 *uuid, u64 subvol_id);
+int btrfs_del_uuid_received_subvol_item(struct btrfs_trans_handle *trans,
+					struct btrfs_root *uuid_root, u8 *uuid,
+					u64 subvol_id);
+
 /* dir-item.c */
 int btrfs_check_dir_item_collision(struct btrfs_root *root, u64 dir,
 			  const char *name, int name_len);
diff --git a/fs/btrfs/uuid-tree.c b/fs/btrfs/uuid-tree.c
new file mode 100644
index 0000000..3939a54
--- /dev/null
+++ b/fs/btrfs/uuid-tree.c
@@ -0,0 +1,480 @@ 
+/*
+ * Copyright (C) STRATO AG 2013.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public
+ * License v2 as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public
+ * License along with this program; if not, write to the
+ * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+ * Boston, MA 021110-1307, USA.
+ */
+#include <linux/uuid.h>
+#include <asm/unaligned.h>
+#include "ctree.h"
+#include "transaction.h"
+#include "disk-io.h"
+#include "print-tree.h"
+
+
+/*
+ * One key is used to store a sequence of btrfs_uuid_item items.
+ * Each item in the sequence contains a type information and a sequence of
+ * ids (together with the information about the size of the sequence of ids).
+ * {[btrfs_uuid_item type0 {id0, id1, ..., idN}],
+ *  ...,
+ *  [btrfs_uuid_item typeZ {id0, id1, ..., idN}]}
+ *
+ * It is forbidden to put multiple items with the same type under the same key.
+ * Instead the sequence of ids is extended and used to store any additional
+ * ids for the same item type.
+ */
+
+static void btrfs_uuid_to_key(u8 *uuid, struct btrfs_key *key)
+{
+	key->type = BTRFS_UUID_KEY;
+	key->objectid = get_unaligned_le64(uuid);
+	key->offset = get_unaligned_le64(uuid + sizeof(u64));
+}
+
+static struct btrfs_uuid_item *btrfs_match_uuid_item_type(
+		struct btrfs_path *path, u16 type)
+{
+	struct extent_buffer *eb;
+	int slot;
+	struct btrfs_uuid_item *ptr;
+	u32 item_size;
+
+	eb = path->nodes[0];
+	slot = path->slots[0];
+	ptr = btrfs_item_ptr(eb, slot, struct btrfs_uuid_item);
+	item_size = btrfs_item_size_nr(eb, slot);
+	do {
+		u16 sub_item_type;
+		u64 sub_item_len;
+
+		if (item_size < sizeof(*ptr)) {
+			pr_warn("btrfs: uuid item too short (%lu < %d)!\n",
+				(unsigned long)item_size, (int)sizeof(*ptr));
+			return NULL;
+		}
+		item_size -= sizeof(*ptr);
+		sub_item_type = btrfs_uuid_type(eb, ptr);
+		sub_item_len = btrfs_uuid_len(eb, ptr);
+		if (sub_item_len * sizeof(u64) > item_size) {
+			pr_warn("btrfs: uuid item too short (%llu > %lu)!\n",
+				(unsigned long long)(sub_item_len *
+						     sizeof(u64)),
+				(unsigned long)item_size);
+			return NULL;
+		}
+		if (sub_item_type == type)
+			return ptr;
+		item_size -= sub_item_len * sizeof(u64);
+		ptr = 1 + (struct btrfs_uuid_item *)
+			(((char *)ptr) + (sub_item_len * sizeof(u64)));
+	} while (item_size);
+
+	return NULL;
+}
+
+static int btrfs_uuid_tree_lookup_prepare(struct btrfs_root *uuid_root,
+					  u8 *uuid, u16 type,
+					  struct btrfs_path *path,
+					  struct btrfs_uuid_item **ptr)
+{
+	int ret;
+	struct btrfs_key key;
+
+	if (!uuid_root) {
+		WARN_ON_ONCE(1);
+		ret = -ENOENT;
+		goto out;
+	}
+
+	btrfs_uuid_to_key(uuid, &key);
+
+	ret = btrfs_search_slot(NULL, uuid_root, &key, path, 0, 0);
+	if (ret < 0)
+		goto out;
+	if (ret > 0) {
+		ret = -ENOENT;
+		goto out;
+	}
+
+	*ptr = btrfs_match_uuid_item_type(path, type);
+	if (!*ptr) {
+		ret = -ENOENT;
+		goto out;
+	}
+
+	ret = 0;
+
+out:
+	return ret;
+}
+
+/* return -ENOENT for !found, < 0 for errors, or 0 if an item was found */
+static int btrfs_uuid_tree_lookup(struct btrfs_root *uuid_root, u8 *uuid,
+				  u16 type, u64 subid)
+{
+	int ret;
+	struct btrfs_path *path;
+	struct extent_buffer *eb;
+	struct btrfs_uuid_item *ptr;
+	u32 sub_item_len;
+	unsigned long offset;
+
+	path = btrfs_alloc_path();
+	if (!path) {
+		ret = -ENOMEM;
+		goto out;
+	}
+
+	ret = btrfs_uuid_tree_lookup_prepare(uuid_root, uuid, type, path, &ptr);
+	if (ret < 0)
+		goto out;
+
+	eb = path->nodes[0];
+	sub_item_len = btrfs_uuid_len(eb, ptr);
+	WARN_ON_ONCE(sub_item_len == 0);
+	ret = -ENOENT;
+	ptr++;
+	offset = (unsigned long)ptr;
+	while (sub_item_len > 0) {
+		__le64 data_le;
+
+		read_extent_buffer(eb, &data_le, offset, sizeof(data_le));
+		if (le64_to_cpu(data_le) == subid) {
+			ret = 0;
+			break;
+		}
+		offset += sizeof(data_le);
+		sub_item_len--;
+	}
+
+out:
+	btrfs_free_path(path);
+	return ret;
+}
+
+/*
+ * return 0 and set *subid to the first stored id for this uuid/type,
+ * -ENOENT if no such item exists, or < 0 on other errors
+ */
+static int btrfs_uuid_tree_lookup_any(struct btrfs_root *uuid_root, u8 *uuid,
+				      u16 type, u64 *subid)
+{
+	int ret;
+	struct btrfs_path *path;
+	struct extent_buffer *eb;
+	struct btrfs_uuid_item *ptr;
+	u32 sub_item_len;
+
+	path = btrfs_alloc_path();
+	if (!path) {
+		ret = -ENOMEM;
+		goto out;
+	}
+
+	ret = btrfs_uuid_tree_lookup_prepare(uuid_root, uuid, type, path, &ptr);
+	if (ret < 0)
+		goto out;
+
+	eb = path->nodes[0];
+	sub_item_len = btrfs_uuid_len(eb, ptr);
+	WARN_ON_ONCE(sub_item_len == 0);
+	if (sub_item_len > 0) {
+		__le64 subid_le;
+
+		/* return the first stored id */
+		read_extent_buffer(eb, &subid_le, (unsigned long)(ptr + 1),
+				   sizeof(subid_le));
+		*subid = le64_to_cpu(subid_le);
+		ret = 0;
+	} else {
+		ret = -ENOENT;
+	}
+
+out:
+	btrfs_free_path(path);
+	return ret;
+}
+
+/*
+ * The caller must make sure that the entry to add does not already
+ * exist, this function does not check for duplicates.
+ */
+static int btrfs_uuid_tree_add(struct btrfs_trans_handle *trans,
+			       struct btrfs_root *uuid_root, u8 *uuid,
+			       u16 type, u64 subid)
+{
+	int ret;
+	struct btrfs_path *path = NULL;
+	struct btrfs_key key;
+	struct extent_buffer *eb;
+	int slot;
+	struct btrfs_uuid_item *ptr;
+	u32 item_size;
+
+	if (!uuid_root) {
+		WARN_ON_ONCE(1);
+		ret = -EINVAL;
+		goto out;
+	}
+
+	btrfs_uuid_to_key(uuid, &key);
+
+	path = btrfs_alloc_path();
+	if (!path) {
+		ret = -ENOMEM;
+		goto out;
+	}
+
+	ret = btrfs_insert_empty_item(trans, uuid_root, path, &key,
+				      sizeof(*ptr) + sizeof(subid));
+	if (ret == -EEXIST) {
+		ptr = btrfs_match_uuid_item_type(path, type);
+		if (ptr) {
+			/*
+			 * An item with that type already exists.
+			 * Extend the item and store the subid at the
+			 * location of the first id of this type.
+			 */
+			unsigned long start;
+			unsigned long move_dst;
+			unsigned long move_src;
+			unsigned long move_len;
+
+			btrfs_extend_item(uuid_root, path, sizeof(subid));
+			ptr = (struct btrfs_uuid_item *)
+				(((char *)ptr) - sizeof(subid));
+			eb = path->nodes[0];
+			slot = path->slots[0];
+			item_size = btrfs_item_size_nr(eb, slot);
+			WARN_ON(btrfs_uuid_len(eb, ptr) == 0);
+			btrfs_set_uuid_len(eb, ptr,
+					   btrfs_uuid_len(eb, ptr) + 1);
+			ptr++;
+			start = btrfs_item_ptr_offset(eb, slot);
+			move_dst = ((unsigned long)ptr) + sizeof(subid);
+			move_src = (unsigned long)ptr;
+			move_len = item_size - (move_dst - start);
+			memmove_extent_buffer(eb, move_dst, move_src, move_len);
+
+			goto write_subid;
+		} else {
+			btrfs_extend_item(uuid_root, path,
+					  sizeof(*ptr) + sizeof(subid));
+		}
+	} else if (ret < 0) {
+		pr_warn("btrfs: insert uuid item failed %d (0x%016llx, 0x%016llx) type %lu!\n",
+			ret, (unsigned long long)key.objectid,
+			(unsigned long long)key.offset,
+			(unsigned long)type);
+		goto out;
+	}
+
+	/*
+	 * This type occurs for the first time in this item. Either append
+	 * it after the existing sub-items of other types, or write the
+	 * very first sub-item.
+	 */
+	eb = path->nodes[0];
+	slot = path->slots[0];
+	ptr = btrfs_item_ptr(eb, slot, struct btrfs_uuid_item);
+	item_size = btrfs_item_size_nr(eb, slot);
+	ptr = (struct btrfs_uuid_item *)
+		(((char *)ptr) + item_size - (sizeof(*ptr) + sizeof(subid)));
+	btrfs_set_uuid_type(eb, ptr, type);
+	btrfs_set_uuid_len(eb, ptr, 1);
+	ptr++;
+
+write_subid:
+	ret = 0;
+	{
+		__le64 subid_le = cpu_to_le64(subid);
+
+		write_extent_buffer(eb, &subid_le, (unsigned long)ptr,
+				    sizeof(subid_le));
+	}
+	btrfs_mark_buffer_dirty(eb);
+
+out:
+	btrfs_free_path(path);
+	return ret;
+}
+
+static int btrfs_uuid_tree_rem(struct btrfs_trans_handle *trans,
+			       struct btrfs_root *uuid_root, u8 *uuid,
+			       u16 type, u64 subid)
+{
+	int ret;
+	struct btrfs_path *path = NULL;
+	struct btrfs_key key;
+	struct extent_buffer *eb;
+	int slot;
+	struct btrfs_uuid_item *ptr_start;
+	unsigned long offset;
+	u32 item_size;
+	u32 id_index;
+	unsigned long start;
+	unsigned long move_dst;
+	unsigned long move_src;
+	unsigned long move_len;
+
+	if (!uuid_root) {
+		WARN_ON_ONCE(1);
+		ret = -EINVAL;
+		goto out;
+	}
+
+	btrfs_uuid_to_key(uuid, &key);
+
+	path = btrfs_alloc_path();
+	if (!path) {
+		ret = -ENOMEM;
+		goto out;
+	}
+
+	ret = btrfs_search_slot(trans, uuid_root, &key, path, -1, 1);
+	if (ret < 0) {
+		pr_warn("btrfs: error %d while searching for uuid item!\n",
+			ret);
+		goto out;
+	}
+	if (ret > 0) {
+		ret = -ENOENT;
+		goto out;
+	}
+
+	ptr_start = btrfs_match_uuid_item_type(path, type);
+	if (!ptr_start) {
+		/* case 1: no entry for that type is found */
+		ret = -ENOENT;
+		goto out;
+	}
+
+	eb = path->nodes[0];
+	slot = path->slots[0];
+	start = btrfs_item_ptr_offset(eb, slot);
+	item_size = btrfs_item_size_nr(eb, slot);
+	id_index = btrfs_uuid_len(eb, ptr_start);
+	offset = (unsigned long)(ptr_start + 1);
+	while (id_index > 0) {
+		__le64 subid_le;
+
+		read_extent_buffer(eb, &subid_le, offset, sizeof(subid_le));
+		if (le64_to_cpu(subid_le) == subid)
+			break;
+		offset += sizeof(subid_le);
+		id_index--;
+	}
+
+	if (!id_index) {
+		/*
+		 * case 2: an entry for that type is found, but no match
+		 * for the id
+		 */
+		ret = -ENOENT;
+		goto out;
+	}
+
+	if (btrfs_uuid_len(eb, ptr_start) == 1) {
+		if (item_size == sizeof(*ptr_start) + sizeof(subid)) {
+			/*
+			 * case 3: no other types and ids are stored,
+			 * delete the full item
+			 */
+			ret = btrfs_del_item(trans, uuid_root, path);
+			goto out;
+		} else {
+			/*
+			 * case 4: No other ids for the particular type
+			 * are stored, but other types exist. Shrink the
+			 * item by the size of an id plus the size of the
+			 * item for that type.
+			 */
+			move_dst = (unsigned long)ptr_start;
+		}
+	} else {
+		/*
+		 * case 5: Other ids for that particular type are stored.
+		 * Shrink the item by the size of an id.
+		 */
+		move_dst = offset;
+		WARN_ON(btrfs_uuid_len(eb, ptr_start) == 0);
+		btrfs_set_uuid_len(eb, ptr_start,
+				   btrfs_uuid_len(eb, ptr_start) - 1);
+	}
+	move_src = offset + sizeof(subid);
+	move_len = item_size - (move_src - start);
+
+	memmove_extent_buffer(eb, move_dst, move_src, move_len);
+	btrfs_truncate_item(uuid_root, path, item_size - (move_src - move_dst),
+			    1);
+
+out:
+	btrfs_free_path(path);
+	return ret;
+}
+
+int btrfs_lookup_uuid_subvol_item(struct btrfs_root *uuid_root, u8 *uuid,
+				  u64 *subvol_id)
+{
+	return btrfs_uuid_tree_lookup_any(uuid_root, uuid,
+					  BTRFS_UUID_ITEM_TYPE_SUBVOL,
+					  subvol_id);
+}
+
+int btrfs_insert_uuid_subvol_item(struct btrfs_trans_handle *trans,
+				  struct btrfs_root *uuid_root, u8 *uuid,
+				  u64 subvol_id)
+{
+	int ret;
+
+	ret = btrfs_uuid_tree_lookup(uuid_root, uuid,
+				     BTRFS_UUID_ITEM_TYPE_SUBVOL, subvol_id);
+	if (ret == -ENOENT)
+		ret = btrfs_uuid_tree_add(trans, uuid_root, uuid,
+					  BTRFS_UUID_ITEM_TYPE_SUBVOL,
+					  subvol_id);
+	return ret;
+}
+
+int btrfs_del_uuid_subvol_item(struct btrfs_trans_handle *trans,
+			       struct btrfs_root *uuid_root, u8 *uuid,
+			       u64 subvol_id)
+{
+	return btrfs_uuid_tree_rem(trans, uuid_root, uuid,
+				   BTRFS_UUID_ITEM_TYPE_SUBVOL, subvol_id);
+}
+
+int btrfs_lookup_uuid_received_subvol_item(struct btrfs_root *uuid_root,
+					   u8 *uuid, u64 *subvol_id)
+{
+	return btrfs_uuid_tree_lookup_any(uuid_root, uuid,
+					  BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL,
+					  subvol_id);
+}
+
+int btrfs_insert_uuid_received_subvol_item(struct btrfs_trans_handle *trans,
+					   struct btrfs_root *uuid_root,
+					   u8 *uuid, u64 subvol_id)
+{
+	int ret;
+
+	ret = btrfs_uuid_tree_lookup(uuid_root, uuid,
+				     BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL,
+				     subvol_id);
+	if (ret == -ENOENT)
+		ret = btrfs_uuid_tree_add(trans, uuid_root, uuid,
+					  BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL,
+					  subvol_id);
+	return ret;
+}
+
+int btrfs_del_uuid_received_subvol_item(struct btrfs_trans_handle *trans,
+					struct btrfs_root *uuid_root, u8 *uuid,
+					u64 subvol_id)
+{
+	return btrfs_uuid_tree_rem(trans, uuid_root, uuid,
+				   BTRFS_UUID_ITEM_TYPE_RECEIVED_SUBVOL,
+				   subvol_id);
+}