On 22.12.2017 00:42, Liu Bo wrote: > We've observed that btrfs_get_extent() and merge_extent_mapping() could > return -EEXIST in several cases, and they are caused by some racy > condition, e.g dio read vs dio write, which makes the problem very tricky > to reproduce. > > This adds extent map selftests in order to simulate those racy situations. > > Signed-off-by: Liu Bo <bo.li....@oracle.com> > --- > fs/btrfs/Makefile | 2 +- > fs/btrfs/tests/btrfs-tests.c | 3 + > fs/btrfs/tests/btrfs-tests.h | 1 + > fs/btrfs/tests/extent-map-tests.c | 202 > ++++++++++++++++++++++++++++++++++++++ > 4 files changed, 207 insertions(+), 1 deletion(-) > create mode 100644 fs/btrfs/tests/extent-map-tests.c > > diff --git a/fs/btrfs/Makefile b/fs/btrfs/Makefile > index 6fe881d..0c43736 100644 > --- a/fs/btrfs/Makefile > +++ b/fs/btrfs/Makefile > @@ -19,4 +19,4 @@ btrfs-$(CONFIG_BTRFS_FS_REF_VERIFY) += ref-verify.o > btrfs-$(CONFIG_BTRFS_FS_RUN_SANITY_TESTS) += tests/free-space-tests.o \ > tests/extent-buffer-tests.o tests/btrfs-tests.o \ > tests/extent-io-tests.o tests/inode-tests.o tests/qgroup-tests.o \ > - tests/free-space-tree-tests.o > + tests/free-space-tree-tests.o tests/extent-map-tests.o > diff --git a/fs/btrfs/tests/btrfs-tests.c b/fs/btrfs/tests/btrfs-tests.c > index d3f2537..9786d8c 100644 > --- a/fs/btrfs/tests/btrfs-tests.c > +++ b/fs/btrfs/tests/btrfs-tests.c > @@ -277,6 +277,9 @@ int btrfs_run_sanity_tests(void) > goto out; > } > } > + ret = btrfs_test_extent_map(); > + if (ret) > + goto out; > out: > btrfs_destroy_test_fs(); > return ret; > diff --git a/fs/btrfs/tests/btrfs-tests.h b/fs/btrfs/tests/btrfs-tests.h > index 266f1e3..bc0615b 100644 > --- a/fs/btrfs/tests/btrfs-tests.h > +++ b/fs/btrfs/tests/btrfs-tests.h > @@ -33,6 +33,7 @@ int btrfs_test_extent_io(u32 sectorsize, u32 nodesize); > int btrfs_test_inodes(u32 sectorsize, u32 nodesize); > int btrfs_test_qgroups(u32 sectorsize, u32 nodesize); > int btrfs_test_free_space_tree(u32 sectorsize, u32 nodesize); > +int btrfs_test_extent_map(void); > struct inode *btrfs_new_test_inode(void); > struct btrfs_fs_info *btrfs_alloc_dummy_fs_info(u32 nodesize, u32 > sectorsize); > void btrfs_free_dummy_fs_info(struct btrfs_fs_info *fs_info); > diff --git a/fs/btrfs/tests/extent-map-tests.c > b/fs/btrfs/tests/extent-map-tests.c > new file mode 100644 > index 0000000..0407396 > --- /dev/null > +++ b/fs/btrfs/tests/extent-map-tests.c > @@ -0,0 +1,202 @@ > +/* > + * Copyright (C) 2017 Oracle. All rights reserved. > + * > + * This program is free software; you can redistribute it and/or > + * modify it under the terms of the GNU General Public > + * License v2 as published by the Free Software Foundation. > + * > + * This program is distributed in the hope that it will be useful, > + * but WITHOUT ANY WARRANTY; without even the implied warranty of > + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU > + * General Public License for more details. > + * > + * You should have received a copy of the GNU General Public > + * License along with this program; if not, write to the > + * Free Software Foundation, Inc., 59 Temple Place - Suite 330, > + * Boston, MA 021110-1307, USA. > + */ > + > +#include <linux/types.h> > +#include "btrfs-tests.h" > +#include "../ctree.h" > + > +static void free_extent_map_tree(struct extent_map_tree *em_tree) > +{ > + struct extent_map *em; > + struct rb_node *node; > + > + while (!RB_EMPTY_ROOT(&em_tree->map)) { > + node = rb_first(&em_tree->map); > + em = rb_entry(node, struct extent_map, rb_node); > + remove_extent_mapping(em_tree, em); > + > +#ifdef CONFIG_BTRFS_DEBUG > + if (refcount_read(&em->refs) != 1) { > + test_msg( > + "Oops we have a em leak: em (start 0x%llx len > 0x%llx block_start 0x%llx block_len 0x%llx) refs %d\n", > + em->start, em->len, em->block_start, > + em->block_len, refcount_read(&em->refs)); > + > + refcount_set(&em->refs, 1); > + } > +#endif > + free_extent_map(em); > + } > +} > + > +/* > + * Test scenario: > + * > + * Suppose that no extent map has been loaded into memory yet, there is a > file > + * extent [0, 16K), followed by another file extent [16K, 20K), two dio reads > + * are entering btrfs_get_extent() concurrently, t1 is reading [8K, 16K), t2 > is > + * reading [0, 8K) > + * > + * t1 t2 > + * btrfs_get_extent() btrfs_get_extent() > + * -> lookup_extent_mapping() ->lookup_extent_mapping() > + * -> add_extent_mapping(0, 16K) > + * -> return em > + * ->add_extent_mapping(0, 16K) > + * -> #handle -EEXIST > + */ > +static void test_case_1(struct extent_map_tree *em_tree) > +{
So here you are testing the "fully overlapping" case in btrfs_add_extent_mapping. What about another test case about merging 2 adjacent extents i.e. this block of code: } else if (start >= extent_map_end(existing) || start <= existing->start) { > + struct extent_map *em; > + u64 start = 0; > + u64 len = SZ_8K; > + int ret; > + > + em = alloc_extent_map(); > + if (!em) > + /* Skip the test on error. */ > + return; > + > + /* Add [0, 16K) */ > + em->start = 0; > + em->len = SZ_16K; > + em->block_start = 0; > + em->block_len = SZ_16K; > + ret = add_extent_mapping(em_tree, em, 0); > + ASSERT(ret == 0); > + free_extent_map(em); > + > + /* Add [16K, 20K) following [0, 16K) */ > + em = alloc_extent_map(); > + if (!em) > + goto out; > + > + em->start = SZ_16K; > + em->len = SZ_4K; > + em->block_start = SZ_32K; /* avoid merging */ > + em->block_len = SZ_4K; > + ret = add_extent_mapping(em_tree, em, 0); > + ASSERT(ret == 0); > + free_extent_map(em); > + > + em = alloc_extent_map(); > + if (!em) > + goto out; > + > + /* Add [0, 8K), should return [0, 16K) instead. */ > + em->start = start; > + em->len = len; > + em->block_start = start; > + em->block_len = len; Any particular reason you are using start/len and not the constants as in the previous 2 extent insertion cases? Makes it a lot easier to see what's happening without reading the above variables? > + ret = btrfs_add_extent_mapping(em_tree, &em, em->start, em->len); > + if (ret) > + test_msg("case1 [%llu %llu]: ret %d\n", > + start, start + len, ret); > + if (em && > + (em->start != 0 || extent_map_end(em) != SZ_16K || > + em->block_start != 0 || em->block_len != SZ_16K)) > + test_msg("case1 [%llu %llu]: ret %d return a wrong em (start > %llu len %llu block_start %llu block_len %llu\n", > + start, start + len, ret, em->start, em->len, > + em->block_start, em->block_len); > + free_extent_map(em); > +out: > + /* free memory */ > + free_extent_map_tree(em_tree); > +} > + > +/* > + * Test scenario: > + * > + * Reading the inline ending up with EEXIST, ie. read an inline > + * extent and discard page cache and read it again. > + */ > +static void test_case_2(struct extent_map_tree *em_tree) > +{ > + struct extent_map *em; > + int ret; > + > + em = alloc_extent_map(); > + if (!em) > + /* Skip the test on error. */ > + return; > + > + /* Add [0, 1K) */ > + em->start = 0; > + em->len = SZ_1K; > + em->block_start = EXTENT_MAP_INLINE; > + em->block_len = (u64)-1; > + ret = add_extent_mapping(em_tree, em, 0); > + ASSERT(ret == 0); > + free_extent_map(em); > + > + /* Add [4K, 4K) following [0, 1K) */ > + em = alloc_extent_map(); > + if (!em) > + goto out; > + > + em->start = SZ_4K; > + em->len = SZ_4K; > + em->block_start = SZ_4K; > + em->block_len = SZ_4K; > + ret = add_extent_mapping(em_tree, em, 0); > + ASSERT(ret == 0); > + free_extent_map(em); > + > + em = alloc_extent_map(); > + if (!em) > + goto out; > + > + /* Add [0, 1K) */ > + em->start = 0; > + em->len = SZ_1K; > + em->block_start = EXTENT_MAP_INLINE; > + em->block_len = (u64)-1; > + ret = btrfs_add_extent_mapping(em_tree, &em, em->start, em->len); > + if (ret) > + test_msg("case2 [0 1K]: ret %d\n", ret); > + if (em && > + (em->start != 0 || extent_map_end(em) != SZ_1K || > + em->block_start != EXTENT_MAP_INLINE || em->block_len != (u64)-1)) > + test_msg("case2 [0 1K]: ret %d return a wrong em (start %llu > len %llu block_start %llu block_len %llu\n", > + ret, em->start, em->len, em->block_start, > + em->block_len); > + free_extent_map(em); > +out: > + /* free memory */ > + free_extent_map_tree(em_tree); > +} > + > +int btrfs_test_extent_map() > +{ > + struct extent_map_tree *em_tree; > + > + test_msg("Running extent_map tests\n"); > + > + em_tree = kzalloc(sizeof(*em_tree), GFP_KERNEL); > + if (!em_tree) > + /* Skip the test on error. */ > + return 0; > + > + extent_map_tree_init(em_tree); > + > + test_case_1(em_tree); > + test_case_2(em_tree); > + > + kfree(em_tree); > + return 0; > +} > -- To unsubscribe from this list: send the line "unsubscribe linux-btrfs" in the body of a message to majord...@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html