In an instrumented testing it is possible that the mount and a newer mkfs.btrfs thread on the same device can race and if the new mkfs.btrfs wins it will free the older fs_devices, then the mount thread will lead to oops.
Thread1 Thread2 ------- ------- mkfs.btrfs -fq /dev/sdb mount /dev/sdb /btrfs |_btrfs_mount_root() |_btrfs_scan_one_device(... &fs_devices) mkfs.btrfs -fq /dev/sdb |_btrfs_contol_ioctl() |_btrfs_scan_one_device(... &fs_devices) |_:: |_btrfs_free_stale_devices() |_btrfs_open_devices(fs_devices ..) <-- stale fs_devices. Fix this with a mutually exclusive flag BTRFS_VOL_FLAG_EXCL_OPS. Signed-off-by: Anand Jain <anand.j...@oracle.com> --- fs/btrfs/super.c | 6 ++++++ fs/btrfs/volumes.c | 10 +++++++++- fs/btrfs/volumes.h | 1 + 3 files changed, 16 insertions(+), 1 deletion(-) diff --git a/fs/btrfs/super.c b/fs/btrfs/super.c index f0c13defc9eb..b60e7cbe39f5 100644 --- a/fs/btrfs/super.c +++ b/fs/btrfs/super.c @@ -1565,7 +1565,13 @@ static struct dentry *btrfs_mount_root(struct file_system_type *fs_type, goto error_fs_info; } + if (test_and_set_bit(BTRFS_VOLUME_STATE_EXCL_OPS, &fs_devices->volume_state)) { + error = -EBUSY; + goto error_fs_info; + } + error = btrfs_open_devices(fs_devices, mode, fs_type); + clear_bit(BTRFS_VOLUME_STATE_EXCL_OPS, &fs_devices->volume_state); if (error) goto error_fs_info; diff --git a/fs/btrfs/volumes.c b/fs/btrfs/volumes.c index 87a4b12f98e3..3137cc990550 100644 --- a/fs/btrfs/volumes.c +++ b/fs/btrfs/volumes.c @@ -635,7 +635,7 @@ static void pending_bios_fn(struct btrfs_work *work) * devices. */ static void free_stale_devices(const char *path, - struct btrfs_device *skip_device) + struct btrfs_device *skip_device) { struct btrfs_fs_devices *fs_devices, *tmp_fs_devices; struct btrfs_device *device, *tmp_device; @@ -643,9 +643,15 @@ static void free_stale_devices(const char *path, list_for_each_entry_safe(fs_devices, tmp_fs_devices, &fs_uuids, fs_list) { + if (test_and_set_bit(BTRFS_VOLUME_STATE_EXCL_OPS, + &fs_devices->volume_state)) + continue; + mutex_lock(&fs_devices->device_list_mutex); if (fs_devices->opened) { mutex_unlock(&fs_devices->device_list_mutex); + clear_bit(BTRFS_VOLUME_STATE_EXCL_OPS, + &fs_devices->volume_state); continue; } @@ -680,6 +686,8 @@ static void free_stale_devices(const char *path, list_del(&fs_devices->fs_list); free_fs_devices(fs_devices); } + clear_bit(BTRFS_VOLUME_STATE_EXCL_OPS, + &fs_devices->volume_state); } } diff --git a/fs/btrfs/volumes.h b/fs/btrfs/volumes.h index cd18916f2bbc..60eea973a501 100644 --- a/fs/btrfs/volumes.h +++ b/fs/btrfs/volumes.h @@ -214,6 +214,7 @@ BTRFS_DEVICE_GETSET_FUNCS(bytes_used); */ #define BTRFS_VOLUME_STATE_ROTATING (0) #define BTRFS_VOLUME_STATE_SEEDING (1) +#define BTRFS_VOLUME_STATE_EXCL_OPS (2) struct btrfs_fs_devices { u8 fsid[BTRFS_FSID_SIZE]; /* FS specific uuid */ -- 2.15.0 -- To unsubscribe from this list: send the line "unsubscribe linux-btrfs" in the body of a message to majord...@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html