On 2018/10/23 下午5:41, Su Yue wrote:
> From: Su Yanjun <suyj.f...@cn.fujitsu.com>
> 
> In original mode, if some file extent item has unaligned extent backref,
> fixup_extent_refs can't repair it. This patch will check extent alignment
> then delete file extent with unaligned extent backref.

This looks a little strange to me.

You mean, an unaligned FILE EXTENT has an unaligned EXTENT_ITEM?

Then why not just delete the EXTENT_ITEM directly? No need to go back
checking if it has a corresponding EXTENT_DATA since unaligned one is
definitely corrupted.

For corrupted EXTENT_DATA, it should get deleted when we check fs tree.

This would save you a lot of codes.

Thanks,
Qu

> 
> Signed-off-by: Su Yanjun <suyj.f...@cn.fujitsu.com>
> ---
>  check/main.c          | 278 +++++++++++++++++++++++++++++++++++++++++-
>  check/mode-original.h |  13 ++
>  ctree.h               |   2 +
>  disk-io.c             |   1 +
>  4 files changed, 293 insertions(+), 1 deletion(-)
> 
> diff --git a/check/main.c b/check/main.c
> index 90d9fd570287..b5e68b3241e5 100644
> --- a/check/main.c
> +++ b/check/main.c
> @@ -460,6 +460,8 @@ static struct inode_record *clone_inode_rec(struct 
> inode_record *orig_rec)
>       struct inode_backref *backref;
>       struct inode_backref *orig;
>       struct inode_backref *tmp;
> +     struct unaligned_extent_rec_t *src;
> +     struct unaligned_extent_rec_t *dst;
>       struct rb_node *rb;
>       size_t size;
>       int ret;
> @@ -470,6 +472,7 @@ static struct inode_record *clone_inode_rec(struct 
> inode_record *orig_rec)
>       memcpy(rec, orig_rec, sizeof(*rec));
>       rec->refs = 1;
>       INIT_LIST_HEAD(&rec->backrefs);
> +     INIT_LIST_HEAD(&rec->unaligned_extent_recs);
>       rec->holes = RB_ROOT;
>  
>       list_for_each_entry(orig, &orig_rec->backrefs, list) {
> @@ -483,6 +486,17 @@ static struct inode_record *clone_inode_rec(struct 
> inode_record *orig_rec)
>               list_add_tail(&backref->list, &rec->backrefs);
>       }
>  
> +     list_for_each_entry(src, &orig_rec->unaligned_extent_recs, list) {
> +             size = sizeof(*src);
> +             dst = malloc(size);
> +             if (!dst) {
> +                     ret = -ENOMEM;
> +                     goto cleanup;
> +             }
> +             memcpy(dst, src, size);
> +             list_add_tail(&dst->list, &rec->unaligned_extent_recs);
> +     }
> +
>       ret = copy_file_extent_holes(&rec->holes, &orig_rec->holes);
>       if (ret < 0)
>               goto cleanup_rb;
> @@ -506,6 +520,13 @@ cleanup:
>                       free(orig);
>               }
>  
> +     if (!list_empty(&rec->unaligned_extent_recs))
> +             list_for_each_entry_safe(src, dst, &rec->unaligned_extent_recs,
> +                             list) {
> +                     list_del(&src->list);
> +                     free(src);
> +             }
> +
>       free(rec);
>  
>       return ERR_PTR(ret);
> @@ -643,6 +664,7 @@ static struct inode_record *get_inode_rec(struct 
> cache_tree *inode_cache,
>               rec->extent_start = (u64)-1;
>               rec->refs = 1;
>               INIT_LIST_HEAD(&rec->backrefs);
> +             INIT_LIST_HEAD(&rec->unaligned_extent_recs);
>               rec->holes = RB_ROOT;
>  
>               node = malloc(sizeof(*node));
> @@ -664,6 +686,18 @@ static struct inode_record *get_inode_rec(struct 
> cache_tree *inode_cache,
>       return rec;
>  }
>  
> +static void free_unaligned_extent_recs(struct list_head 
> *unaligned_extent_recs)
> +{
> +     struct unaligned_extent_rec_t *urec;
> +
> +     while (!list_empty(unaligned_extent_recs)) {
> +             urec = list_entry(unaligned_extent_recs->next,
> +                             struct unaligned_extent_rec_t, list);
> +             list_del(&urec->list);
> +             free(urec);
> +     }
> +}
> +
>  static void free_inode_rec(struct inode_record *rec)
>  {
>       struct inode_backref *backref;
> @@ -676,6 +710,7 @@ static void free_inode_rec(struct inode_record *rec)
>               list_del(&backref->list);
>               free(backref);
>       }
> +     free_unaligned_extent_recs(&rec->unaligned_extent_recs);
>       free_file_extent_holes(&rec->holes);
>       free(rec);
>  }
> @@ -2474,18 +2509,154 @@ out:
>       return ret;
>  }
>  
> +static int btrfs_delete_item(struct btrfs_trans_handle *trans,
> +             struct btrfs_root *root, struct btrfs_key *key)
> +{
> +     struct btrfs_path path;
> +     int ret = 0;
> +
> +     btrfs_init_path(&path);
> +
> +     ret = btrfs_search_slot(trans, root, key, &path, -1, 1);
> +     if (ret) {
> +             if (ret > 0)
> +                     ret = -ENOENT;
> +
> +             btrfs_release_path(&path);
> +             return ret;
> +     }
> +
> +     ret = btrfs_del_item(trans, root, &path);
> +
> +     btrfs_release_path(&path);
> +     return ret;
> +}
> +
> +static int find_file_extent_offset_by_bytenr(struct btrfs_root *root,
> +             u64 owner, u64 bytenr, u64 *offset_ret)
> +{
> +     int ret = 0;
> +     struct btrfs_path path;
> +     struct btrfs_key key;
> +     struct btrfs_key found_key;
> +     struct btrfs_file_extent_item *fi;
> +     struct extent_buffer *leaf;
> +     u64 disk_bytenr;
> +     int slot;
> +
> +     btrfs_init_path(&path);
> +
> +     key.objectid = owner;
> +     key.type = BTRFS_INODE_ITEM_KEY;
> +     key.offset = 0;
> +
> +     ret = btrfs_search_slot(NULL, root, &key, &path, 0, 0);
> +     if (ret) {
> +             if (ret > 0)
> +                     ret = -ENOENT;
> +             btrfs_release_path(&path);
> +             return ret;
> +     }
> +
> +     btrfs_release_path(&path);
> +
> +     key.objectid = owner;
> +     key.type = BTRFS_EXTENT_DATA_KEY;
> +     key.offset = 0;
> +
> +     ret = btrfs_search_slot(NULL, root, &key, &path, 0, 0);
> +     if (ret < 0) {
> +             btrfs_release_path(&path);
> +             return ret;
> +     }
> +
> +     while (1) {
> +             leaf = path.nodes[0];
> +             slot = path.slots[0];
> +
> +             if (slot >= btrfs_header_nritems(leaf)) {
> +                     ret = btrfs_next_leaf(root, &path);
> +                     if (ret) {
> +                             if (ret > 0)
> +                                     ret = 0;
> +                             break;
> +                     }
> +
> +                     leaf = path.nodes[0];
> +                     slot = path.slots[0];
> +             }
> +
> +             btrfs_item_key_to_cpu(leaf, &found_key, slot);
> +             if ((found_key.objectid != owner) ||
> +                     (found_key.type != BTRFS_EXTENT_DATA_KEY))
> +                     break;
> +
> +             fi = btrfs_item_ptr(leaf, slot,
> +                             struct btrfs_file_extent_item);
> +
> +             disk_bytenr = btrfs_file_extent_disk_bytenr(leaf, fi);
> +             if (disk_bytenr == bytenr) {
> +                     *offset_ret = found_key.offset;
> +                     ret = 0;
> +                     break;
> +             }
> +             path.slots[0]++;
> +     }
> +
> +     btrfs_release_path(&path);
> +     return ret;
> +}
> +
> +static int repair_unaligned_extent_recs(struct btrfs_trans_handle *trans,
> +                             struct btrfs_root *root,
> +                             struct btrfs_path *path,
> +                             struct inode_record *rec)
> +{
> +     int ret = 0;
> +     struct btrfs_key key;
> +     struct unaligned_extent_rec_t *urec;
> +     struct unaligned_extent_rec_t *tmp;
> +
> +     list_for_each_entry_safe(urec, tmp, &rec->unaligned_extent_recs, list) {
> +
> +             key.objectid = urec->owner;
> +             key.type = BTRFS_EXTENT_DATA_KEY;
> +             key.offset = urec->offset;
> +             fprintf(stderr, "delete file extent item [%llu,%llu]\n",
> +                                     urec->owner, urec->offset);
> +             ret = btrfs_delete_item(trans, root, &key);
> +             if (ret)
> +                     return ret;
> +
> +             list_del(&urec->list);
> +             free(urec);
> +     }
> +     rec->errors &= ~I_ERR_UNALIGNED_EXTENT_REC;
> +
> +     return ret;
> +}
> +
>  static int try_repair_inode(struct btrfs_root *root, struct inode_record 
> *rec)
>  {
>       struct btrfs_trans_handle *trans;
>       struct btrfs_path path;
>       int ret = 0;
>  
> +     /*
> +      * unaligned extent recs always lead to csum missing error, clean it
> +      */
> +     if ((rec->errors & I_ERR_SOME_CSUM_MISSING) &&
> +                     (rec->errors & I_ERR_UNALIGNED_EXTENT_REC))
> +             rec->errors &= ~I_ERR_SOME_CSUM_MISSING;
> +
> +
>       if (!(rec->errors & (I_ERR_DIR_ISIZE_WRONG |
>                            I_ERR_NO_ORPHAN_ITEM |
>                            I_ERR_LINK_COUNT_WRONG |
>                            I_ERR_NO_INODE_ITEM |
>                            I_ERR_FILE_EXTENT_DISCOUNT |
>                            I_ERR_FILE_NBYTES_WRONG |
> +                          I_ERR_UNALIGNED_EXTENT_REC |
>                            I_ERR_INLINE_RAM_BYTES_WRONG)))
>               return rec->errors;
>  
> @@ -2515,6 +2686,8 @@ static int try_repair_inode(struct btrfs_root *root, 
> struct inode_record *rec)
>               ret = repair_inode_nbytes(trans, root, &path, rec);
>       if (!ret && rec->errors & I_ERR_INLINE_RAM_BYTES_WRONG)
>               ret = repair_inline_ram_bytes(trans, root, &path, rec);
> +     if (!ret && rec->errors & I_ERR_UNALIGNED_EXTENT_REC)
> +             ret = repair_unaligned_extent_recs(trans, root, &path, rec);
>       btrfs_commit_transaction(trans, root);
>       btrfs_release_path(&path);
>       return ret;
> @@ -3128,6 +3301,8 @@ static int check_fs_root(struct btrfs_root *root,
>       struct cache_tree corrupt_blocks;
>       enum btrfs_tree_block_status status;
>       struct node_refs nrefs;
> +     struct unaligned_extent_rec_t *urec;
> +     struct unaligned_extent_rec_t *tmp;
>  
>       /*
>        * Reuse the corrupt_block cache tree to record corrupted tree block
> @@ -3151,6 +3326,30 @@ static int check_fs_root(struct btrfs_root *root,
>       cache_tree_init(&root_node.inode_cache);
>       memset(&nrefs, 0, sizeof(nrefs));
>  
> +     /*
> +      * Mode unaligned extent recs to corresponding inode record
> +      */
> +     list_for_each_entry_safe(urec, tmp,
> +                     &root->unaligned_extent_recs, list) {
> +             struct inode_record *inode;
> +
> +             inode = get_inode_rec(&root_node.inode_cache, urec->owner, 1);
> +
> +             if (IS_ERR_OR_NULL(inode)) {
> +                     fprintf(stderr,
> +                             "fail to get inode rec on [%llu,%llu]\n",
> +                             urec->objectid, urec->owner);
> +
> +                     list_del(&urec->list);
> +                     free(urec);
> +
> +                     continue;
> +             }
> +
> +             inode->errors |= I_ERR_UNALIGNED_EXTENT_REC;
> +             list_move(&urec->list, &inode->unaligned_extent_recs);
> +     }
> +
>       level = btrfs_header_level(root->node);
>       memset(wc->nodes, 0, sizeof(wc->nodes));
>       wc->nodes[level] = &root_node;
> @@ -7425,6 +7624,68 @@ static int prune_corrupt_blocks(struct btrfs_fs_info 
> *info)
>       return 0;
>  }
>  
> +static int record_unaligned_extent_rec(struct btrfs_fs_info *fs_info,
> +                                     struct extent_record *rec)
> +{
> +
> +     struct extent_backref *back, *tmp;
> +     struct data_backref *dback;
> +     struct btrfs_root *dest_root;
> +     struct btrfs_key key;
> +     struct unaligned_extent_rec_t *urec;
> +     LIST_HEAD(entries);
> +     int ret = 0;
> +
> +     fprintf(stderr, "record unaligned extent record on %llu %llu\n",
> +                     rec->start, rec->nr);
> +
> +     /*
> +      * Metadata is easy and the backrefs should always agree on bytenr and
> +      * size, if not we've got bigger issues.
> +      */
> +     if (rec->metadata)
> +             return 0;
> +
> +     rbtree_postorder_for_each_entry_safe(back, tmp,
> +                                          &rec->backref_tree, node) {
> +             if (back->full_backref || !back->is_data)
> +                     continue;
> +
> +             dback = to_data_backref(back);
> +
> +             key.objectid = dback->root;
> +             key.type = BTRFS_ROOT_ITEM_KEY;
> +             key.offset = (u64)-1;
> +
> +             dest_root = btrfs_read_fs_root(fs_info, &key);
> +
> +             /*
> +              * For non-exist root we just skip it
> +              */
> +             if (IS_ERR_OR_NULL(dest_root))
> +                     continue;
> +
> +             urec = malloc(sizeof(struct unaligned_extent_rec_t));
> +             if (!urec)
> +                     return -ENOMEM;
> +
> +             INIT_LIST_HEAD(&urec->list);
> +             urec->objectid = dest_root->objectid;
> +             urec->owner = dback->owner;
> +             urec->offset = 0;
> +             urec->bytenr = rec->start;
> +             ret = find_file_extent_offset_by_bytenr(dest_root,
> +                             dback->owner, rec->start, &urec->offset);
> +             if (ret) {
> +                     free(urec);
> +                     return ret;
> +             }
> +             list_add(&urec->list, &dest_root->unaligned_extent_recs);
> +     }
> +
> +     return ret;
> +}
> +
>  static int check_extent_refs(struct btrfs_root *root,
>                            struct cache_tree *extent_cache)
>  {
> @@ -7522,6 +7783,21 @@ static int check_extent_refs(struct btrfs_root *root,
>                       fix = 1;
>                       cur_err = 1;
>               }
> +
> +             if (!IS_ALIGNED(rec->start, root->fs_info->sectorsize)) {
> +                     fprintf(stderr, "unaligned extent rec on [%llu %llu]\n",
> +                             (unsigned long long)rec->start,
> +                             (unsigned long long)rec->nr);
> +                     ret = record_unaligned_extent_rec(root->fs_info, rec);
> +                     if (ret)
> +                             goto repair_abort;
> +
> +                     /*
> +                      * free extent record
> +                      */
> +                     goto next;
> +             }
> +
>               if (all_backpointers_checked(rec, 1)) {
>                       fprintf(stderr, "backpointer mismatch on [%llu %llu]\n",
>                               (unsigned long long)rec->start,
> @@ -7574,7 +7850,7 @@ static int check_extent_refs(struct btrfs_root *root,
>                               rec->start, rec->start + rec->max_size);
>                       cur_err = 1;
>               }
> -
> +next:
>               err = cur_err;
>               remove_cache_extent(extent_cache, cache);
>               free_all_extent_backrefs(rec);
> diff --git a/check/mode-original.h b/check/mode-original.h
> index ed995931fcd5..b23594863199 100644
> --- a/check/mode-original.h
> +++ b/check/mode-original.h
> @@ -155,6 +155,16 @@ struct file_extent_hole {
>       u64 len;
>  };
>  
> +struct unaligned_extent_rec_t {
> +     struct list_head list;
> +
> +     u64 objectid;
> +     u64 owner;
> +     u64 offset;
> +
> +     u64 bytenr;
> +};
> +
>  #define I_ERR_NO_INODE_ITEM          (1 << 0)
>  #define I_ERR_NO_ORPHAN_ITEM         (1 << 1)
>  #define I_ERR_DUP_INODE_ITEM         (1 << 2)
> @@ -169,6 +179,7 @@ struct file_extent_hole {
>  #define I_ERR_ODD_CSUM_ITEM          (1 << 11)
>  #define I_ERR_SOME_CSUM_MISSING              (1 << 12)
>  #define I_ERR_LINK_COUNT_WRONG               (1 << 13)
> +#define I_ERR_UNALIGNED_EXTENT_REC   (1 << 14)
>  #define I_ERR_FILE_EXTENT_TOO_LARGE  (1 << 15)
>  #define I_ERR_ODD_INODE_FLAGS                (1 << 16)
>  #define I_ERR_INLINE_RAM_BYTES_WRONG (1 << 17)
> @@ -185,6 +196,8 @@ struct inode_record {
>       unsigned int nodatasum:1;
>       int errors;
>  
> +     struct list_head unaligned_extent_recs;
> +
>       u64 ino;
>       u32 nlink;
>       u32 imode;
> diff --git a/ctree.h b/ctree.h
> index 2e0896390434..d0f441587f9f 100644
> --- a/ctree.h
> +++ b/ctree.h
> @@ -1177,6 +1177,8 @@ struct btrfs_root {
>       u32 type;
>       u64 last_inode_alloc;
>  
> +     struct list_head unaligned_extent_recs;
> +
>       /* the dirty list is only used by non-reference counted roots */
>       struct list_head dirty_list;
>       struct rb_node rb_node;
> diff --git a/disk-io.c b/disk-io.c
> index 992f4b870e9f..0dfd51ed87bf 100644
> --- a/disk-io.c
> +++ b/disk-io.c
> @@ -480,6 +480,7 @@ void btrfs_setup_root(struct btrfs_root *root, struct 
> btrfs_fs_info *fs_info,
>       root->last_inode_alloc = 0;
>  
>       INIT_LIST_HEAD(&root->dirty_list);
> +     INIT_LIST_HEAD(&root->unaligned_extent_recs);
>       memset(&root->root_key, 0, sizeof(root->root_key));
>       memset(&root->root_item, 0, sizeof(root->root_item));
>       root->root_key.objectid = objectid;
> 

Reply via email to