On Thu, Aug 13, 2020 at 7:36 PM Kevin Wolf <kw...@redhat.com> wrote:

> Instead of implementing qemu-nbd --offset in the NBD code, just put a
> raw block node with the requested offset on top of the user image and
> rely on that doing the job.
>
> This does not only simplify the nbd_export_new() interface and bring it
> closer to the set of options that the nbd-server-add QMP command offers,
> but in fact it also eliminates a potential source for bugs in the NBD
> code which previously had to add the offset manually in all relevant
> places.
>

Just to make sure I understand this correctly -

qemu-nbd can work with:

    $ qemu-nbd 'json:{"driver": "file", "filename": "test.raw"}'

And:

    $ qemu-nbd 'json:{"driver": "raw", "file": {"driver": "file",
"filename": "test.raw"}}'

I assumed that we always create the raw node?

oVirt always uses the second form to make it easier to support offset,
size, and backing.
https://github.com/oVirt/ovirt-imageio/blob/2021164d064227d7c5e03c8da087adc66e3a577e/daemon/ovirt_imageio/_internal/qemu_nbd.py#L104

This also seems to be the way libvirt builds the nodes using -blockdev.

Do we have a way to visualize the internal node graph used by
qemu-nbd/qemu-img?

Nir

Signed-off-by: Kevin Wolf <kw...@redhat.com>
> ---
>  include/block/nbd.h |  4 ++--
>  blockdev-nbd.c      |  9 +--------
>  nbd/server.c        | 34 +++++++++++++++++-----------------
>  qemu-nbd.c          | 27 ++++++++++++---------------
>  4 files changed, 32 insertions(+), 42 deletions(-)
>
> diff --git a/include/block/nbd.h b/include/block/nbd.h
> index c8c5cb6b61..3846d2bac8 100644
> --- a/include/block/nbd.h
> +++ b/include/block/nbd.h
> @@ -329,8 +329,8 @@ typedef struct NBDExport NBDExport;
>  typedef struct NBDClient NBDClient;
>
>  BlockExport *nbd_export_create(BlockExportOptions *exp_args, Error
> **errp);
> -NBDExport *nbd_export_new(BlockDriverState *bs, uint64_t dev_offset,
> -                          uint64_t size, const char *name, const char
> *desc,
> +NBDExport *nbd_export_new(BlockDriverState *bs,
> +                          const char *name, const char *desc,
>                            const char *bitmap, bool readonly, bool shared,
>                            void (*close)(NBDExport *), bool writethrough,
>                            BlockBackend *on_eject_blk, Error **errp);
> diff --git a/blockdev-nbd.c b/blockdev-nbd.c
> index a1dc11bdd7..16cda3b052 100644
> --- a/blockdev-nbd.c
> +++ b/blockdev-nbd.c
> @@ -154,7 +154,6 @@ BlockExport *nbd_export_create(BlockExportOptions
> *exp_args, Error **errp)
>      BlockDriverState *bs = NULL;
>      BlockBackend *on_eject_blk;
>      NBDExport *exp = NULL;
> -    int64_t len;
>      AioContext *aio_context;
>
>      assert(exp_args->type == BLOCK_EXPORT_TYPE_NBD);
> @@ -192,12 +191,6 @@ BlockExport *nbd_export_create(BlockExportOptions
> *exp_args, Error **errp)
>
>      aio_context = bdrv_get_aio_context(bs);
>      aio_context_acquire(aio_context);
> -    len = bdrv_getlength(bs);
> -    if (len < 0) {
> -        error_setg_errno(errp, -len,
> -                         "Failed to determine the NBD export's length");
> -        goto out;
> -    }
>
>      if (!arg->has_writable) {
>          arg->writable = false;
> @@ -206,7 +199,7 @@ BlockExport *nbd_export_create(BlockExportOptions
> *exp_args, Error **errp)
>          arg->writable = false;
>      }
>
> -    exp = nbd_export_new(bs, 0, len, arg->name, arg->description,
> arg->bitmap,
> +    exp = nbd_export_new(bs, arg->name, arg->description, arg->bitmap,
>                           !arg->writable, !arg->writable,
>                           NULL, false, on_eject_blk, errp);
>      if (!exp) {
> diff --git a/nbd/server.c b/nbd/server.c
> index 774325dbe5..92360d1f08 100644
> --- a/nbd/server.c
> +++ b/nbd/server.c
> @@ -89,7 +89,6 @@ struct NBDExport {
>      BlockBackend *blk;
>      char *name;
>      char *description;
> -    uint64_t dev_offset;
>      uint64_t size;
>      uint16_t nbdflags;
>      QTAILQ_HEAD(, NBDClient) clients;
> @@ -1507,8 +1506,8 @@ static void nbd_eject_notifier(Notifier *n, void
> *data)
>      aio_context_release(aio_context);
>  }
>
> -NBDExport *nbd_export_new(BlockDriverState *bs, uint64_t dev_offset,
> -                          uint64_t size, const char *name, const char
> *desc,
> +NBDExport *nbd_export_new(BlockDriverState *bs,
> +                          const char *name, const char *desc,
>                            const char *bitmap, bool readonly, bool shared,
>                            void (*close)(NBDExport *), bool writethrough,
>                            BlockBackend *on_eject_blk, Error **errp)
> @@ -1516,9 +1515,17 @@ NBDExport *nbd_export_new(BlockDriverState *bs,
> uint64_t dev_offset,
>      AioContext *ctx;
>      BlockBackend *blk;
>      NBDExport *exp;
> +    int64_t size;
>      uint64_t perm;
>      int ret;
>
> +    size = bdrv_getlength(bs);
> +    if (size < 0) {
> +        error_setg_errno(errp, -size,
> +                         "Failed to determine the NBD export's length");
> +        return NULL;
> +    }
> +
>      exp = g_new0(NBDExport, 1);
>      exp->common = (BlockExport) {
>          .drv = &blk_exp_nbd,
> @@ -1553,8 +1560,6 @@ NBDExport *nbd_export_new(BlockDriverState *bs,
> uint64_t dev_offset,
>      exp->refcount = 1;
>      QTAILQ_INIT(&exp->clients);
>      exp->blk = blk;
> -    assert(dev_offset <= INT64_MAX);
> -    exp->dev_offset = dev_offset;
>      exp->name = g_strdup(name);
>      assert(!desc || strlen(desc) <= NBD_MAX_STRING_SIZE);
>      exp->description = g_strdup(desc);
> @@ -1569,7 +1574,7 @@ NBDExport *nbd_export_new(BlockDriverState *bs,
> uint64_t dev_offset,
>          exp->nbdflags |= (NBD_FLAG_SEND_TRIM | NBD_FLAG_SEND_WRITE_ZEROES
> |
>                            NBD_FLAG_SEND_FAST_ZERO);
>      }
> -    assert(size <= INT64_MAX - dev_offset);
> +    assert(size <= INT64_MAX);
>      exp->size = QEMU_ALIGN_DOWN(size, BDRV_SECTOR_SIZE);
>
>      if (bitmap) {
> @@ -1928,8 +1933,7 @@ static int coroutine_fn
> nbd_co_send_sparse_read(NBDClient *client,
>              stl_be_p(&chunk.length, pnum);
>              ret = nbd_co_send_iov(client, iov, 1, errp);
>          } else {
> -            ret = blk_pread(exp->blk, offset + progress + exp->dev_offset,
> -                            data + progress, pnum);
> +            ret = blk_pread(exp->blk, offset + progress, data + progress,
> pnum);
>              if (ret < 0) {
>                  error_setg_errno(errp, -ret, "reading from file failed");
>                  break;
> @@ -2303,8 +2307,7 @@ static coroutine_fn int nbd_do_cmd_read(NBDClient
> *client, NBDRequest *request,
>                                         data, request->len, errp);
>      }
>
> -    ret = blk_pread(exp->blk, request->from + exp->dev_offset, data,
> -                    request->len);
> +    ret = blk_pread(exp->blk, request->from, data, request->len);
>      if (ret < 0) {
>          return nbd_send_generic_reply(client, request->handle, ret,
>                                        "reading from file failed", errp);
> @@ -2339,7 +2342,7 @@ static coroutine_fn int nbd_do_cmd_cache(NBDClient
> *client, NBDRequest *request,
>
>      assert(request->type == NBD_CMD_CACHE);
>
> -    ret = blk_co_preadv(exp->blk, request->from + exp->dev_offset,
> request->len,
> +    ret = blk_co_preadv(exp->blk, request->from, request->len,
>                          NULL, BDRV_REQ_COPY_ON_READ | BDRV_REQ_PREFETCH);
>
>      return nbd_send_generic_reply(client, request->handle, ret,
> @@ -2370,8 +2373,7 @@ static coroutine_fn int nbd_handle_request(NBDClient
> *client,
>          if (request->flags & NBD_CMD_FLAG_FUA) {
>              flags |= BDRV_REQ_FUA;
>          }
> -        ret = blk_pwrite(exp->blk, request->from + exp->dev_offset,
> -                         data, request->len, flags);
> +        ret = blk_pwrite(exp->blk, request->from, data, request->len,
> flags);
>          return nbd_send_generic_reply(client, request->handle, ret,
>                                        "writing to file failed", errp);
>
> @@ -2386,8 +2388,7 @@ static coroutine_fn int nbd_handle_request(NBDClient
> *client,
>          if (request->flags & NBD_CMD_FLAG_FAST_ZERO) {
>              flags |= BDRV_REQ_NO_FALLBACK;
>          }
> -        ret = blk_pwrite_zeroes(exp->blk, request->from + exp->dev_offset,
> -                                request->len, flags);
> +        ret = blk_pwrite_zeroes(exp->blk, request->from, request->len,
> flags);
>          return nbd_send_generic_reply(client, request->handle, ret,
>                                        "writing to file failed", errp);
>
> @@ -2401,8 +2402,7 @@ static coroutine_fn int nbd_handle_request(NBDClient
> *client,
>                                        "flush failed", errp);
>
>      case NBD_CMD_TRIM:
> -        ret = blk_co_pdiscard(exp->blk, request->from + exp->dev_offset,
> -                              request->len);
> +        ret = blk_co_pdiscard(exp->blk, request->from, request->len);
>          if (ret == 0 && request->flags & NBD_CMD_FLAG_FUA) {
>              ret = blk_co_flush(exp->blk);
>          }
> diff --git a/qemu-nbd.c b/qemu-nbd.c
> index d2657b8db5..818c3f5d46 100644
> --- a/qemu-nbd.c
> +++ b/qemu-nbd.c
> @@ -523,7 +523,6 @@ int main(int argc, char **argv)
>      const char *port = NULL;
>      char *sockpath = NULL;
>      char *device = NULL;
> -    int64_t fd_size;
>      QemuOpts *sn_opts = NULL;
>      const char *sn_id_or_name = NULL;
>      const char *sopt = "hVb:o:p:rsnc:dvk:e:f:tl:x:T:D:B:L";
> @@ -1028,6 +1027,17 @@ int main(int argc, char **argv)
>      }
>      bs = blk_bs(blk);
>
> +    if (dev_offset) {
> +        QDict *raw_opts = qdict_new();
> +        qdict_put_str(raw_opts, "driver", "raw");
> +        qdict_put_str(raw_opts, "file", bs->node_name);
> +        qdict_put_int(raw_opts, "offset", dev_offset);
> +        bs = bdrv_open(NULL, NULL, raw_opts, flags, &error_fatal);
> +        blk_remove_bs(blk);
> +        blk_insert_bs(blk, bs, &error_fatal);
> +        bdrv_unref(bs);
> +    }
> +
>      blk_set_enable_write_cache(blk, !writethrough);
>
>      if (sn_opts) {
> @@ -1045,21 +1055,8 @@ int main(int argc, char **argv)
>      }
>
>      bs->detect_zeroes = detect_zeroes;
> -    fd_size = blk_getlength(blk);
> -    if (fd_size < 0) {
> -        error_report("Failed to determine the image length: %s",
> -                     strerror(-fd_size));
> -        exit(EXIT_FAILURE);
> -    }
> -
> -    if (dev_offset >= fd_size) {
> -        error_report("Offset (%" PRIu64 ") has to be smaller than the
> image "
> -                     "size (%" PRId64 ")", dev_offset, fd_size);
> -        exit(EXIT_FAILURE);
> -    }
> -    fd_size -= dev_offset;
>
> -    export = nbd_export_new(bs, dev_offset, fd_size, export_name,
> +    export = nbd_export_new(bs, export_name,
>                              export_description, bitmap, readonly, shared
> > 1,
>                              nbd_export_closed, writethrough, NULL,
>                              &error_fatal);
> --
> 2.25.4
>
>
>

Reply via email to