On Thu, Mar 12, 2026 at 2:24 PM Eugenio Perez Martin
<[email protected]> wrote:
>
> On Thu, Mar 12, 2026 at 4:58 AM Jason Wang <[email protected]> wrote:
> >
> > On Wed, Mar 11, 2026 at 3:08 AM Eugenio Pérez <[email protected]> wrote:
> > >
> > > Add the VDUSE_F_QUEUE_READY feature flag. This allows the kernel module
> > > to explicitly signal userspace when a specific virtqueue has been
> > > enabled.
> > >
> > > In scenarios like Live Migration of VirtIO net devices, the dataplane
> > > starts after the control virtqueue allowing QEMU to apply configuration
> > > in the destination device.
> > >
> > > Signed-off-by: Eugenio Pérez <[email protected]>
> > > ---
> > > v2:
> > > * Fix comment of vduse_dev_request.vq_ready
> > > * Set vq_ready before sending the message to the VDUSE userland
> > > instance, avoiding the need for SMP sync after receiving the message.
> > > ---
> > > drivers/vdpa/vdpa_user/vduse_dev.c | 28 +++++++++++++++++++++++++++-
> > > include/uapi/linux/vduse.h | 18 ++++++++++++++++++
> > > 2 files changed, 45 insertions(+), 1 deletion(-)
> > >
> > > diff --git a/drivers/vdpa/vdpa_user/vduse_dev.c
> > > b/drivers/vdpa/vdpa_user/vduse_dev.c
> > > index 17e0358d3a68..4f642b95a7cb 100644
> > > --- a/drivers/vdpa/vdpa_user/vduse_dev.c
> > > +++ b/drivers/vdpa/vdpa_user/vduse_dev.c
> > > @@ -9,6 +9,7 @@
> > > */
> > >
> > > #include "linux/virtio_net.h"
> > > +#include <linux/bits.h>
> > > #include <linux/cleanup.h>
> > > #include <linux/init.h>
> > > #include <linux/module.h>
> > > @@ -53,7 +54,7 @@
> > > #define IRQ_UNBOUND -1
> > >
> > > /* Supported VDUSE features */
> > > -static const uint64_t vduse_features;
> > > +static const uint64_t vduse_features = BIT_U64(VDUSE_F_QUEUE_READY);
> > >
> > > /*
> > > * VDUSE instance have not asked the vduse API version, so assume 0.
> > > @@ -120,6 +121,7 @@ struct vduse_dev {
> > > char *name;
> > > struct mutex lock;
> > > spinlock_t msg_lock;
> > > + u64 vduse_features;
> > > u64 msg_unique;
> > > u32 msg_timeout;
> > > wait_queue_head_t waitq;
> > > @@ -601,8 +603,29 @@ static void vduse_vdpa_set_vq_ready(struct
> > > vdpa_device *vdpa,
> > > {
> > > struct vduse_dev *dev = vdpa_to_vduse(vdpa);
> > > struct vduse_virtqueue *vq = dev->vqs[idx];
> > > + struct vduse_dev_msg msg = { 0 };
> > > + int r;
> > >
> > > vq->ready = ready;
> > > +
> > > + if (!(dev->vduse_features & BIT_U64(VDUSE_F_QUEUE_READY)))
> > > + return;
> > > +
> > > + msg.req.type = VDUSE_SET_VQ_READY;
> > > + msg.req.vq_ready.num = idx;
> > > + msg.req.vq_ready.ready = !!ready;
> > > +
> > > + r = vduse_dev_msg_sync(dev, &msg);
> > > +
> > > + if (r < 0) {
> > > + dev_dbg(&vdpa->dev, "device refuses to set vq %u ready
> > > %u",
> > > + idx, ready);
> > > +
> > > + /* We can't do better than break the device in this case
> > > */
> >
> > It's better to explain why we can't depend on vduse_dev_msg_sync() here.
> >
> > For example it did:
> >
> > if (unlikely(dev->broken))
> > return -EIO;
> >
> > init_waitqueue_head(&msg->waitq);
> > spin_lock(&dev->msg_lock);
> > if (unlikely(dev->broken)) {
> > spin_unlock(&dev->msg_lock);
> > return -EIO;
> > }
> >
> > and
> >
> > if (!msg->completed) {
> > list_del(&msg->list);
> > msg->resp.result = VDUSE_REQ_RESULT_FAILED;
> > /* Mark the device as malfunction when there is a timeout */
> > if (!ret)
> > vduse_dev_broken(dev);
> > }
> >
>
> I'm not sure I follow you here.
>
> We can't do better than breaking the device because the function
> returns no error state, and the caller does not expect an error code.
> Do you mean we can't depend on vduse_dev_msg_sync to call
> vduse_dev_broken(dev) by itself?
I think what I meant is that reset seems to be more heavyweight than suspend.
So if reset can fail, I don't see a reason to break the device only for a
suspend failure.
Thanks
>
> > > + spin_lock(&dev->msg_lock);
> > > + vduse_dev_broken(dev);
> > > + spin_unlock(&dev->msg_lock);
> > > + }
> > > }
> > >
> > > static bool vduse_vdpa_get_vq_ready(struct vdpa_device *vdpa, u16 idx)
> > > @@ -2078,6 +2101,9 @@ static int vduse_create_dev(struct vduse_dev_config
> > > *config,
> > > dev->device_features = config->features;
> > > dev->device_id = config->device_id;
> > > dev->vendor_id = config->vendor_id;
> > > + dev->vduse_features = config->vduse_features;
> > > + dev_dbg(vduse_ctrl_dev, "Creating device %s with features 0x%llx",
> > > + config->name, config->vduse_features);
> > >
> > > dev->nas = (dev->api_version < VDUSE_API_VERSION_1) ? 1 :
> > > config->nas;
> > > dev->as = kcalloc(dev->nas, sizeof(dev->as[0]), GFP_KERNEL);
> > > diff --git a/include/uapi/linux/vduse.h b/include/uapi/linux/vduse.h
> > > index e9b5f32a452d..7324faea5df4 100644
> > > --- a/include/uapi/linux/vduse.h
> > > +++ b/include/uapi/linux/vduse.h
> > > @@ -14,6 +14,9 @@
> > >
> > > #define VDUSE_API_VERSION_1 1
> > >
> > > +/* The VDUSE instance expects a request for vq ready */
> > > +#define VDUSE_F_QUEUE_READY 0
> > > +
> > > /*
> > > * Get the version of VDUSE API that kernel supported
> > > (VDUSE_API_VERSION).
> > > * This is used for future extension.
> > > @@ -330,6 +333,7 @@ enum vduse_req_type {
> > > VDUSE_SET_STATUS,
> > > VDUSE_UPDATE_IOTLB,
> > > VDUSE_SET_VQ_GROUP_ASID,
> > > + VDUSE_SET_VQ_READY,
> > > };
> > >
> > > /**
> > > @@ -377,6 +381,15 @@ struct vduse_iova_range_v2 {
> > > __u32 padding;
> > > };
> > >
> > > +/**
> > > + * struct vduse_vq_ready - Virtqueue ready request message
> > > + * @num: Virtqueue number
> > > + */
> > > +struct vduse_vq_ready {
> > > + __u32 num;
> > > + __u32 ready;
> > > +};
> > > +
> > > /**
> > > * struct vduse_dev_request - control request
> > > * @type: request type
> > > @@ -387,6 +400,7 @@ struct vduse_iova_range_v2 {
> > > * @iova: IOVA range for updating
> > > * @iova_v2: IOVA range for updating if API_VERSION >= 1
> > > * @vq_group_asid: ASID of a virtqueue group
> > > + * @vq_ready: Virtqueue ready request
> > > * @padding: padding
> > > *
> > > * Structure used by read(2) on /dev/vduse/$NAME.
> > > @@ -404,6 +418,10 @@ struct vduse_dev_request {
> > > */
> > > struct vduse_iova_range_v2 iova_v2;
> > > struct vduse_vq_group_asid vq_group_asid;
> > > +
> > > + /* Only if VDUSE_F_QUEUE_READY is negotiated */
> > > + struct vduse_vq_ready vq_ready;
> > > +
> > > __u32 padding[32];
> > > };
> > > };
> > > --
> > > 2.53.0
> > >
> >
> > Thanks
> >
>