> -----邮件原件----- > 发件人: Stefan Hajnoczi <stefa...@redhat.com> > 发送时间: 2020年6月22日 20:14 > 收件人: Lin Ma <l...@suse.com> > 抄送: qemu-devel@nongnu.org; f...@euphon.net; kw...@redhat.com; > mre...@redhat.com; pbonz...@redhat.com > 主题: Re: [PATCH v2 3/3] scsi-disk: Add support for the GET LBA STATUS 16 > command > > On Wed, Jun 17, 2020 at 06:30:18PM +0800, Lin Ma wrote: > > Signed-off-by: Lin Ma <l...@suse.com> > > --- > > hw/scsi/scsi-disk.c | 90 > ++++++++++++++++++++++++++++++++++++++ > > include/block/accounting.h | 1 + > > include/scsi/constants.h | 1 + > > 3 files changed, 92 insertions(+) > > > > diff --git a/hw/scsi/scsi-disk.c b/hw/scsi/scsi-disk.c index > > 387503e11b..9e3002ddaf 100644 > > --- a/hw/scsi/scsi-disk.c > > +++ b/hw/scsi/scsi-disk.c > > @@ -1866,6 +1866,89 @@ static void > scsi_disk_emulate_write_data(SCSIRequest *req) > > } > > } > > > > +typedef struct GetLbaStatusCBData { > > + uint32_t num_blocks; > > + uint32_t is_deallocated; > > + SCSIDiskReq *r; > > +} GetLbaStatusCBData; > > + > > +static void scsi_get_lba_status_complete(void *opaque, int ret); > > + > > +static void scsi_get_lba_status_complete_noio(GetLbaStatusCBData > > +*data, int ret) { > > + SCSIDiskReq *r = data->r; > > + SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev); > > + > > + assert(r->req.aiocb == NULL); > > + > > + block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct, > > + s->qdev.blocksize, > BLOCK_ACCT_GET_LBA_STATUS); > > + > > + r->req.aiocb = blk_aio_get_lba_status(s->qdev.conf.blk, > > + r->req.cmd.lba * > s->qdev.blocksize, > > + s->qdev.blocksize, > > + > > +scsi_get_lba_status_complete, data); } > > + > > +static void scsi_get_lba_status_complete(void *opaque, int ret) { > > + GetLbaStatusCBData *data = opaque; > > + SCSIDiskReq *r = data->r; > > + SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev); > > + > > + assert(r->req.aiocb != NULL); > > + r->req.aiocb = NULL; > > + > > + aio_context_acquire(blk_get_aio_context(s->qdev.conf.blk)); > > + if (scsi_disk_req_check_error(r, ret, true)) { > > + g_free(data); > > + goto done; > > + } > > + > > + block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct); > > + scsi_req_unref(&r->req); > > + g_free(data); > > + > > +done: > > + aio_context_release(blk_get_aio_context(s->qdev.conf.blk)); > > +} > > + > > +static void scsi_disk_emulate_get_lba_status(SCSIRequest *req, > > +uint8_t *outbuf) { > > + SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req); > > + GetLbaStatusCBData *data; > > + uint32_t *num_blocks; > > + uint32_t *is_deallocated; > > + > > + data = g_new0(GetLbaStatusCBData, 1); > > + data->r = r; > > + num_blocks = &(data->num_blocks); > > + is_deallocated = &(data->is_deallocated); > > + > > + scsi_req_ref(&r->req); > > + scsi_get_lba_status_complete_noio(data, 0); > > scsi_get_lba_status_complete_noio() looks asynchronous. If the BlockDriver > yields in .bdrv_co_block_status() then the operation has not completed yet > when scsi_get_lba_status_complete_noio() returns. It is not safe to access the > GetLbaStatusCBData data until the async operation is complete. > > Also, scsi_get_lba_status_complete() calls g_free(data) so there is a > use-after-free when *num_blocks and *is_deallocated are accessed.
Got it, I'll fill the outbuf[] in the completion function in V3. > These issues can be solved by making this code asynchronous (similar to > read/write/flush/discard_zeroes/ioctl). outbuf[] will be filled in in the > completion > function before g_free(data) is called. I looked into block/io.c, The 'bdrv_co_pdiscard()', the 'bdrv_co_block_status' and the 'bdrv_co_flush()', They look similiar, They called corresponding bs->drv->bdrv_co_*() or the bs->drv->bdrv_aio_*() between pair of blk_inc/dec_in_flight(): The 'bdrv_co_pdiscard()' calls bs->drv->bdrv_co_pdiscard() or bs->drv->bdrv_aio_pdiscard() The 'bdrv_co_flush()' calls bs->drv->bdrv_co_flush*() or bs->drv->bdrv_aio_flush(). The 'bdrv_co_block_status' calls bs->drv->bdrv_co_block_status(). qemu contains the coroutine version of block_status, no aio version of block_status. About "making this code asynchronous", Well, In fact I havn't realized yet where the issue is. If what you mean is that make the 'bdrv_co_get_lba_status()' asynchronous, How about directly calling coroutine-based 'bdrv_co_block_status()' instead of 'bdrv_block_status()' in it? Or could you please suggest more detailed information? BTW, IMO the existing BlockDriver->bdrv_co_block_status() is enough, It's not necessary to implement a drv->bdrv_aio_get_block_status() in BlockDrivers(say qcow2 or raw), Am I right? I'm not familiar with qemu block layer and coroutine, Sorry for any inconvenience. > > + > > + /* > > + * 8 + 16 is the length in bytes of response header and > > + * one LBA status descriptor > > + */ > > + memset(outbuf, 0, 8 + 16); > > + outbuf[3] = 20; > > + outbuf[8] = (req->cmd.lba >> 56) & 0xff; > > + outbuf[9] = (req->cmd.lba >> 48) & 0xff; > > + outbuf[10] = (req->cmd.lba >> 40) & 0xff; > > + outbuf[11] = (req->cmd.lba >> 32) & 0xff; > > + outbuf[12] = (req->cmd.lba >> 24) & 0xff; > > + outbuf[13] = (req->cmd.lba >> 16) & 0xff; > > + outbuf[14] = (req->cmd.lba >> 8) & 0xff; > > + outbuf[15] = req->cmd.lba & 0xff; > > + outbuf[16] = (*num_blocks >> 24) & 0xff; > > + outbuf[17] = (*num_blocks >> 16) & 0xff; > > + outbuf[18] = (*num_blocks >> 8) & 0xff; > > + outbuf[19] = *num_blocks & 0xff; > > + outbuf[20] = *is_deallocated ? 1 : 0; > > SCSI defines 3 values and QEMU can represent all of them: > > 0 - mapped or unknown > 1 - deallocated > 2 - anchored > > See the BDRV_BLOCK_* constants in include/block/block.h. The is_deallocated > boolean is not enough to represent this state, but the > bdrv_block_status() return value can be used instead. > > > +} > > + > > static int32_t scsi_disk_emulate_command(SCSIRequest *req, uint8_t > > *buf) { > > SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req); @@ -2076,6 > > +2159,13 @@ static int32_t scsi_disk_emulate_command(SCSIRequest *req, > > uint8_t *buf) > > > > /* Protection, exponent and lowest lba field left blank. */ > > break; > > + } else if ((req->cmd.buf[1] & 31) == SAI_GET_LBA_STATUS) { > > + if (req->cmd.lba > s->qdev.max_lba) { > > + goto illegal_lba; > > + } > > + scsi_disk_emulate_get_lba_status(req, outbuf); > > + r->iov.iov_len = req->cmd.xfer; > > + return r->iov.iov_len; > > Is there something tricky going on here with iov_len that prevents us from > using > break here and sharing the functions normal return code path? > > > } > > trace_scsi_disk_emulate_command_SAI_unsupported(); > > goto illegal_request; > > diff --git a/include/block/accounting.h b/include/block/accounting.h > > index 878b4c3581..645014fb0b 100644 > > --- a/include/block/accounting.h > > +++ b/include/block/accounting.h > > @@ -38,6 +38,7 @@ enum BlockAcctType { > > BLOCK_ACCT_WRITE, > > BLOCK_ACCT_FLUSH, > > BLOCK_ACCT_UNMAP, > > + BLOCK_ACCT_GET_LBA_STATUS, > > BLOCK_MAX_IOTYPE, > > }; > > > > diff --git a/include/scsi/constants.h b/include/scsi/constants.h index > > 874176019e..b18377b214 100644 > > --- a/include/scsi/constants.h > > +++ b/include/scsi/constants.h > > @@ -154,6 +154,7 @@ > > * SERVICE ACTION IN subcodes > > */ > > #define SAI_READ_CAPACITY_16 0x10 > > +#define SAI_GET_LBA_STATUS 0x12 > > > > /* > > * READ POSITION service action codes > > -- > > 2.26.0 > >