dio_submit and dio_submit_pad may produce several bios. This makes
processing of REQ_FUA complicated because in order to preserve correctness
we have to TAG each bio with FUA flag which is suboptimal.
Obviously there is a room for optimization here: once all bios was acknowledged
by lower layer we may issue empty barrier aka ->issue_flush().
post_submit call back is the place where we all bios completed already.

b1:FUA, b2:FUA, b3:FUA =>  b1,b2,b3,wait_for_bios,bX:FLUSH

This allow us to remove all this REQ_FORCE_{FLUSH,FUA} crap and

Signed-off-by: Dmitry Monakhov <dmonak...@openvz.org>
---
 drivers/block/ploop/io_direct.c | 48 +++++++++++++++++------------------------
 include/linux/ploop/ploop.h     |  2 ++
 2 files changed, 22 insertions(+), 28 deletions(-)

diff --git a/drivers/block/ploop/io_direct.c b/drivers/block/ploop/io_direct.c
index 195d318..752a9c3e 100644
--- a/drivers/block/ploop/io_direct.c
+++ b/drivers/block/ploop/io_direct.c
@@ -82,31 +82,13 @@ dio_submit(struct ploop_io *io, struct ploop_request * preq,
        sector_t sec, nsec;
        int err;
        struct bio_list_walk bw;
-       int preflush;
-       int postfua = 0;
+       int preflush = !!(rw & REQ_FLUSH);
+       int postflush = !!(rw & REQ_FUA);
        int write = !!(rw & REQ_WRITE);
 
        trace_submit(preq);
 
-       preflush = !!(rw & REQ_FLUSH);
-
-       if (test_and_clear_bit(PLOOP_REQ_FORCE_FLUSH, &preq->state))
-               preflush = 1;
-
-       if (test_and_clear_bit(PLOOP_REQ_FORCE_FUA, &preq->state))
-               postfua = 1;
-
-       if (!postfua && ploop_req_delay_fua_possible(rw, preq)) {
-
-               /* Mark req that delayed flush required */
-               set_bit(PLOOP_REQ_FORCE_FLUSH, &preq->state);
-       } else if (rw & REQ_FUA) {
-               postfua = 1;
-       }
-
        rw &= ~(REQ_FLUSH | REQ_FUA);
-
-
        bio_list_init(&bl);
 
        if (iblk == PLOOP_ZERO_INDEX)
@@ -237,13 +219,14 @@ flush_bio:
                        rw2 |= REQ_FLUSH;
                        preflush = 0;
                }
-               if (unlikely(postfua && !bl.head))
-                       rw2 |= REQ_FUA;
-
                ploop_acc_ff_out(preq->plo, rw2 | b->bi_rw);
                submit_bio(rw2, b);
        }
-
+       /* TODO: minor optimization is possible for single bio case */
+       if (postflush) {
+               set_bit(PLOOP_REQ_DEL_FLUSH, &preq->state);
+               ploop_add_post_submit(io, preq);
+       }
        ploop_complete_io_request(preq);
        return;
 
@@ -523,9 +506,10 @@ dio_convert_extent(struct ploop_io *io, struct 
ploop_request * preq)
                                              (loff_t)sec << 9, clu_siz);
 
        /* highly unlikely case: FUA coming to a block not provisioned yet */
-       if (!err && force_sync)
+       if (!err && force_sync) {
+               clear_bit(PLOOP_REQ_DEL_FLUSH, &preq->state);
                err = io->ops->sync(io);
-
+       }
        if (!force_sync) {
                spin_lock_irq(&plo->lock);
                io->io_count++;
@@ -546,7 +530,12 @@ dio_post_submit(struct ploop_io *io, struct ploop_request 
* preq)
        if (test_and_clear_bit(PLOOP_REQ_DEL_CONV, &preq->state))
                dio_convert_extent(io, preq);
 
+       if (test_and_clear_bit(PLOOP_REQ_DEL_FLUSH, &preq->state)) {
+               io->ops->issue_flush(io, preq);
+               return 1;
+       }
        return 0;
+
 }
 
 /* Submit the whole cluster. If preq contains only partial data
@@ -562,7 +551,6 @@ dio_submit_pad(struct ploop_io *io, struct ploop_request * 
preq,
        sector_t sec, end_sec, nsec, start, end;
        struct bio_list_walk bw;
        int err;
-
        bio_list_init(&bl);
 
        /* sec..end_sec is the range which we are going to write */
@@ -694,7 +682,11 @@ flush_bio:
                ploop_acc_ff_out(preq->plo, rw | b->bi_rw);
                submit_bio(rw, b);
        }
-
+       /* TODO: minor optimization is possible for single bio case */
+       if (preq->req_rw &  REQ_FUA) {
+               set_bit(PLOOP_REQ_DEL_FLUSH, &preq->state);
+               ploop_add_post_submit(io, preq);
+       }
        ploop_complete_io_request(preq);
        return;
 
diff --git a/include/linux/ploop/ploop.h b/include/linux/ploop/ploop.h
index 4c52a40..5076f16 100644
--- a/include/linux/ploop/ploop.h
+++ b/include/linux/ploop/ploop.h
@@ -472,6 +472,7 @@ enum
        PLOOP_REQ_PUSH_BACKUP, /* preq was ACKed by userspace push_backup */
        PLOOP_REQ_ALLOW_READS, /* READs are allowed for given req_cluster */
        PLOOP_REQ_DEL_CONV,    /* post_submit: conversion required */
+       PLOOP_REQ_DEL_FLUSH,   /* post_submit: REQ_FLUSH required */
        PLOOP_REQ_FSYNC_DONE,  /* fsync_thread() performed f_op->fsync() */
 };
 
@@ -482,6 +483,7 @@ enum
 #define PLOOP_REQ_ZERO_FL (1 << PLOOP_REQ_ZERO)
 #define PLOOP_REQ_POST_SUBMIT_FL (1 << PLOOP_REQ_POST_SUBMIT)
 #define PLOOP_REQ_DEL_CONV_FL (1 << PLOOP_REQ_DEL_CONV)
+#define PLOOP_REQ_DEL_FLUSH_FL (1 << PLOOP_REQ_DEL_FLUSH)
 
 enum
 {
-- 
1.8.3.1

_______________________________________________
Devel mailing list
Devel@openvz.org
https://lists.openvz.org/mailman/listinfo/devel

Reply via email to