[Devel] [PATCH rh7] ploop: fix barriers for ordinary requests
Dmitry Monakhov
dmonakhov at openvz.org
Wed Jun 22 06:41:39 PDT 2016
Maxim Patlasov <mpatlasov at virtuozzo.com> writes:
> The way how io_direct.c handles FLUSH|FUA: b1:FLUSH,b2,b3,b4,b5:FLUSH|FUA
> is completely wrong: to make sure that b1:FLUSH made effect we have to
> wait for its completion. Similarly, even if we're sure that FUA will be
> processed as post-FLUSH (also dubious!), we have to wait for completion
> b1..b4 to make sure that that flush will cover them.
>
> The patch fixes all these issues pretty simple: let's mark outgouing
> bio-s with FLUSH|FUA based on those flags in *corresponing* incoming
> bio-s.
One more thing please see below.
>
> Signed-off-by: Maxim Patlasov <mpatlasov at virtuozzo.com>
> ---
> drivers/block/ploop/dev.c | 1 -
> drivers/block/ploop/io_direct.c | 47 ++++++++++++---------------------------
> 2 files changed, 15 insertions(+), 33 deletions(-)
>
> diff --git a/drivers/block/ploop/dev.c b/drivers/block/ploop/dev.c
> index 2ef1449..6b5702f 100644
> --- a/drivers/block/ploop/dev.c
> +++ b/drivers/block/ploop/dev.c
> @@ -498,7 +498,6 @@ ploop_bio_queue(struct ploop_device * plo, struct bio * bio,
> preq->req_sector = bio->bi_sector;
> preq->req_size = bio->bi_size >> 9;
> preq->req_rw = bio->bi_rw;
> - bio->bi_rw &= ~(REQ_FLUSH | REQ_FUA);
> preq->eng_state = PLOOP_E_ENTRY;
> preq->state = 0;
> preq->error = 0;
> diff --git a/drivers/block/ploop/io_direct.c b/drivers/block/ploop/io_direct.c
> index 6ef9cd8..84c9a48 100644
> --- a/drivers/block/ploop/io_direct.c
> +++ b/drivers/block/ploop/io_direct.c
> @@ -92,7 +92,6 @@ dio_submit(struct ploop_io *io, struct ploop_request * preq,
> int preflush;
> int postfua = 0;
> int write = !!(rw & REQ_WRITE);
> - int bio_num;
>
> trace_submit(preq);
>
> @@ -233,13 +232,13 @@ flush_bio:
> goto flush_bio;
> }
>
> + bio->bi_rw |= bw.cur->bi_rw & (REQ_FLUSH | REQ_FUA);
> bw.bv_off += copy;
> size -= copy >> 9;
> sec += copy >> 9;
> }
> ploop_extent_put(em);
>
> - bio_num = 0;
> while (bl.head) {
> struct bio * b = bl.head;
> unsigned long rw2 = rw;
> @@ -255,11 +254,10 @@ flush_bio:
> preflush = 0;
> }
> if (unlikely(postfua && !bl.head))
> - rw2 |= (REQ_FUA | ((bio_num) ? REQ_FLUSH : 0));
> + rw2 |= REQ_FUA;
>
> ploop_acc_ff_out(preq->plo, rw2 | b->bi_rw);
> - submit_bio(rw2, b);
> - bio_num++;
> + submit_bio(rw2 | b->bi_rw, b);
> }
>
> ploop_complete_io_request(preq);
> @@ -567,7 +565,6 @@ dio_submit_pad(struct ploop_io *io, struct ploop_request * preq,
> sector_t sec, end_sec, nsec, start, end;
> struct bio_list_walk bw;
> int err;
> - int preflush = !!(preq->req_rw & REQ_FLUSH);
>
> bio_list_init(&bl);
>
> @@ -598,14 +595,17 @@ dio_submit_pad(struct ploop_io *io, struct ploop_request * preq,
> while (sec < end_sec) {
> struct page * page;
> unsigned int poff, plen;
> + bool zero_page;
>
> if (sec < start) {
> + zero_page = true;
> page = ZERO_PAGE(0);
> poff = 0;
> plen = start - sec;
> if (plen > (PAGE_SIZE>>9))
> plen = (PAGE_SIZE>>9);
> } else if (sec >= end) {
> + zero_page = true;
> page = ZERO_PAGE(0);
> poff = 0;
> plen = end_sec - sec;
> @@ -614,6 +614,7 @@ dio_submit_pad(struct ploop_io *io, struct ploop_request * preq,
> } else {
> /* sec >= start && sec < end */
> struct bio_vec * bv;
> + zero_page = false;
>
> if (sec == start) {
> bw.cur = sbl->head;
> @@ -672,6 +673,10 @@ flush_bio:
> goto flush_bio;
> }
>
> + /* Handle FLUSH here, dio_post_submit will handle FUA */
submit_pad may be called w/o post_submit flag from here:
->dio_submit_alloc
if (io->files.em_tree->_get_extent) {
->dio_fallocate
->dio_submit_pad
..
}
> + if (!zero_page)
> + bio->bi_rw |= bw.cur->bi_rw & REQ_FLUSH;
> +
> bw.bv_off += (plen<<9);
> BUG_ON(plen == 0);
> sec += plen;
> @@ -688,13 +693,9 @@ flush_bio:
> b->bi_private = preq;
> b->bi_end_io = dio_endio_async;
>
> - rw = sbl->head->bi_rw | WRITE;
> - if (unlikely(preflush)) {
> - rw |= REQ_FLUSH;
> - preflush = 0;
> - }
> + rw = preq->req_rw & ~(REQ_FLUSH | REQ_FUA);
> ploop_acc_ff_out(preq->plo, rw | b->bi_rw);
> - submit_bio(rw, b);
> + submit_bio(rw | b->bi_rw, b);
> }
>
> ploop_complete_io_request(preq);
> @@ -1422,13 +1423,6 @@ dio_io_page(struct ploop_io * io, unsigned long rw,
> sector_t nsec;
> int err;
> int off;
> - int postfua;
> - int bio_num;
> - int preflush;
> -
> - preflush = !!(rw & REQ_FLUSH);
> - postfua = !!(rw & REQ_FUA);
> - rw &= ~(REQ_FUA|REQ_FLUSH);
>
> bio_list_init(&bl);
> bio = NULL;
> @@ -1481,27 +1475,16 @@ flush_bio:
> if (em)
> ploop_extent_put(em);
>
> - bio_num = 0;
> while (bl.head) {
> - unsigned long rw2 = rw;
> struct bio * b = bl.head;
> bl.head = b->bi_next;
>
> - if (unlikely(preflush)) {
> - rw2 |= REQ_FLUSH;
> - preflush = 0;
> - }
> -
> - if (unlikely(postfua && !bl.head))
> - rw2 |= (REQ_FUA | ((bio_num) ? REQ_FLUSH : 0));
> -
> b->bi_next = NULL;
> b->bi_end_io = dio_endio_async;
> b->bi_private = preq;
> atomic_inc(&preq->io_count);
> - ploop_acc_ff_out(preq->plo, rw2 | b->bi_rw);
> - submit_bio(rw2, b);
> - bio_num++;
> + ploop_acc_ff_out(preq->plo, rw | b->bi_rw);
> + submit_bio(rw, b);
> }
>
> ploop_complete_io_request(preq);
More information about the Devel
mailing list