Skip to content

Commit cd65869

Browse files
committed
io_uring: use iov_iter state save/restore helpers
Get rid of the need to do re-expand and revert on an iterator when we encounter a short IO, or failure that warrants a retry. Use the new state save/restore helpers instead.

We keep the iov_iter_state persistent across retries, if we need to restart the read or write operation. If there's a pending retry, the operation will always exit with the state correctly saved.

Signed-off-by: Jens Axboe <axboe@kernel.dk>
1 parent 8fb0f47 commit cd65869

File tree

1 file changed

+61
-21
lines changed

1 file changed

+61
-21
lines changed

fs/io_uring.c

Lines changed: 61 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -712,6 +712,7 @@ struct io_async_rw {
712712
struct iovec fast_iov[UIO_FASTIOV];
713713
const struct iovec *free_iovec;
714714
struct iov_iter iter;
715+
struct iov_iter_state iter_state;
715716
size_t bytes_done;
716717
struct wait_page_queue wpq;
717718
};
@@ -2608,8 +2609,7 @@ static bool io_resubmit_prep(struct io_kiocb *req)
26082609

26092610
if (!rw)
26102611
return !io_req_prep_async(req);
2611-
/* may have left rw->iter inconsistent on -EIOCBQUEUED */
2612-
iov_iter_revert(&rw->iter, req->result - iov_iter_count(&rw->iter));
2612+
iov_iter_restore(&rw->iter, &rw->iter_state);
26132613
return true;
26142614
}
26152615

@@ -3310,12 +3310,17 @@ static int io_setup_async_rw(struct io_kiocb *req, const struct iovec *iovec,
33103310
if (!force && !io_op_defs[req->opcode].needs_async_setup)
33113311
return 0;
33123312
if (!req->async_data) {
3313+
struct io_async_rw *iorw;
3314+
33133315
if (io_alloc_async_data(req)) {
33143316
kfree(iovec);
33153317
return -ENOMEM;
33163318
}
33173319

33183320
io_req_map_rw(req, iovec, fast_iov, iter);
3321+
iorw = req->async_data;
3322+
/* we've copied and mapped the iter, ensure state is saved */
3323+
iov_iter_save_state(&iorw->iter, &iorw->iter_state);
33193324
}
33203325
return 0;
33213326
}
@@ -3334,6 +3339,7 @@ static inline int io_rw_prep_async(struct io_kiocb *req, int rw)
33343339
iorw->free_iovec = iov;
33353340
if (iov)
33363341
req->flags |= REQ_F_NEED_CLEANUP;
3342+
iov_iter_save_state(&iorw->iter, &iorw->iter_state);
33373343
return 0;
33383344
}
33393345

@@ -3437,19 +3443,28 @@ static int io_read(struct io_kiocb *req, unsigned int issue_flags)
34373443
struct kiocb *kiocb = &req->rw.kiocb;
34383444
struct iov_iter __iter, *iter = &__iter;
34393445
struct io_async_rw *rw = req->async_data;
3440-
ssize_t io_size, ret, ret2;
34413446
bool force_nonblock = issue_flags & IO_URING_F_NONBLOCK;
3447+
struct iov_iter_state __state, *state;
3448+
ssize_t ret, ret2;
34423449

34433450
if (rw) {
34443451
iter = &rw->iter;
3452+
state = &rw->iter_state;
3453+
/*
3454+
* We come here from an earlier attempt, restore our state to
3455+
* match in case it doesn't. It's cheap enough that we don't
3456+
* need to make this conditional.
3457+
*/
3458+
iov_iter_restore(iter, state);
34453459
iovec = NULL;
34463460
} else {
34473461
ret = io_import_iovec(READ, req, &iovec, iter, !force_nonblock);
34483462
if (ret < 0)
34493463
return ret;
3464+
state = &__state;
3465+
iov_iter_save_state(iter, state);
34503466
}
3451-
io_size = iov_iter_count(iter);
3452-
req->result = io_size;
3467+
req->result = iov_iter_count(iter);
34533468

34543469
/* Ensure we clear previously set non-block flag */
34553470
if (!force_nonblock)
@@ -3463,7 +3478,7 @@ static int io_read(struct io_kiocb *req, unsigned int issue_flags)
34633478
return ret ?: -EAGAIN;
34643479
}
34653480

3466-
ret = rw_verify_area(READ, req->file, io_kiocb_ppos(kiocb), io_size);
3481+
ret = rw_verify_area(READ, req->file, io_kiocb_ppos(kiocb), req->result);
34673482
if (unlikely(ret)) {
34683483
kfree(iovec);
34693484
return ret;
@@ -3479,30 +3494,49 @@ static int io_read(struct io_kiocb *req, unsigned int issue_flags)
34793494
/* no retry on NONBLOCK nor RWF_NOWAIT */
34803495
if (req->flags & REQ_F_NOWAIT)
34813496
goto done;
3482-
/* some cases will consume bytes even on error returns */
3483-
iov_iter_reexpand(iter, iter->count + iter->truncated);
3484-
iov_iter_revert(iter, io_size - iov_iter_count(iter));
34853497
ret = 0;
34863498
} else if (ret == -EIOCBQUEUED) {
34873499
goto out_free;
3488-
} else if (ret <= 0 || ret == io_size || !force_nonblock ||
3500+
} else if (ret <= 0 || ret == req->result || !force_nonblock ||
34893501
(req->flags & REQ_F_NOWAIT) || !need_read_all(req)) {
34903502
/* read all, failed, already did sync or don't want to retry */
34913503
goto done;
34923504
}
34933505

3506+
/*
3507+
* Don't depend on the iter state matching what was consumed, or being
3508+
* untouched in case of error. Restore it and we'll advance it
3509+
* manually if we need to.
3510+
*/
3511+
iov_iter_restore(iter, state);
3512+
34943513
ret2 = io_setup_async_rw(req, iovec, inline_vecs, iter, true);
34953514
if (ret2)
34963515
return ret2;
34973516

34983517
iovec = NULL;
34993518
rw = req->async_data;
3500-
/* now use our persistent iterator, if we aren't already */
3501-
iter = &rw->iter;
3519+
/*
3520+
* Now use our persistent iterator and state, if we aren't already.
3521+
* We've restored and mapped the iter to match.
3522+
*/
3523+
if (iter != &rw->iter) {
3524+
iter = &rw->iter;
3525+
state = &rw->iter_state;
3526+
}
35023527

35033528
do {
3504-
io_size -= ret;
3529+
/*
3530+
* We end up here because of a partial read, either from
3531+
* above or inside this loop. Advance the iter by the bytes
3532+
* that were consumed.
3533+
*/
3534+
iov_iter_advance(iter, ret);
3535+
if (!iov_iter_count(iter))
3536+
break;
35053537
rw->bytes_done += ret;
3538+
iov_iter_save_state(iter, state);
3539+
35063540
/* if we can retry, do so with the callbacks armed */
35073541
if (!io_rw_should_retry(req)) {
35083542
kiocb->ki_flags &= ~IOCB_WAITQ;
@@ -3520,7 +3554,8 @@ static int io_read(struct io_kiocb *req, unsigned int issue_flags)
35203554
return 0;
35213555
/* we got some bytes, but not all. retry. */
35223556
kiocb->ki_flags &= ~IOCB_WAITQ;
3523-
} while (ret > 0 && ret < io_size);
3557+
iov_iter_restore(iter, state);
3558+
} while (ret > 0);
35243559
done:
35253560
kiocb_done(kiocb, ret, issue_flags);
35263561
out_free:
@@ -3543,19 +3578,24 @@ static int io_write(struct io_kiocb *req, unsigned int issue_flags)
35433578
struct kiocb *kiocb = &req->rw.kiocb;
35443579
struct iov_iter __iter, *iter = &__iter;
35453580
struct io_async_rw *rw = req->async_data;
3546-
ssize_t ret, ret2, io_size;
35473581
bool force_nonblock = issue_flags & IO_URING_F_NONBLOCK;
3582+
struct iov_iter_state __state, *state;
3583+
ssize_t ret, ret2;
35483584

35493585
if (rw) {
35503586
iter = &rw->iter;
3587+
state = &rw->iter_state;
3588+
iov_iter_restore(iter, state);
35513589
iovec = NULL;
35523590
} else {
35533591
ret = io_import_iovec(WRITE, req, &iovec, iter, !force_nonblock);
35543592
if (ret < 0)
35553593
return ret;
3594+
state = &__state;
3595+
iov_iter_save_state(iter, state);
35563596
}
3557-
io_size = iov_iter_count(iter);
3558-
req->result = io_size;
3597+
req->result = iov_iter_count(iter);
3598+
ret2 = 0;
35593599

35603600
/* Ensure we clear previously set non-block flag */
35613601
if (!force_nonblock)
@@ -3572,7 +3612,7 @@ static int io_write(struct io_kiocb *req, unsigned int issue_flags)
35723612
(req->flags & REQ_F_ISREG))
35733613
goto copy_iov;
35743614

3575-
ret = rw_verify_area(WRITE, req->file, io_kiocb_ppos(kiocb), io_size);
3615+
ret = rw_verify_area(WRITE, req->file, io_kiocb_ppos(kiocb), req->result);
35763616
if (unlikely(ret))
35773617
goto out_free;
35783618

@@ -3619,9 +3659,9 @@ static int io_write(struct io_kiocb *req, unsigned int issue_flags)
36193659
kiocb_done(kiocb, ret2, issue_flags);
36203660
} else {
36213661
copy_iov:
3622-
/* some cases will consume bytes even on error returns */
3623-
iov_iter_reexpand(iter, iter->count + iter->truncated);
3624-
iov_iter_revert(iter, io_size - iov_iter_count(iter));
3662+
iov_iter_restore(iter, state);
3663+
if (ret2 > 0)
3664+
iov_iter_advance(iter, ret2);
36253665
ret = io_setup_async_rw(req, iovec, inline_vecs, iter, false);
36263666
return ret ?: -EAGAIN;
36273667
}

0 commit comments

Comments
 (0)