Skip to content

Commit 2299cee

Browse files
calebsander authored and axboe committed
ublk: use copy_{to,from}_iter() for user copy
ublk_copy_user_pages()/ublk_copy_io_pages() currently use iov_iter_get_pages2() to extract the pages from the iov_iter and memcpy() between the bvec_iter and the iov_iter's pages one at a time. Switch to using copy_to_iter()/copy_from_iter() instead. This avoids the user page reference count increments and decrements, as well as the need to split the memcpy() at user page boundaries. It also simplifies the code considerably.

Ming reports a 40% throughput improvement when issuing I/O to the selftests null ublk server with zero-copy disabled.

Signed-off-by: Caleb Sander Mateos <[email protected]>
Reviewed-by: Ming Lei <[email protected]>
Signed-off-by: Jens Axboe <[email protected]>
1 parent 15638d5 commit 2299cee

1 file changed

Lines changed: 14 additions & 48 deletions

File tree

drivers/block/ublk_drv.c

Lines changed: 14 additions & 48 deletions
Original file line number | Diff line number | Diff line change
@@ -913,54 +913,43 @@ static const struct block_device_operations ub_fops = {
913913
.report_zones = ublk_report_zones,
914914
};
915915

916-
#define UBLK_MAX_PIN_PAGES 32
917-
918916
struct ublk_io_iter {
919-
struct page *pages[UBLK_MAX_PIN_PAGES];
920917
struct bio *bio;
921918
struct bvec_iter iter;
922919
};
923920

924-
/* return how many pages are copied */
925-
static void ublk_copy_io_pages(struct ublk_io_iter *data,
926-
size_t total, size_t pg_off, int dir)
921+
/* return how many bytes are copied */
922+
static size_t ublk_copy_io_pages(struct ublk_io_iter *data,
923+
struct iov_iter *uiter, int dir)
927924
{
928-
unsigned done = 0;
929-
unsigned pg_idx = 0;
925+
size_t done = 0;
930926

931-
while (done < total) {
927+
for (;;) {
932928
struct bio_vec bv = bio_iter_iovec(data->bio, data->iter);
933-
unsigned int bytes = min3(bv.bv_len, (unsigned)total - done,
934-
(unsigned)(PAGE_SIZE - pg_off));
935929
void *bv_buf = bvec_kmap_local(&bv);
936-
void *pg_buf = kmap_local_page(data->pages[pg_idx]);
930+
size_t copied;
937931

938932
if (dir == ITER_DEST)
939-
memcpy(pg_buf + pg_off, bv_buf, bytes);
933+
copied = copy_to_iter(bv_buf, bv.bv_len, uiter);
940934
else
941-
memcpy(bv_buf, pg_buf + pg_off, bytes);
935+
copied = copy_from_iter(bv_buf, bv.bv_len, uiter);
942936

943-
kunmap_local(pg_buf);
944937
kunmap_local(bv_buf);
945938

946-
/* advance page array */
947-
pg_off += bytes;
948-
if (pg_off == PAGE_SIZE) {
949-
pg_idx += 1;
950-
pg_off = 0;
951-
}
952-
953-
done += bytes;
939+
done += copied;
940+
if (copied < bv.bv_len)
941+
break;
954942

955943
/* advance bio */
956-
bio_advance_iter_single(data->bio, &data->iter, bytes);
944+
bio_advance_iter_single(data->bio, &data->iter, copied);
957945
if (!data->iter.bi_size) {
958946
data->bio = data->bio->bi_next;
959947
if (data->bio == NULL)
960948
break;
961949
data->iter = data->bio->bi_iter;
962950
}
963951
}
952+
return done;
964953
}
965954

966955
static bool ublk_advance_io_iter(const struct request *req,
@@ -988,34 +977,11 @@ static size_t ublk_copy_user_pages(const struct request *req,
988977
unsigned offset, struct iov_iter *uiter, int dir)
989978
{
990979
struct ublk_io_iter iter;
991-
size_t done = 0;
992980

993981
if (!ublk_advance_io_iter(req, &iter, offset))
994982
return 0;
995983

996-
while (iov_iter_count(uiter) && iter.bio) {
997-
unsigned nr_pages;
998-
ssize_t len;
999-
size_t off;
1000-
int i;
1001-
1002-
len = iov_iter_get_pages2(uiter, iter.pages,
1003-
iov_iter_count(uiter),
1004-
UBLK_MAX_PIN_PAGES, &off);
1005-
if (len <= 0)
1006-
return done;
1007-
1008-
ublk_copy_io_pages(&iter, len, off, dir);
1009-
nr_pages = DIV_ROUND_UP(len + off, PAGE_SIZE);
1010-
for (i = 0; i < nr_pages; i++) {
1011-
if (dir == ITER_DEST)
1012-
set_page_dirty(iter.pages[i]);
1013-
put_page(iter.pages[i]);
1014-
}
1015-
done += len;
1016-
}
1017-
1018-
return done;
984+
return ublk_copy_io_pages(&iter, uiter, dir);
1019985
}
1020986

1021987
static inline bool ublk_need_map_req(const struct request *req)

0 commit comments

Comments
 (0)