qcow2: Merge the writing of the COW regions with the guest data
If the guest tries to write data that results on the allocation of a new cluster, instead of writing the guest data first and then the data from the COW regions, write everything together using one single I/O operation. This can improve the write performance by 25% or more, depending on several factors such as the media type, the cluster size and the I/O request size. Signed-off-by: Alberto Garcia <berto@igalia.com> Reviewed-by: Kevin Wolf <kwolf@redhat.com> Signed-off-by: Kevin Wolf <kwolf@redhat.com>
This commit is contained in:
parent
86b862c431
commit
ee22a9d869
@ -776,6 +776,7 @@ static int perform_cow(BlockDriverState *bs, QCowL2Meta *m)
|
|||||||
assert(start->nb_bytes <= UINT_MAX - end->nb_bytes);
|
assert(start->nb_bytes <= UINT_MAX - end->nb_bytes);
|
||||||
assert(start->nb_bytes + end->nb_bytes <= UINT_MAX - data_bytes);
|
assert(start->nb_bytes + end->nb_bytes <= UINT_MAX - data_bytes);
|
||||||
assert(start->offset + start->nb_bytes <= end->offset);
|
assert(start->offset + start->nb_bytes <= end->offset);
|
||||||
|
assert(!m->data_qiov || m->data_qiov->size == data_bytes);
|
||||||
|
|
||||||
if (start->nb_bytes == 0 && end->nb_bytes == 0) {
|
if (start->nb_bytes == 0 && end->nb_bytes == 0) {
|
||||||
return 0;
|
return 0;
|
||||||
@ -807,7 +808,7 @@ static int perform_cow(BlockDriverState *bs, QCowL2Meta *m)
|
|||||||
/* The part of the buffer where the end region is located */
|
/* The part of the buffer where the end region is located */
|
||||||
end_buffer = start_buffer + buffer_size - end->nb_bytes;
|
end_buffer = start_buffer + buffer_size - end->nb_bytes;
|
||||||
|
|
||||||
qemu_iovec_init(&qiov, 1);
|
qemu_iovec_init(&qiov, 2 + (m->data_qiov ? m->data_qiov->niov : 0));
|
||||||
|
|
||||||
qemu_co_mutex_unlock(&s->lock);
|
qemu_co_mutex_unlock(&s->lock);
|
||||||
/* First we read the existing data from both COW regions. We
|
/* First we read the existing data from both COW regions. We
|
||||||
@ -842,17 +843,36 @@ static int perform_cow(BlockDriverState *bs, QCowL2Meta *m)
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* And now we can write everything */
|
/* And now we can write everything. If we have the guest data we
|
||||||
qemu_iovec_reset(&qiov);
|
* can write everything in one single operation */
|
||||||
qemu_iovec_add(&qiov, start_buffer, start->nb_bytes);
|
if (m->data_qiov) {
|
||||||
ret = do_perform_cow_write(bs, m->alloc_offset, start->offset, &qiov);
|
qemu_iovec_reset(&qiov);
|
||||||
if (ret < 0) {
|
if (start->nb_bytes) {
|
||||||
goto fail;
|
qemu_iovec_add(&qiov, start_buffer, start->nb_bytes);
|
||||||
|
}
|
||||||
|
qemu_iovec_concat(&qiov, m->data_qiov, 0, data_bytes);
|
||||||
|
if (end->nb_bytes) {
|
||||||
|
qemu_iovec_add(&qiov, end_buffer, end->nb_bytes);
|
||||||
|
}
|
||||||
|
/* NOTE: we have a write_aio blkdebug event here followed by
|
||||||
|
* a cow_write one in do_perform_cow_write(), but there's only
|
||||||
|
* one single I/O operation */
|
||||||
|
BLKDBG_EVENT(bs->file, BLKDBG_WRITE_AIO);
|
||||||
|
ret = do_perform_cow_write(bs, m->alloc_offset, start->offset, &qiov);
|
||||||
|
} else {
|
||||||
|
/* If there's no guest data then write both COW regions separately */
|
||||||
|
qemu_iovec_reset(&qiov);
|
||||||
|
qemu_iovec_add(&qiov, start_buffer, start->nb_bytes);
|
||||||
|
ret = do_perform_cow_write(bs, m->alloc_offset, start->offset, &qiov);
|
||||||
|
if (ret < 0) {
|
||||||
|
goto fail;
|
||||||
|
}
|
||||||
|
|
||||||
|
qemu_iovec_reset(&qiov);
|
||||||
|
qemu_iovec_add(&qiov, end_buffer, end->nb_bytes);
|
||||||
|
ret = do_perform_cow_write(bs, m->alloc_offset, end->offset, &qiov);
|
||||||
}
|
}
|
||||||
|
|
||||||
qemu_iovec_reset(&qiov);
|
|
||||||
qemu_iovec_add(&qiov, end_buffer, end->nb_bytes);
|
|
||||||
ret = do_perform_cow_write(bs, m->alloc_offset, end->offset, &qiov);
|
|
||||||
fail:
|
fail:
|
||||||
qemu_co_mutex_lock(&s->lock);
|
qemu_co_mutex_lock(&s->lock);
|
||||||
|
|
||||||
|
@ -1575,6 +1575,44 @@ fail:
|
|||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Check if it's possible to merge a write request with the writing of
|
||||||
|
* the data from the COW regions */
|
||||||
|
static bool merge_cow(uint64_t offset, unsigned bytes,
|
||||||
|
QEMUIOVector *hd_qiov, QCowL2Meta *l2meta)
|
||||||
|
{
|
||||||
|
QCowL2Meta *m;
|
||||||
|
|
||||||
|
for (m = l2meta; m != NULL; m = m->next) {
|
||||||
|
/* If both COW regions are empty then there's nothing to merge */
|
||||||
|
if (m->cow_start.nb_bytes == 0 && m->cow_end.nb_bytes == 0) {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* The data (middle) region must be immediately after the
|
||||||
|
* start region */
|
||||||
|
if (l2meta_cow_start(m) + m->cow_start.nb_bytes != offset) {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* The end region must be immediately after the data (middle)
|
||||||
|
* region */
|
||||||
|
if (m->offset + m->cow_end.offset != offset + bytes) {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Make sure that adding both COW regions to the QEMUIOVector
|
||||||
|
* does not exceed IOV_MAX */
|
||||||
|
if (hd_qiov->niov > IOV_MAX - 2) {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
m->data_qiov = hd_qiov;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
static coroutine_fn int qcow2_co_pwritev(BlockDriverState *bs, uint64_t offset,
|
static coroutine_fn int qcow2_co_pwritev(BlockDriverState *bs, uint64_t offset,
|
||||||
uint64_t bytes, QEMUIOVector *qiov,
|
uint64_t bytes, QEMUIOVector *qiov,
|
||||||
int flags)
|
int flags)
|
||||||
@ -1657,16 +1695,22 @@ static coroutine_fn int qcow2_co_pwritev(BlockDriverState *bs, uint64_t offset,
|
|||||||
goto fail;
|
goto fail;
|
||||||
}
|
}
|
||||||
|
|
||||||
qemu_co_mutex_unlock(&s->lock);
|
/* If we need to do COW, check if it's possible to merge the
|
||||||
BLKDBG_EVENT(bs->file, BLKDBG_WRITE_AIO);
|
* writing of the guest data together with that of the COW regions.
|
||||||
trace_qcow2_writev_data(qemu_coroutine_self(),
|
* If it's not possible (or not necessary) then write the
|
||||||
cluster_offset + offset_in_cluster);
|
* guest data now. */
|
||||||
ret = bdrv_co_pwritev(bs->file,
|
if (!merge_cow(offset, cur_bytes, &hd_qiov, l2meta)) {
|
||||||
cluster_offset + offset_in_cluster,
|
qemu_co_mutex_unlock(&s->lock);
|
||||||
cur_bytes, &hd_qiov, 0);
|
BLKDBG_EVENT(bs->file, BLKDBG_WRITE_AIO);
|
||||||
qemu_co_mutex_lock(&s->lock);
|
trace_qcow2_writev_data(qemu_coroutine_self(),
|
||||||
if (ret < 0) {
|
cluster_offset + offset_in_cluster);
|
||||||
goto fail;
|
ret = bdrv_co_pwritev(bs->file,
|
||||||
|
cluster_offset + offset_in_cluster,
|
||||||
|
cur_bytes, &hd_qiov, 0);
|
||||||
|
qemu_co_mutex_lock(&s->lock);
|
||||||
|
if (ret < 0) {
|
||||||
|
goto fail;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
while (l2meta != NULL) {
|
while (l2meta != NULL) {
|
||||||
|
@ -343,6 +343,13 @@ typedef struct QCowL2Meta
|
|||||||
*/
|
*/
|
||||||
Qcow2COWRegion cow_end;
|
Qcow2COWRegion cow_end;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* The I/O vector with the data from the actual guest write request.
|
||||||
|
* If non-NULL, this is meant to be merged together with the data
|
||||||
|
* from @cow_start and @cow_end into one single write operation.
|
||||||
|
*/
|
||||||
|
QEMUIOVector *data_qiov;
|
||||||
|
|
||||||
/** Pointer to next L2Meta of the same write request */
|
/** Pointer to next L2Meta of the same write request */
|
||||||
struct QCowL2Meta *next;
|
struct QCowL2Meta *next;
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user