Vladimir Sementsov-Ogievskiy ff812c5563 qcow2: handle_dependencies(): relax conflict detection
There is no conflict and no dependency if we have parallel writes to
different subclusters of one cluster when the cluster itself is already
allocated. So, relax extra dependency.

Measure performance:
First, prepare build/qemu-img-old and build/qemu-img-new images.

cd scripts/simplebench
./img_bench_templater.py

Paste the following to stdin of running script:

qemu_img=../../build/qemu-img-{old|new}
$qemu_img create -f qcow2 -o extended_l2=on /ssd/x.qcow2 1G
$qemu_img bench -c 100000 -d 8 [-s 2K|-s 2K -o 512|-s $((1024*2+512))] \
        -w -t none -n /ssd/x.qcow2

The result:

All results are in seconds

------------------  ---------  ---------
                    old        new
-s 2K               6.7 ± 15%  6.2 ± 12%
                                 -7%
-s 2K -o 512        13 ± 3%    11 ± 5%
                                 -16%
-s $((1024*2+512))  9.5 ± 4%   8.4
                                 -12%
------------------  ---------  ---------

So small writes are more independent now and that helps to keep deeper
io queue which improves performance.

271 iotest output becomes racy for three allocation in one cluster.
Second and third writes may finish in different order. Second and
third requests don't depend on each other any more. Still they both
depend on first request anyway. Filter out second and third write
offsets to cover both possible outputs.

Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@virtuozzo.com>
Message-Id: <20210824101517.59802-4-vsementsov@virtuozzo.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Reviewed-by: Hanna Reitz <hreitz@redhat.com>
[hreitz: s/ an / and /]
Signed-off-by: Hanna Reitz <hreitz@redhat.com>
2021-09-15 15:54:07 +02:00

906 lines
32 KiB
Bash
Executable File

#!/usr/bin/env bash
# group: rw auto
#
# Test qcow2 images with extended L2 entries
#
# Copyright (C) 2019-2020 Igalia, S.L.
# Author: Alberto Garcia <berto@igalia.com>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# creator
owner=berto@igalia.com
seq="$(basename $0)"
echo "QA output created by $seq"
here="$PWD"
status=1 # failure is the default!
_cleanup()
{
_cleanup_test_img
rm -f "$TEST_IMG.raw"
}
trap "_cleanup; exit \$status" 0 1 2 3 15
# get standard environment, filters and checks
. ./common.rc
. ./common.filter
_supported_fmt qcow2
_supported_proto file nfs
_supported_os Linux
_unsupported_imgopts extended_l2 compat=0.10 cluster_size data_file refcount_bits=1[^0-9]
l2_offset=$((0x40000))
_verify_img()
{
$QEMU_IMG compare "$TEST_IMG" "$TEST_IMG.raw" | grep -v 'Images are identical'
$QEMU_IMG check "$TEST_IMG" | _filter_qemu_img_check | \
grep -v 'No errors were found on the image'
}
# Compare the bitmap of an extended L2 entry against an expected value
_verify_l2_bitmap()
{
entry_no="$1" # L2 entry number, starting from 0
expected_alloc="$alloc" # Space-separated list of allocated subcluster indexes
expected_zero="$zero" # Space-separated list of zero subcluster indexes
offset=$(($l2_offset + $entry_no * 16))
entry=$(peek_file_be "$TEST_IMG" $offset 8)
offset=$(($offset + 8))
bitmap=$(peek_file_be "$TEST_IMG" $offset 8)
expected_bitmap=0
for bit in $expected_alloc; do
expected_bitmap=$(($expected_bitmap | (1 << $bit)))
done
for bit in $expected_zero; do
expected_bitmap=$(($expected_bitmap | (1 << (32 + $bit))))
done
printf -v expected_bitmap "%u" $expected_bitmap # Convert to unsigned
printf "L2 entry #%d: 0x%016x %016x\n" "$entry_no" "$entry" "$bitmap"
if [ "$bitmap" != "$expected_bitmap" ]; then
printf "ERROR: expecting bitmap 0x%016x\n" "$expected_bitmap"
fi
}
# This should be called as _run_test c=XXX sc=XXX off=XXX len=XXX cmd=XXX
# c: cluster number (0 if unset)
# sc: subcluster number inside cluster @c (0 if unset)
# off: offset inside subcluster @sc, in kilobytes (0 if unset)
# len: request length, passed directly to qemu-io (e.g: 256, 4k, 1M, ...)
# cmd: the command to pass to qemu-io, must be one of
# write -> write
# zero -> write -z
# unmap -> write -z -u
# compress -> write -c
# discard -> discard
_run_test()
{
unset c sc off len cmd
for var in "$@"; do eval "$var"; done
case "${cmd:-write}" in
zero)
cmd="write -q -z";;
unmap)
cmd="write -q -z -u";;
compress)
pat=$((${pat:-0} + 1))
cmd="write -q -c -P ${pat}";;
write)
pat=$((${pat:-0} + 1))
cmd="write -q -P ${pat}";;
discard)
cmd="discard -q";;
*)
echo "Unknown option $cmd"
exit 1;;
esac
c="${c:-0}"
sc="${sc:-0}"
off="${off:-0}"
offset="$(($c * 64 + $sc * 2 + $off))"
[ "$offset" != 0 ] && offset="${offset}k"
cmd="$cmd ${offset} ${len}"
raw_cmd=$(echo $cmd | sed s/-c//) # Raw images don't support -c
echo $cmd | sed 's/-P [0-9][0-9]\?/-P PATTERN/'
$QEMU_IO -c "$cmd" "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c "$raw_cmd" -f raw "$TEST_IMG.raw" | _filter_qemu_io
_verify_img
_verify_l2_bitmap "$c"
}
_reset_img()
{
size="$1"
$QEMU_IMG create -f raw "$TEST_IMG.raw" "$size" | _filter_img_create
if [ "$use_backing_file" = "yes" ]; then
$QEMU_IMG create -f raw "$TEST_IMG.base" "$size" | _filter_img_create
$QEMU_IO -c "write -q -P 0xFF 0 $size" -f raw "$TEST_IMG.base" | _filter_qemu_io
$QEMU_IO -c "write -q -P 0xFF 0 $size" -f raw "$TEST_IMG.raw" | _filter_qemu_io
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base" "$size"
else
_make_test_img -o extended_l2=on "$size"
fi
}
############################################################
############################################################
############################################################
# Test that writing to an image with subclusters produces the expected
# results, in images with and without backing files
for use_backing_file in yes no; do
echo
echo "### Standard write tests (backing file: $use_backing_file) ###"
echo
_reset_img 1M
### Write subcluster #0 (beginning of subcluster) ###
alloc="0"; zero=""
_run_test sc=0 len=1k
### Write subcluster #1 (middle of subcluster) ###
alloc="0 1"; zero=""
_run_test sc=1 off=1 len=512
### Write subcluster #2 (end of subcluster) ###
alloc="0 1 2"; zero=""
_run_test sc=2 off=1 len=1k
### Write subcluster #3 (full subcluster) ###
alloc="0 1 2 3"; zero=""
_run_test sc=3 len=2k
### Write subclusters #4-6 (full subclusters) ###
alloc="$(seq 0 6)"; zero=""
_run_test sc=4 len=6k
### Write subclusters #7-9 (partial subclusters) ###
alloc="$(seq 0 9)"; zero=""
_run_test sc=7 off=1 len=4k
### Write subcluster #16 (partial subcluster) ###
alloc="$(seq 0 9) 16"; zero=""
_run_test sc=16 len=1k
### Write subcluster #31-#33 (cluster overlap) ###
alloc="$(seq 0 9) 16 31"; zero=""
_run_test sc=31 off=1 len=4k
alloc="0 1" ; zero=""
_verify_l2_bitmap 1
### Zero subcluster #1
alloc="0 $(seq 2 9) 16 31"; zero="1"
_run_test sc=1 len=2k cmd=zero
### Zero cluster #0
alloc=""; zero="$(seq 0 31)"
_run_test sc=0 len=64k cmd=zero
### Fill cluster #0 with data
alloc="$(seq 0 31)"; zero=""
_run_test sc=0 len=64k
### Zero and unmap half of cluster #0 (this won't unmap it)
alloc="$(seq 16 31)"; zero="$(seq 0 15)"
_run_test sc=0 len=32k cmd=unmap
### Zero and unmap cluster #0
alloc=""; zero="$(seq 0 31)"
_run_test sc=0 len=64k cmd=unmap
### Write subcluster #1 (middle of subcluster)
alloc="1"; zero="0 $(seq 2 31)"
_run_test sc=1 off=1 len=512
### Fill cluster #0 with data
alloc="$(seq 0 31)"; zero=""
_run_test sc=0 len=64k
### Discard cluster #0
alloc=""; zero="$(seq 0 31)"
_run_test sc=0 len=64k cmd=discard
### Write compressed data to cluster #0
alloc=""; zero=""
_run_test sc=0 len=64k cmd=compress
### Write subcluster #1 (middle of subcluster)
alloc="$(seq 0 31)"; zero=""
_run_test sc=1 off=1 len=512
done
############################################################
############################################################
############################################################
# calculate_l2_meta() checks if none of the clusters affected by a
# write operation need COW or changes to their L2 metadata and simply
# returns when they don't. This is a test for that optimization.
# Here clusters #0-#3 are overwritten but only #1 and #2 need changes.
echo
echo '### Overwriting several clusters without COW ###'
echo
use_backing_file="no" _reset_img 1M
# Write cluster #0, subclusters #12-#31
alloc="$(seq 12 31)"; zero=""
_run_test sc=12 len=40k
# Write cluster #1, subcluster #13
alloc="13"; zero=""
_run_test c=1 sc=13 len=2k
# Zeroize cluster #2, subcluster #14
alloc="14"; zero=""
_run_test c=2 sc=14 len=2k
alloc=""; zero="14"
_run_test c=2 sc=14 len=2k cmd=zero
# Write cluster #3, subclusters #0-#16
alloc="$(seq 0 16)"; zero=""
_run_test c=3 sc=0 len=34k
# Write from cluster #0, subcluster #12 to cluster #3, subcluster #11
alloc="$(seq 12 31)"; zero=""
_run_test sc=12 len=192k
alloc="$(seq 0 31)"; zero=""
_verify_l2_bitmap 1
_verify_l2_bitmap 2
alloc="$(seq 0 16)"; zero=""
_verify_l2_bitmap 3
############################################################
############################################################
############################################################
# Test different patterns of writing zeroes
for use_backing_file in yes no; do
echo
echo "### Writing zeroes 1: unallocated clusters (backing file: $use_backing_file) ###"
echo
# Note that the image size is not a multiple of the cluster size
_reset_img 2083k
# Cluster-aligned request from clusters #0 to #2
alloc=""; zero="$(seq 0 31)"
_run_test c=0 sc=0 len=192k cmd=zero
_verify_l2_bitmap 1
_verify_l2_bitmap 2
# Subcluster-aligned request from clusters #3 to #5
alloc=""; zero="$(seq 16 31)"
_run_test c=3 sc=16 len=128k cmd=zero
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 4
alloc=""; zero="$(seq 0 15)"
_verify_l2_bitmap 5
# Unaligned request from clusters #6 to #8
if [ "$use_backing_file" = "yes" ]; then
alloc="15"; zero="$(seq 16 31)" # copy-on-write happening here
else
alloc=""; zero="$(seq 15 31)"
fi
_run_test c=6 sc=15 off=1 len=128k cmd=zero
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 7
if [ "$use_backing_file" = "yes" ]; then
alloc="15"; zero="$(seq 0 14)" # copy-on-write happening here
else
alloc=""; zero="$(seq 0 15)"
fi
_verify_l2_bitmap 8
echo
echo "### Writing zeroes 2: allocated clusters (backing file: $use_backing_file) ###"
echo
alloc="$(seq 0 31)"; zero=""
_run_test c=9 sc=0 len=576k
_verify_l2_bitmap 10
_verify_l2_bitmap 11
_verify_l2_bitmap 12
_verify_l2_bitmap 13
_verify_l2_bitmap 14
_verify_l2_bitmap 15
_verify_l2_bitmap 16
_verify_l2_bitmap 17
# Cluster-aligned request from clusters #9 to #11
alloc=""; zero="$(seq 0 31)"
_run_test c=9 sc=0 len=192k cmd=zero
_verify_l2_bitmap 10
_verify_l2_bitmap 11
# Subcluster-aligned request from clusters #12 to #14
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=12 sc=16 len=128k cmd=zero
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 13
alloc="$(seq 16 31)"; zero="$(seq 0 15)"
_verify_l2_bitmap 14
# Unaligned request from clusters #15 to #17
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=15 sc=15 off=1 len=128k cmd=zero
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 16
alloc="$(seq 15 31)"; zero="$(seq 0 14)"
_verify_l2_bitmap 17
echo
echo "### Writing zeroes 3: compressed clusters (backing file: $use_backing_file) ###"
echo
alloc=""; zero=""
for c in $(seq 18 28); do
_run_test c=$c sc=0 len=64k cmd=compress
done
# Cluster-aligned request from clusters #18 to #20
alloc=""; zero="$(seq 0 31)"
_run_test c=18 sc=0 len=192k cmd=zero
_verify_l2_bitmap 19
_verify_l2_bitmap 20
# Subcluster-aligned request from clusters #21 to #23.
# We cannot partially zero a compressed cluster so the code
# returns -ENOTSUP, which means copy-on-write of the compressed
# data and fill the rest with actual zeroes on disk.
# TODO: cluster #22 should use the 'all zeroes' bits.
alloc="$(seq 0 31)"; zero=""
_run_test c=21 sc=16 len=128k cmd=zero
_verify_l2_bitmap 22
_verify_l2_bitmap 23
# Unaligned request from clusters #24 to #26
# In this case QEMU internally sends a 1k request followed by a
# subcluster-aligned 128k request. The first request decompresses
# cluster #24, but that's not enough to perform the second request
# efficiently because it partially writes to cluster #26 (which is
# compressed) so we hit the same problem as before.
alloc="$(seq 0 31)"; zero=""
_run_test c=24 sc=15 off=1 len=129k cmd=zero
_verify_l2_bitmap 25
_verify_l2_bitmap 26
# Unaligned request from clusters #27 to #29
# Similar to the previous case, but this time the tail of the
# request does not correspond to a compressed cluster, so it can
# be zeroed efficiently.
# Note that the very last subcluster is partially written, so if
# there's a backing file we need to perform cow.
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=27 sc=15 off=1 len=128k cmd=zero
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 28
if [ "$use_backing_file" = "yes" ]; then
alloc="15"; zero="$(seq 0 14)" # copy-on-write happening here
else
alloc=""; zero="$(seq 0 15)"
fi
_verify_l2_bitmap 29
echo
echo "### Writing zeroes 4: other tests (backing file: $use_backing_file) ###"
echo
# Unaligned request in the middle of cluster #30.
# If there's a backing file we need to allocate and do
# copy-on-write on the partially zeroed subclusters.
# If not we can set the 'all zeroes' bit on them.
if [ "$use_backing_file" = "yes" ]; then
alloc="15 19"; zero="$(seq 16 18)" # copy-on-write happening here
else
alloc=""; zero="$(seq 15 19)"
fi
_run_test c=30 sc=15 off=1 len=8k cmd=zero
# Fill the last cluster with zeroes, up to the end of the image
# (the image size is not a multiple of the cluster or subcluster size).
alloc=""; zero="$(seq 0 17)"
_run_test c=32 sc=0 len=35k cmd=zero
done
############################################################
############################################################
############################################################
# Zero + unmap
for use_backing_file in yes no; do
echo
echo "### Zero + unmap 1: allocated clusters (backing file: $use_backing_file) ###"
echo
# Note that the image size is not a multiple of the cluster size
_reset_img 2083k
alloc="$(seq 0 31)"; zero=""
_run_test c=9 sc=0 len=576k
_verify_l2_bitmap 10
_verify_l2_bitmap 11
_verify_l2_bitmap 12
_verify_l2_bitmap 13
_verify_l2_bitmap 14
_verify_l2_bitmap 15
_verify_l2_bitmap 16
_verify_l2_bitmap 17
# Cluster-aligned request from clusters #9 to #11
alloc=""; zero="$(seq 0 31)"
_run_test c=9 sc=0 len=192k cmd=unmap
_verify_l2_bitmap 10
_verify_l2_bitmap 11
# Subcluster-aligned request from clusters #12 to #14
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=12 sc=16 len=128k cmd=unmap
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 13
alloc="$(seq 16 31)"; zero="$(seq 0 15)"
_verify_l2_bitmap 14
# Unaligned request from clusters #15 to #17
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=15 sc=15 off=1 len=128k cmd=unmap
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 16
alloc="$(seq 15 31)"; zero="$(seq 0 14)"
_verify_l2_bitmap 17
echo
echo "### Zero + unmap 2: compressed clusters (backing file: $use_backing_file) ###"
echo
alloc=""; zero=""
for c in $(seq 18 28); do
_run_test c=$c sc=0 len=64k cmd=compress
done
# Cluster-aligned request from clusters #18 to #20
alloc=""; zero="$(seq 0 31)"
_run_test c=18 sc=0 len=192k cmd=unmap
_verify_l2_bitmap 19
_verify_l2_bitmap 20
# Subcluster-aligned request from clusters #21 to #23.
# We cannot partially zero a compressed cluster so the code
# returns -ENOTSUP, which means copy-on-write of the compressed
# data and fill the rest with actual zeroes on disk.
# TODO: cluster #22 should use the 'all zeroes' bits.
alloc="$(seq 0 31)"; zero=""
_run_test c=21 sc=16 len=128k cmd=unmap
_verify_l2_bitmap 22
_verify_l2_bitmap 23
# Unaligned request from clusters #24 to #26
# In this case QEMU internally sends a 1k request followed by a
# subcluster-aligned 128k request. The first request decompresses
# cluster #24, but that's not enough to perform the second request
# efficiently because it partially writes to cluster #26 (which is
# compressed) so we hit the same problem as before.
alloc="$(seq 0 31)"; zero=""
_run_test c=24 sc=15 off=1 len=129k cmd=unmap
_verify_l2_bitmap 25
_verify_l2_bitmap 26
# Unaligned request from clusters #27 to #29
# Similar to the previous case, but this time the tail of the
# request does not correspond to a compressed cluster, so it can
# be zeroed efficiently.
# Note that the very last subcluster is partially written, so if
# there's a backing file we need to perform cow.
alloc="$(seq 0 15)"; zero="$(seq 16 31)"
_run_test c=27 sc=15 off=1 len=128k cmd=unmap
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 28
if [ "$use_backing_file" = "yes" ]; then
alloc="15"; zero="$(seq 0 14)" # copy-on-write happening here
else
alloc=""; zero="$(seq 0 15)"
fi
_verify_l2_bitmap 29
done
############################################################
############################################################
############################################################
# Test qcow2_cluster_discard() with full and normal discards
for use_backing_file in yes no; do
echo
echo "### Discarding clusters with non-zero bitmaps (backing file: $use_backing_file) ###"
echo
if [ "$use_backing_file" = "yes" ]; then
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base" 1M
else
_make_test_img -o extended_l2=on 1M
fi
# Write clusters #0-#2 and then discard them
$QEMU_IO -c 'write -q 0 128k' "$TEST_IMG"
$QEMU_IO -c 'discard -q 0 128k' "$TEST_IMG"
# 'qemu-io discard' doesn't do a full discard, it zeroizes the
# cluster, so both clusters have all zero bits set now
alloc=""; zero="$(seq 0 31)"
_verify_l2_bitmap 0
_verify_l2_bitmap 1
# Now mark the 2nd half of the subclusters from cluster #0 as unallocated
poke_file "$TEST_IMG" $(($l2_offset+8)) "\x00\x00"
# Discard cluster #0 again to see how the zero bits have changed
$QEMU_IO -c 'discard -q 0 64k' "$TEST_IMG"
# And do a full discard of cluster #1 by shrinking and growing the image
$QEMU_IMG resize --shrink "$TEST_IMG" 64k
$QEMU_IMG resize "$TEST_IMG" 1M
# A normal discard sets all 'zero' bits only if the image has a
# backing file, otherwise it won't touch them.
if [ "$use_backing_file" = "yes" ]; then
alloc=""; zero="$(seq 0 31)"
else
alloc=""; zero="$(seq 0 15)"
fi
_verify_l2_bitmap 0
# A full discard should clear the L2 entry completely. However
# when growing an image with a backing file the new clusters are
# zeroized to hide the stale data from the backing file
if [ "$use_backing_file" = "yes" ]; then
alloc=""; zero="$(seq 0 31)"
else
alloc=""; zero=""
fi
_verify_l2_bitmap 1
done
############################################################
############################################################
############################################################
# Test that corrupted L2 entries are detected in both read and write
# operations
for corruption_test_cmd in read write; do
echo
echo "### Corrupted L2 entries - $corruption_test_cmd test (allocated) ###"
echo
echo "# 'cluster is zero' bit set on the standard cluster descriptor"
echo
# We actually don't consider this a corrupted image.
# The 'cluster is zero' bit is unused in extended L2 entries so
# QEMU ignores it.
# TODO: maybe treat the image as corrupted and make qemu-img check fix it?
_make_test_img -o extended_l2=on 1M
$QEMU_IO -c 'write -q -P 0x11 0 2k' "$TEST_IMG"
poke_file "$TEST_IMG" $(($l2_offset+7)) "\x01"
alloc="0"; zero=""
_verify_l2_bitmap 0
$QEMU_IO -c "$corruption_test_cmd -q -P 0x11 0 1k" "$TEST_IMG"
if [ "$corruption_test_cmd" = "write" ]; then
alloc="0"; zero=""
fi
_verify_l2_bitmap 0
echo
echo "# Both 'subcluster is zero' and 'subcluster is allocated' bits set"
echo
_make_test_img -o extended_l2=on 1M
# Write from the middle of cluster #0 to the middle of cluster #2
$QEMU_IO -c 'write -q 32k 128k' "$TEST_IMG"
# Corrupt the L2 entry from cluster #1
poke_file_be "$TEST_IMG" $(($l2_offset+24)) 4 1
alloc="$(seq 0 31)"; zero="0"
_verify_l2_bitmap 1
$QEMU_IO -c "$corruption_test_cmd 0 192k" "$TEST_IMG"
echo
echo "### Corrupted L2 entries - $corruption_test_cmd test (unallocated) ###"
echo
echo "# 'cluster is zero' bit set on the standard cluster descriptor"
echo
# We actually don't consider this a corrupted image.
# The 'cluster is zero' bit is unused in extended L2 entries so
# QEMU ignores it.
# TODO: maybe treat the image as corrupted and make qemu-img check fix it?
_make_test_img -o extended_l2=on 1M
# We want to modify the (empty) L2 entry from cluster #0,
# but we write to #4 in order to initialize the L2 table first
$QEMU_IO -c 'write -q 256k 1k' "$TEST_IMG"
poke_file "$TEST_IMG" $(($l2_offset+7)) "\x01"
alloc=""; zero=""
_verify_l2_bitmap 0
$QEMU_IO -c "$corruption_test_cmd -q 0 1k" "$TEST_IMG"
if [ "$corruption_test_cmd" = "write" ]; then
alloc="0"; zero=""
fi
_verify_l2_bitmap 0
echo
echo "# 'subcluster is allocated' bit set"
echo
_make_test_img -o extended_l2=on 1M
# We want to corrupt the (empty) L2 entry from cluster #0,
# but we write to #4 in order to initialize the L2 table first
$QEMU_IO -c 'write -q 256k 1k' "$TEST_IMG"
poke_file "$TEST_IMG" $(($l2_offset+15)) "\x01"
alloc="0"; zero=""
_verify_l2_bitmap 0
$QEMU_IO -c "$corruption_test_cmd 0 1k" "$TEST_IMG"
echo
echo "# Both 'subcluster is zero' and 'subcluster is allocated' bits set"
echo
_make_test_img -o extended_l2=on 1M
# We want to corrupt the (empty) L2 entry from cluster #1,
# but we write to #4 in order to initialize the L2 table first
$QEMU_IO -c 'write -q 256k 1k' "$TEST_IMG"
# Corrupt the L2 entry from cluster #1
poke_file_be "$TEST_IMG" $(($l2_offset+24)) 8 $(((1 << 32) | 1))
alloc="0"; zero="0"
_verify_l2_bitmap 1
$QEMU_IO -c "$corruption_test_cmd 0 192k" "$TEST_IMG"
echo
echo "### Compressed cluster with subcluster bitmap != 0 - $corruption_test_cmd test ###"
echo
# We actually don't consider this a corrupted image.
# The bitmap in compressed clusters is unused so QEMU should just ignore it.
_make_test_img -o extended_l2=on 1M
$QEMU_IO -c 'write -q -P 11 -c 0 64k' "$TEST_IMG"
# Change the L2 bitmap to allocate subcluster #31 and zeroize subcluster #0
poke_file "$TEST_IMG" $(($l2_offset+11)) "\x01\x80"
alloc="31"; zero="0"
_verify_l2_bitmap 0
$QEMU_IO -c "$corruption_test_cmd -P 11 0 64k" "$TEST_IMG" | _filter_qemu_io
# Writing allocates a new uncompressed cluster so we get a new bitmap
if [ "$corruption_test_cmd" = "write" ]; then
alloc="$(seq 0 31)"; zero=""
fi
_verify_l2_bitmap 0
done
############################################################
############################################################
############################################################
echo
echo "### Detect and repair unaligned clusters ###"
echo
# Create a backing file and fill it with data
$QEMU_IMG create -f raw "$TEST_IMG.base" 128k | _filter_img_create
$QEMU_IO -c "write -q -P 0xff 0 128k" -f raw "$TEST_IMG.base" | _filter_qemu_io
echo "# Corrupted L2 entry, allocated subcluster #"
# Create a new image, allocate a cluster and write some data to it
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base"
$QEMU_IO -c 'write -q -P 1 4k 2k' "$TEST_IMG"
# Corrupt the L2 entry by making the offset unaligned
poke_file "$TEST_IMG" "$(($l2_offset+6))" "\x02"
# This cannot be repaired, qemu-img check will fail to fix it
_check_test_img -r all
# Attempting to read the image will still show that it's corrupted
$QEMU_IO -c 'read -q 0 2k' "$TEST_IMG"
echo "# Corrupted L2 entry, no allocated subclusters #"
# Create a new image, allocate a cluster and zeroize subcluster #2
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base"
$QEMU_IO -c 'write -q -P 1 4k 2k' "$TEST_IMG"
$QEMU_IO -c 'write -q -z 4k 2k' "$TEST_IMG"
# Corrupt the L2 entry by making the offset unaligned
poke_file "$TEST_IMG" "$(($l2_offset+6))" "\x02"
# This time none of the subclusters are allocated so we can repair the image
_check_test_img -r all
# And the data can be read normally
$QEMU_IO -c 'read -q -P 0xff 0 4k' "$TEST_IMG"
$QEMU_IO -c 'read -q -P 0x00 4k 2k' "$TEST_IMG"
$QEMU_IO -c 'read -q -P 0xff 6k 122k' "$TEST_IMG"
############################################################
############################################################
############################################################
echo
echo "### Image creation options ###"
echo
echo "# cluster_size < 16k"
_make_test_img -o extended_l2=on,cluster_size=8k 1M
echo "# backing file and preallocation=metadata"
# For preallocation with backing files, create a backing file first
$QEMU_IMG create -f raw "$TEST_IMG.base" 1M | _filter_img_create
$QEMU_IO -c "write -q -P 0xff 0 1M" -f raw "$TEST_IMG.base" | _filter_qemu_io
_make_test_img -o extended_l2=on,preallocation=metadata -F raw -b "$TEST_IMG.base" 512k
$QEMU_IMG resize "$TEST_IMG" 1M
$QEMU_IO -c 'read -P 0xff 0 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 512k 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG map "$TEST_IMG" | _filter_testdir
echo "# backing file and preallocation=falloc"
_make_test_img -o extended_l2=on,preallocation=falloc -F raw -b "$TEST_IMG.base" 512k
$QEMU_IMG resize "$TEST_IMG" 1M
$QEMU_IO -c 'read -P 0xff 0 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 512k 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG map "$TEST_IMG" | _filter_testdir
echo "# backing file and preallocation=full"
_make_test_img -o extended_l2=on,preallocation=full -F raw -b "$TEST_IMG.base" 512k
$QEMU_IMG resize "$TEST_IMG" 1M
$QEMU_IO -c 'read -P 0xff 0 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 512k 512k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG map "$TEST_IMG" | _filter_testdir
echo
echo "### Image resizing with preallocation and backing files ###"
echo
# In this case the new subclusters must have the 'all zeroes' bit set
echo "# resize --preallocation=metadata"
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base" 503k
$QEMU_IMG resize --preallocation=metadata "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
# In this case and the next one the new subclusters must be allocated
echo "# resize --preallocation=falloc"
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base" 503k
$QEMU_IMG resize --preallocation=falloc "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
echo "# resize --preallocation=full"
_make_test_img -o extended_l2=on -F raw -b "$TEST_IMG.base" 503k
$QEMU_IMG resize --preallocation=full "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
echo
echo "### Image resizing with preallocation without backing files ###"
echo
# In this case the new subclusters must have the 'all zeroes' bit set
echo "# resize --preallocation=metadata"
_make_test_img -o extended_l2=on 503k
$QEMU_IO -c 'write -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG resize --preallocation=metadata "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
# In this case and the next one the new subclusters must be allocated
echo "# resize --preallocation=falloc"
_make_test_img -o extended_l2=on 503k
$QEMU_IO -c 'write -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG resize --preallocation=falloc "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
echo "# resize --preallocation=full"
_make_test_img -o extended_l2=on 503k
$QEMU_IO -c 'write -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IMG resize --preallocation=full "$TEST_IMG" 1013k
$QEMU_IO -c 'read -P 0xff 0 503k' "$TEST_IMG" | _filter_qemu_io
$QEMU_IO -c 'read -P 0x00 503k 510k' "$TEST_IMG" | _filter_qemu_io
echo
echo "### qemu-img measure ###"
echo
echo "# 512MB, extended_l2=off" # This needs one L2 table
$QEMU_IMG measure --size 512M -O qcow2 -o extended_l2=off
echo "# 512MB, extended_l2=on" # This needs two L2 tables
$QEMU_IMG measure --size 512M -O qcow2 -o extended_l2=on
echo "# 16K clusters, 64GB, extended_l2=off" # This needs one full L1 table cluster
$QEMU_IMG measure --size 64G -O qcow2 -o cluster_size=16k,extended_l2=off
echo "# 16K clusters, 64GB, extended_l2=on" # This needs two full L2 table clusters
$QEMU_IMG measure --size 64G -O qcow2 -o cluster_size=16k,extended_l2=on
echo "# 8k clusters" # This should fail
$QEMU_IMG measure --size 1M -O qcow2 -o cluster_size=8k,extended_l2=on
echo "# 1024 TB" # Maximum allowed size with extended_l2=on and 64K clusters
$QEMU_IMG measure --size 1024T -O qcow2 -o extended_l2=on
echo "# 1025 TB" # This should fail
$QEMU_IMG measure --size 1025T -O qcow2 -o extended_l2=on
echo
echo "### qemu-img amend ###"
echo
_make_test_img -o extended_l2=on 1M
$QEMU_IMG amend -o extended_l2=off "$TEST_IMG" && echo "Unexpected pass"
_make_test_img -o extended_l2=off 1M
$QEMU_IMG amend -o extended_l2=on "$TEST_IMG" && echo "Unexpected pass"
echo
echo "### Test copy-on-write on an image with snapshots ###"
echo
_make_test_img -o extended_l2=on 1M
# For each cluster from #0 to #9 this loop zeroes subcluster #7
# and allocates subclusters #13 and #18.
alloc="13 18"; zero="7"
for c in $(seq 0 9); do
$QEMU_IO -c "write -q -z $((64*$c+14))k 2k" \
-c "write -q -P $((0xd0+$c)) $((64*$c+26))k 2k" \
-c "write -q -P $((0xe0+$c)) $((64*$c+36))k 2k" "$TEST_IMG"
_verify_l2_bitmap "$c"
done
# Create a snapshot and set l2_offset to the new L2 table
$QEMU_IMG snapshot -c snap1 "$TEST_IMG"
l2_offset=$((0x110000))
# Write different patterns to each one of the clusters
# in order to see how copy-on-write behaves in each case.
$QEMU_IO -c "write -q -P 0xf0 $((64*0+30))k 1k" \
-c "write -q -P 0xf1 $((64*1+20))k 1k" \
-c "write -q -P 0xf2 $((64*2+40))k 1k" \
-c "write -q -P 0xf3 $((64*3+26))k 1k" \
-c "write -q -P 0xf4 $((64*4+14))k 1k" \
-c "write -q -P 0xf5 $((64*5+1))k 1k" \
-c "write -q -z $((64*6+30))k 3k" \
-c "write -q -z $((64*7+26))k 2k" \
-c "write -q -z $((64*8+26))k 1k" \
-c "write -q -z $((64*9+12))k 1k" \
"$TEST_IMG"
alloc="$(seq 13 18)"; zero="7" _verify_l2_bitmap 0
alloc="$(seq 10 18)"; zero="7" _verify_l2_bitmap 1
alloc="$(seq 13 20)"; zero="7" _verify_l2_bitmap 2
alloc="$(seq 13 18)"; zero="7" _verify_l2_bitmap 3
alloc="$(seq 7 18)"; zero="" _verify_l2_bitmap 4
alloc="$(seq 0 18)"; zero="" _verify_l2_bitmap 5
alloc="13 18"; zero="7 15 16" _verify_l2_bitmap 6
alloc="18"; zero="7 13" _verify_l2_bitmap 7
alloc="$(seq 13 18)"; zero="7" _verify_l2_bitmap 8
alloc="13 18"; zero="6 7" _verify_l2_bitmap 9
echo
echo "### Test concurrent requests ###"
echo
_concurrent_io()
{
# Allocate three subclusters in the same cluster.
# This works because handle_dependencies() checks whether the requests
# allocate the same cluster, even if the COW regions don't overlap (in
# this case they don't).
cat <<EOF
open -o driver=$IMGFMT blkdebug::$TEST_IMG
break write_aio A
aio_write -P 10 30k 2k
wait_break A
aio_write -P 11 20k 2k
aio_write -P 12 40k 2k
resume A
aio_flush
EOF
}
_concurrent_verify()
{
cat <<EOF
open -o driver=$IMGFMT $TEST_IMG
read -q -P 10 30k 2k
read -q -P 11 20k 2k
read -q -P 12 40k 2k
EOF
}
_make_test_img -o extended_l2=on 1M
# Second and third writes in _concurrent_io() are independent and may finish in
# different order. So, filter offset out to match both possible variants.
_concurrent_io | $QEMU_IO | _filter_qemu_io | \
$SED -e 's/\(20480\|40960\)/OFFSET/'
_concurrent_verify | $QEMU_IO | _filter_qemu_io
# success, all done
echo "*** done"
rm -f $seq.full
status=0