Currently, behavior on copy-before-write operation failure is simple:
report error to the guest.
Let's implement alternative behavior: break the whole copy-before-write
process (and corresponding backup job or NBD client) but keep guest
working. It's needed if we consider guest stability as more important.
The realisation is simple: on copy-before-write failure we immediately
continue guest write operation and set s->snapshot_ret variable which
will lead to all further and in-flight snapshot-API requests failure.
Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@openvz.org>
---
block/copy-before-write.c | 62 ++++++++++++++++++++++++++++++++++-----
qapi/block-core.json | 27 ++++++++++++++++-
2 files changed, 81 insertions(+), 8 deletions(-)
diff --git a/block/copy-before-write.c b/block/copy-before-write.c
index 394e73b094..0614c3d08b 100644
--- a/block/copy-before-write.c
+++ b/block/copy-before-write.c
@@ -41,6 +41,7 @@
typedef struct BDRVCopyBeforeWriteState {
BlockCopyState *bcs;
BdrvChild *target;
+ OnCbwError on_cbw_error;
/*
* @lock: protects access to @access_bitmap, @done_bitmap and
@@ -65,6 +66,14 @@ typedef struct BDRVCopyBeforeWriteState {
* node. These areas must not be rewritten by guest.
*/
BlockReqList frozen_read_reqs;
+
+ /*
+ * @snapshot_error is normally zero. But on first copy-before-write failure
+ * when @on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT, @snapshot_error takes
+ * value of this error (<0). After that all in-flight and further
+ * snaoshot-API requests will fail with that error.
+ */
+ int snapshot_error;
} BDRVCopyBeforeWriteState;
static coroutine_fn int cbw_co_preadv(
@@ -99,11 +108,25 @@ static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs,
end = QEMU_ALIGN_UP(offset + bytes, cluster_size);
ret = block_copy(s->bcs, off, end - off, true);
- if (ret < 0) {
+ if (ret < 0 && s->on_cbw_error == ON_CBW_ERROR_BREAK_GUEST_WRITE) {
return ret;
}
WITH_QEMU_LOCK_GUARD(&s->lock) {
+ if (ret < 0) {
+ assert(s->on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT);
+ if (!s->snapshot_error) {
+ s->snapshot_error = ret;
+ }
+ /*
+ * No need to wait for s->frozen_read_reqs: they will fail anyway,
+ * as s->snapshot_error is set.
+ *
+ * We return 0, as error is handled. Guest operation should be
+ * continued.
+ */
+ return 0;
+ }
bdrv_set_dirty_bitmap(s->done_bitmap, off, end - off);
reqlist_wait_all(&s->frozen_read_reqs, off, end - off, &s->lock);
}
@@ -176,6 +199,11 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
QEMU_LOCK_GUARD(&s->lock);
+ if (s->snapshot_error) {
+ g_free(req);
+ return NULL;
+ }
+
if (bdrv_dirty_bitmap_next_zero(s->access_bitmap, offset, bytes) != -1) {
g_free(req);
return NULL;
@@ -198,19 +226,26 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
return req;
}
-static void cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
+static int cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
{
BDRVCopyBeforeWriteState *s = bs->opaque;
if (req->offset == -1 && req->bytes == -1) {
g_free(req);
- return;
+ /*
+ * No real need to read snapshot_error under mutex here: we are actually
+ * safe to ignore it and return 0, as this request was to s->target, and
+ * can't be influenced by guest write. But if we can new read negative
+ * s->snapshot_error let's return it, so that backup failed earlier.
+ */
+ return s->snapshot_error;
}
QEMU_LOCK_GUARD(&s->lock);
reqlist_remove_req(req);
g_free(req);
+ return s->snapshot_error;
}
static coroutine_fn int
@@ -219,7 +254,7 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
{
BlockReq *req;
BdrvChild *file;
- int ret;
+ int ret, ret2;
/* TODO: upgrade to async loop using AioTask */
while (bytes) {
@@ -232,10 +267,13 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
ret = bdrv_co_preadv_part(file, offset, cur_bytes,
qiov, qiov_offset, 0);
- cbw_snapshot_read_unlock(bs, req);
+ ret2 = cbw_snapshot_read_unlock(bs, req);
if (ret < 0) {
return ret;
}
+ if (ret2 < 0) {
+ return ret2;
+ }
bytes -= cur_bytes;
offset += cur_bytes;
@@ -253,7 +291,7 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
{
BDRVCopyBeforeWriteState *s = bs->opaque;
BlockReq *req;
- int ret;
+ int ret, ret2;
int64_t cur_bytes;
BdrvChild *child;
@@ -273,7 +311,14 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
assert(ret & BDRV_BLOCK_ALLOCATED);
}
- cbw_snapshot_read_unlock(bs, req);
+ ret2 = cbw_snapshot_read_unlock(bs, req);
+
+ if (ret < 0) {
+ return ret;
+ }
+ if (ret2 < 0) {
+ return ret2;
+ }
return ret;
}
@@ -366,6 +411,7 @@ static BlockdevOptionsCbw *cbw_parse_options(QDict *options, Error **errp)
* object for original options.
*/
qdict_extract_subqdict(options, NULL, "bitmap");
+ qdict_del(options, "on-cbw-error");
out:
visit_free(v);
@@ -407,6 +453,8 @@ static int cbw_open(BlockDriverState *bs, QDict *options, int flags,
return -EINVAL;
}
}
+ s->on_cbw_error = opts->has_on_cbw_error ? opts->on_cbw_error :
+ ON_CBW_ERROR_BREAK_GUEST_WRITE;
bs->total_sectors = bs->file->bs->total_sectors;
bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
diff --git a/qapi/block-core.json b/qapi/block-core.json
index e89f2dfb5b..3f08025114 100644
--- a/qapi/block-core.json
+++ b/qapi/block-core.json
@@ -4162,6 +4162,27 @@
'base': 'BlockdevOptionsGenericFormat',
'data': { '*bottom': 'str' } }
+##
+# @OnCbwError:
+#
+# An enumeration of possible behaviors for copy-before-write operation
+# failures.
+#
+# @break-guest-write: report the error to the guest. This way the state
+# of copy-before-write process is kept OK and
+# copy-before-write filter continues to work normally.
+#
+# @break-snapshot: continue guest write. Since this, the snapshot state
+# provided by copy-before-write filter becomes broken.
+# So, all in-flight and all further snapshot-access
+# operations (through snapshot-access block driver)
+# will fail.
+#
+# Since: 7.0
+##
+{ 'enum': 'OnCbwError',
+ 'data': [ 'break-guest-write', 'break-snapshot' ] }
+
##
# @BlockdevOptionsCbw:
#
@@ -4183,11 +4204,15 @@
# modifications (or removing) of specified bitmap doesn't
# influence the filter. (Since 7.0)
#
+# @on-cbw-error: Behavior on failure of copy-before-write operation.
+# Default is @break-guest-write. (Since 7.0)
+#
# Since: 6.2
##
{ 'struct': 'BlockdevOptionsCbw',
'base': 'BlockdevOptionsGenericFormat',
- 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap' } }
+ 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap',
+ '*on-cbw-error': 'OnCbwError' } }
##
# @BlockdevOptions:
--
2.35.1
On 01.04.22 11:19, Vladimir Sementsov-Ogievskiy wrote:
> Currently, behavior on copy-before-write operation failure is simple:
> report error to the guest.
>
> Let's implement alternative behavior: break the whole copy-before-write
> process (and corresponding backup job or NBD client) but keep guest
> working. It's needed if we consider guest stability as more important.
>
> The realisation is simple: on copy-before-write failure we immediately
> continue guest write operation and set s->snapshot_ret variable which
> will lead to all further and in-flight snapshot-API requests failure.
>
> Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@openvz.org>
> ---
> block/copy-before-write.c | 62 ++++++++++++++++++++++++++++++++++-----
> qapi/block-core.json | 27 ++++++++++++++++-
> 2 files changed, 81 insertions(+), 8 deletions(-)
>
> diff --git a/block/copy-before-write.c b/block/copy-before-write.c
> index 394e73b094..0614c3d08b 100644
> --- a/block/copy-before-write.c
> +++ b/block/copy-before-write.c
> @@ -41,6 +41,7 @@
> typedef struct BDRVCopyBeforeWriteState {
> BlockCopyState *bcs;
> BdrvChild *target;
> + OnCbwError on_cbw_error;
>
> /*
> * @lock: protects access to @access_bitmap, @done_bitmap and
> @@ -65,6 +66,14 @@ typedef struct BDRVCopyBeforeWriteState {
> * node. These areas must not be rewritten by guest.
> */
> BlockReqList frozen_read_reqs;
> +
> + /*
> + * @snapshot_error is normally zero. But on first copy-before-write failure
> + * when @on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT, @snapshot_error takes
> + * value of this error (<0). After that all in-flight and further
> + * snaoshot-API requests will fail with that error.
*snapshot
> + */
> + int snapshot_error;
> } BDRVCopyBeforeWriteState;
>
> static coroutine_fn int cbw_co_preadv(
> @@ -99,11 +108,25 @@ static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs,
> end = QEMU_ALIGN_UP(offset + bytes, cluster_size);
Wouldn’t it make sense to completely cease CBW if snapshot_error is
non-zero? (I.e. always returning 0 here, skipping block_copy().) You
can’t read from it anyway anymore. (Except from below the
copy-before-write node, but users shouldn’t be doing this, because they
can’t know which areas are valid to read and which aren’t.)
> ret = block_copy(s->bcs, off, end - off, true);
> - if (ret < 0) {
> + if (ret < 0 && s->on_cbw_error == ON_CBW_ERROR_BREAK_GUEST_WRITE) {
> return ret;
> }
>
> WITH_QEMU_LOCK_GUARD(&s->lock) {
> + if (ret < 0) {
> + assert(s->on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT);
> + if (!s->snapshot_error) {
> + s->snapshot_error = ret;
> + }
> + /*
> + * No need to wait for s->frozen_read_reqs: they will fail anyway,
> + * as s->snapshot_error is set.
> + *
> + * We return 0, as error is handled. Guest operation should be
> + * continued.
> + */
> + return 0;
Hm, OK. Naively, it looks to me like we could save us this explanation
and simplify the code just by unconditionally waiting here (I guess we
could skip the wait if snapshot_error was non-zero before) and not
checking snapshot_error in cbw_snapshot_read_unlock(). I don’t think
not waiting here meaningfully saves time.
> + }
> bdrv_set_dirty_bitmap(s->done_bitmap, off, end - off);
> reqlist_wait_all(&s->frozen_read_reqs, off, end - off, &s->lock);
> }
> @@ -176,6 +199,11 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
>
> QEMU_LOCK_GUARD(&s->lock);
>
> + if (s->snapshot_error) {
> + g_free(req);
> + return NULL;
> + }
> +
> if (bdrv_dirty_bitmap_next_zero(s->access_bitmap, offset, bytes) != -1) {
> g_free(req);
> return NULL;
> @@ -198,19 +226,26 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
> return req;
> }
>
> -static void cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
> +static int cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
> {
> BDRVCopyBeforeWriteState *s = bs->opaque;
>
> if (req->offset == -1 && req->bytes == -1) {
> g_free(req);
> - return;
> + /*
> + * No real need to read snapshot_error under mutex here: we are actually
> + * safe to ignore it and return 0, as this request was to s->target, and
> + * can't be influenced by guest write. But if we can new read negative
> + * s->snapshot_error let's return it, so that backup failed earlier.
> + */
> + return s->snapshot_error;
> }
>
> QEMU_LOCK_GUARD(&s->lock);
>
> reqlist_remove_req(req);
> g_free(req);
> + return s->snapshot_error;
> }
>
> static coroutine_fn int
> @@ -219,7 +254,7 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
> {
> BlockReq *req;
> BdrvChild *file;
> - int ret;
> + int ret, ret2;
>
> /* TODO: upgrade to async loop using AioTask */
> while (bytes) {
> @@ -232,10 +267,13 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
>
> ret = bdrv_co_preadv_part(file, offset, cur_bytes,
> qiov, qiov_offset, 0);
> - cbw_snapshot_read_unlock(bs, req);
> + ret2 = cbw_snapshot_read_unlock(bs, req);
> if (ret < 0) {
> return ret;
> }
> + if (ret2 < 0) {
> + return ret2;
> + }
>
> bytes -= cur_bytes;
> offset += cur_bytes;
> @@ -253,7 +291,7 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
> {
> BDRVCopyBeforeWriteState *s = bs->opaque;
> BlockReq *req;
> - int ret;
> + int ret, ret2;
> int64_t cur_bytes;
> BdrvChild *child;
>
> @@ -273,7 +311,14 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
> assert(ret & BDRV_BLOCK_ALLOCATED);
> }
>
> - cbw_snapshot_read_unlock(bs, req);
> + ret2 = cbw_snapshot_read_unlock(bs, req);
> +
> + if (ret < 0) {
> + return ret;
> + }
> + if (ret2 < 0) {
> + return ret2;
> + }
>
> return ret;
> }
> @@ -366,6 +411,7 @@ static BlockdevOptionsCbw *cbw_parse_options(QDict *options, Error **errp)
> * object for original options.
> */
> qdict_extract_subqdict(options, NULL, "bitmap");
> + qdict_del(options, "on-cbw-error");
>
> out:
> visit_free(v);
> @@ -407,6 +453,8 @@ static int cbw_open(BlockDriverState *bs, QDict *options, int flags,
> return -EINVAL;
> }
> }
> + s->on_cbw_error = opts->has_on_cbw_error ? opts->on_cbw_error :
> + ON_CBW_ERROR_BREAK_GUEST_WRITE;
>
> bs->total_sectors = bs->file->bs->total_sectors;
> bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
> diff --git a/qapi/block-core.json b/qapi/block-core.json
> index e89f2dfb5b..3f08025114 100644
> --- a/qapi/block-core.json
> +++ b/qapi/block-core.json
> @@ -4162,6 +4162,27 @@
> 'base': 'BlockdevOptionsGenericFormat',
> 'data': { '*bottom': 'str' } }
>
> +##
> +# @OnCbwError:
> +#
> +# An enumeration of possible behaviors for copy-before-write operation
> +# failures.
> +#
> +# @break-guest-write: report the error to the guest. This way the state
> +# of copy-before-write process is kept OK and
I’d be more verbose here: “This way, the guest will not be able to
overwrite areas that cannot be backed up, so the backup remains valid.”
I like the bluntness of how these two options are named, by the way.
That does clearly tell users what they’ll have to expect.
> +# copy-before-write filter continues to work normally.
> +#
> +# @break-snapshot: continue guest write. Since this, the snapshot state
> +# provided by copy-before-write filter becomes broken.
Maybe “Doing so will invalidate the backup snapshot”?
> +# So, all in-flight and all further snapshot-access
> +# operations (through snapshot-access block driver)
> +# will fail.
> +#
> +# Since: 7.0
> +##
> +{ 'enum': 'OnCbwError',
> + 'data': [ 'break-guest-write', 'break-snapshot' ] }
> +
> ##
> # @BlockdevOptionsCbw:
> #
> @@ -4183,11 +4204,15 @@
> # modifications (or removing) of specified bitmap doesn't
> # influence the filter. (Since 7.0)
> #
> +# @on-cbw-error: Behavior on failure of copy-before-write operation.
> +# Default is @break-guest-write. (Since 7.0)
*7.1
> +#
> # Since: 6.2
> ##
> { 'struct': 'BlockdevOptionsCbw',
> 'base': 'BlockdevOptionsGenericFormat',
> - 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap' } }
> + 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap',
> + '*on-cbw-error': 'OnCbwError' } }
>
> ##
> # @BlockdevOptions:
01.04.2022 14:58, Hanna Reitz wrote:
> On 01.04.22 11:19, Vladimir Sementsov-Ogievskiy wrote:
>> Currently, behavior on copy-before-write operation failure is simple:
>> report error to the guest.
>>
>> Let's implement alternative behavior: break the whole copy-before-write
>> process (and corresponding backup job or NBD client) but keep guest
>> working. It's needed if we consider guest stability as more important.
>>
>> The realisation is simple: on copy-before-write failure we immediately
>> continue guest write operation and set s->snapshot_ret variable which
>> will lead to all further and in-flight snapshot-API requests failure.
>>
>> Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@openvz.org>
>> ---
>> block/copy-before-write.c | 62 ++++++++++++++++++++++++++++++++++-----
>> qapi/block-core.json | 27 ++++++++++++++++-
>> 2 files changed, 81 insertions(+), 8 deletions(-)
>>
>> diff --git a/block/copy-before-write.c b/block/copy-before-write.c
>> index 394e73b094..0614c3d08b 100644
>> --- a/block/copy-before-write.c
>> +++ b/block/copy-before-write.c
>> @@ -41,6 +41,7 @@
>> typedef struct BDRVCopyBeforeWriteState {
>> BlockCopyState *bcs;
>> BdrvChild *target;
>> + OnCbwError on_cbw_error;
>> /*
>> * @lock: protects access to @access_bitmap, @done_bitmap and
>> @@ -65,6 +66,14 @@ typedef struct BDRVCopyBeforeWriteState {
>> * node. These areas must not be rewritten by guest.
>> */
>> BlockReqList frozen_read_reqs;
>> +
>> + /*
>> + * @snapshot_error is normally zero. But on first copy-before-write failure
>> + * when @on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT, @snapshot_error takes
>> + * value of this error (<0). After that all in-flight and further
>> + * snaoshot-API requests will fail with that error.
>
> *snapshot
>
>> + */
>> + int snapshot_error;
>> } BDRVCopyBeforeWriteState;
>> static coroutine_fn int cbw_co_preadv(
>> @@ -99,11 +108,25 @@ static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs,
>> end = QEMU_ALIGN_UP(offset + bytes, cluster_size);
>
> Wouldn’t it make sense to completely cease CBW if snapshot_error is non-zero? (I.e. always returning 0 here, skipping block_copy().) You can’t read from it anyway anymore. (Except from below the copy-before-write node, but users shouldn’t be doing this, because they can’t know which areas are valid to read and which aren’t.)
Agree, will do.
>
>> ret = block_copy(s->bcs, off, end - off, true);
>> - if (ret < 0) {
>> + if (ret < 0 && s->on_cbw_error == ON_CBW_ERROR_BREAK_GUEST_WRITE) {
>> return ret;
>> }
>> WITH_QEMU_LOCK_GUARD(&s->lock) {
>> + if (ret < 0) {
>> + assert(s->on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT);
>> + if (!s->snapshot_error) {
>> + s->snapshot_error = ret;
>> + }
>> + /*
>> + * No need to wait for s->frozen_read_reqs: they will fail anyway,
>> + * as s->snapshot_error is set.
>> + *
>> + * We return 0, as error is handled. Guest operation should be
>> + * continued.
>> + */
>> + return 0;
>
> Hm, OK. Naively, it looks to me like we could save us this explanation and simplify the code just by unconditionally waiting here (I guess we could skip the wait if snapshot_error was non-zero before) and not checking snapshot_error in cbw_snapshot_read_unlock(). I don’t think not waiting here meaningfully saves time.
Hmm. I tend to agree, this optimization doesn't seem to worth the complexity. Will drop it, we can implement it later if really needed.
>
>> + }
>> bdrv_set_dirty_bitmap(s->done_bitmap, off, end - off);
>> reqlist_wait_all(&s->frozen_read_reqs, off, end - off, &s->lock);
>> }
>> @@ -176,6 +199,11 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
>> QEMU_LOCK_GUARD(&s->lock);
>> + if (s->snapshot_error) {
>> + g_free(req);
>> + return NULL;
>> + }
>> +
>> if (bdrv_dirty_bitmap_next_zero(s->access_bitmap, offset, bytes) != -1) {
>> g_free(req);
>> return NULL;
>> @@ -198,19 +226,26 @@ static BlockReq *cbw_snapshot_read_lock(BlockDriverState *bs,
>> return req;
>> }
>> -static void cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
>> +static int cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
>> {
>> BDRVCopyBeforeWriteState *s = bs->opaque;
>> if (req->offset == -1 && req->bytes == -1) {
>> g_free(req);
>> - return;
>> + /*
>> + * No real need to read snapshot_error under mutex here: we are actually
>> + * safe to ignore it and return 0, as this request was to s->target, and
>> + * can't be influenced by guest write. But if we can new read negative
>> + * s->snapshot_error let's return it, so that backup failed earlier.
>> + */
>> + return s->snapshot_error;
>> }
>> QEMU_LOCK_GUARD(&s->lock);
>> reqlist_remove_req(req);
>> g_free(req);
>> + return s->snapshot_error;
>> }
>> static coroutine_fn int
>> @@ -219,7 +254,7 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
>> {
>> BlockReq *req;
>> BdrvChild *file;
>> - int ret;
>> + int ret, ret2;
>> /* TODO: upgrade to async loop using AioTask */
>> while (bytes) {
>> @@ -232,10 +267,13 @@ cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
>> ret = bdrv_co_preadv_part(file, offset, cur_bytes,
>> qiov, qiov_offset, 0);
>> - cbw_snapshot_read_unlock(bs, req);
>> + ret2 = cbw_snapshot_read_unlock(bs, req);
>> if (ret < 0) {
>> return ret;
>> }
>> + if (ret2 < 0) {
>> + return ret2;
>> + }
>> bytes -= cur_bytes;
>> offset += cur_bytes;
>> @@ -253,7 +291,7 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
>> {
>> BDRVCopyBeforeWriteState *s = bs->opaque;
>> BlockReq *req;
>> - int ret;
>> + int ret, ret2;
>> int64_t cur_bytes;
>> BdrvChild *child;
>> @@ -273,7 +311,14 @@ cbw_co_snapshot_block_status(BlockDriverState *bs,
>> assert(ret & BDRV_BLOCK_ALLOCATED);
>> }
>> - cbw_snapshot_read_unlock(bs, req);
>> + ret2 = cbw_snapshot_read_unlock(bs, req);
>> +
>> + if (ret < 0) {
>> + return ret;
>> + }
>> + if (ret2 < 0) {
>> + return ret2;
>> + }
>> return ret;
>> }
>> @@ -366,6 +411,7 @@ static BlockdevOptionsCbw *cbw_parse_options(QDict *options, Error **errp)
>> * object for original options.
>> */
>> qdict_extract_subqdict(options, NULL, "bitmap");
>> + qdict_del(options, "on-cbw-error");
>> out:
>> visit_free(v);
>> @@ -407,6 +453,8 @@ static int cbw_open(BlockDriverState *bs, QDict *options, int flags,
>> return -EINVAL;
>> }
>> }
>> + s->on_cbw_error = opts->has_on_cbw_error ? opts->on_cbw_error :
>> + ON_CBW_ERROR_BREAK_GUEST_WRITE;
>> bs->total_sectors = bs->file->bs->total_sectors;
>> bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
>> diff --git a/qapi/block-core.json b/qapi/block-core.json
>> index e89f2dfb5b..3f08025114 100644
>> --- a/qapi/block-core.json
>> +++ b/qapi/block-core.json
>> @@ -4162,6 +4162,27 @@
>> 'base': 'BlockdevOptionsGenericFormat',
>> 'data': { '*bottom': 'str' } }
>> +##
>> +# @OnCbwError:
>> +#
>> +# An enumeration of possible behaviors for copy-before-write operation
>> +# failures.
>> +#
>> +# @break-guest-write: report the error to the guest. This way the state
>> +# of copy-before-write process is kept OK and
>
> I’d be more verbose here: “This way, the guest will not be able to overwrite areas that cannot be backed up, so the backup remains valid.”
Sounds good
>
> I like the bluntness of how these two options are named, by the way. That does clearly tell users what they’ll have to expect.
>
>> +# copy-before-write filter continues to work normally.
>> +#
>> +# @break-snapshot: continue guest write. Since this, the snapshot state
>> +# provided by copy-before-write filter becomes broken.
>
> Maybe “Doing so will invalidate the backup snapshot”?
"invalidate" word was never clear for me.. In our block-layer for example "invalidate" is opposite to "inactivate".
something like:
Doing so will make the provided snapshot state invalid and any backup or export process based on it will finally fail.
?
>
>> +# So, all in-flight and all further snapshot-access
>> +# operations (through snapshot-access block driver)
>> +# will fail.
>> +#
>> +# Since: 7.0
>> +##
>> +{ 'enum': 'OnCbwError',
>> + 'data': [ 'break-guest-write', 'break-snapshot' ] }
>> +
>> ##
>> # @BlockdevOptionsCbw:
>> #
>> @@ -4183,11 +4204,15 @@
>> # modifications (or removing) of specified bitmap doesn't
>> # influence the filter. (Since 7.0)
>> #
>> +# @on-cbw-error: Behavior on failure of copy-before-write operation.
>> +# Default is @break-guest-write. (Since 7.0)
>
> *7.1
>
>> +#
>> # Since: 6.2
>> ##
>> { 'struct': 'BlockdevOptionsCbw',
>> 'base': 'BlockdevOptionsGenericFormat',
>> - 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap' } }
>> + 'data': { 'target': 'BlockdevRef', '*bitmap': 'BlockDirtyBitmap',
>> + '*on-cbw-error': 'OnCbwError' } }
>> ##
>> # @BlockdevOptions:
>
--
Best regards,
Vladimir
© 2016 - 2026 Red Hat, Inc.