- kvm-migration-multifd-move-macros-to-multifd-header.patch [RHEL-59697] - kvm-migration-refactor-channel-discovery-mechanism.patch [RHEL-59697] - kvm-migration-Add-save_postcopy_prepare-savevm-handler.patch [RHEL-59697] - kvm-migration-ram-Implement-save_postcopy_prepare.patch [RHEL-59697] - kvm-tests-qtest-migration-consolidate-set-capabilities.patch [RHEL-59697] - kvm-migration-write-zero-pages-when-postcopy-enabled.patch [RHEL-59697] - kvm-migration-enable-multifd-and-postcopy-together.patch [RHEL-59697] - kvm-migration-Add-qtest-for-migration-over-RDMA.patch [RHEL-59697] - kvm-qtest-migration-rdma-Enforce-RLIMIT_MEMLOCK-128MB-re.patch [RHEL-59697] - kvm-qtest-migration-rdma-Add-test-for-rdma-migration-wit.patch [RHEL-59697] - kvm-tests-qtest-migration-add-postcopy-tests-with-multif.patch [RHEL-59697] - kvm-file-posix-Fix-aio-threads-performance-regression-af.patch [RHEL-96854] - kvm-block-remove-outdated-comments-about-AioContext-lock.patch [RHEL-88561] - kvm-block-move-drain-outside-of-read-locked-bdrv_reopen_.patch [RHEL-88561] - kvm-block-snapshot-move-drain-outside-of-read-locked-bdr.patch [RHEL-88561] - kvm-block-move-drain-outside-of-read-locked-bdrv_inactiv.patch [RHEL-88561] - kvm-block-mark-bdrv_parent_change_aio_context-GRAPH_RDLO.patch [RHEL-88561] - kvm-block-mark-change_aio_ctx-callback-and-instances-as-.patch [RHEL-88561] - kvm-block-mark-bdrv_child_change_aio_context-GRAPH_RDLOC.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_change_aio_context-.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_try_change_aio_cont.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_attach_child_common.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_set_backing_hd_drai.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_root_attach_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_attach_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-quorum_add_child.patch [RHEL-88561] - 
kvm-block-move-drain-outside-of-bdrv_root_unref_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-quorum_del_child.patch [RHEL-88561] - kvm-blockdev-drain-while-unlocked-in-internal_snapshot_a.patch [RHEL-88561] - kvm-blockdev-drain-while-unlocked-in-external_snapshot_a.patch [RHEL-88561] - kvm-block-mark-bdrv_drained_begin-and-friends-as-GRAPH_U.patch [RHEL-88561] - kvm-iotests-graph-changes-while-io-remove-image-file-aft.patch [RHEL-88561] - kvm-iotests-graph-changes-while-io-add-test-case-with-re.patch [RHEL-88561] - Resolves: RHEL-59697 (Allow multifd+postcopy features being enabled together, but only use multifd during precopy) - Resolves: RHEL-96854 (Performance Degradation (aio=threads) between Upstream Commit b75c5f9 and 984a32f) - Resolves: RHEL-88561 (qemu graph deadlock during job-dismiss)
327 lines
12 KiB
Diff
327 lines
12 KiB
Diff
From 62e8b3e9173ea4fb85cf52c66109832ff9d4d437 Mon Sep 17 00:00:00 2001
|
|
From: Fiona Ebner <f.ebner@proxmox.com>
|
|
Date: Fri, 30 May 2025 17:10:50 +0200
|
|
Subject: [PATCH 25/33] block: move drain outside of bdrv_attach_child()
|
|
|
|
RH-Author: Kevin Wolf <kwolf@redhat.com>
|
|
RH-MergeRequest: 393: block: do not drain while holding the graph lock
|
|
RH-Jira: RHEL-88561
|
|
RH-Acked-by: Stefan Hajnoczi <stefanha@redhat.com>
|
|
RH-Acked-by: Hanna Czenczek <hreitz@redhat.com>
|
|
RH-Commit: [13/21] c68a1e34fa991dff72ec0a6403fd9786341ab534 (kmwolf/centos-qemu-kvm)
|
|
|
|
This is part of resolving the deadlock mentioned in commit "block:
|
|
move draining out of bdrv_change_aio_context() and mark GRAPH_RDLOCK".
|
|
|
|
The function bdrv_attach_child() runs under the graph lock, so it is
|
|
not allowed to drain. It is called by:
|
|
1. replication_start()
|
|
2. quorum_add_child()
|
|
3. bdrv_open_child_common()
|
|
4. Unit tests throughout test-bdrv-graph-mod.c and test-bdrv-drain.c.
|
|
|
|
In all callers, a drained section is introduced.
|
|
|
|
Note that quorum_add_child() itself runs under the graph lock, so the
|
|
drained section added there by this commit is not actually allowed.
|
|
This will be addressed by the following commit.
|
|
|
|
Signed-off-by: Fiona Ebner <f.ebner@proxmox.com>
|
|
Reviewed-by: Kevin Wolf <kwolf@redhat.com>
|
|
Message-ID: <20250530151125.955508-14-f.ebner@proxmox.com>
|
|
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
|
|
(cherry picked from commit 77f3965ba7fed5b35212171a1e41c20c05a7ef11)
|
|
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
|
|
---
|
|
block.c | 6 ++++--
|
|
block/quorum.c | 2 ++
|
|
block/replication.c | 5 +++++
|
|
tests/unit/test-bdrv-drain.c | 14 ++++++++++++++
|
|
tests/unit/test-bdrv-graph-mod.c | 10 ++++++++++
|
|
5 files changed, 35 insertions(+), 2 deletions(-)
|
|
|
|
diff --git a/block.c b/block.c
|
|
index 536a017201..3857f42877 100644
|
|
--- a/block.c
|
|
+++ b/block.c
|
|
@@ -3269,6 +3269,8 @@ out:
|
|
*
|
|
* On failure NULL is returned, errp is set and the reference to
|
|
* child_bs is also dropped.
|
|
+ *
|
|
+ * All block nodes must be drained.
|
|
*/
|
|
BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
|
|
BlockDriverState *child_bs,
|
|
@@ -3283,7 +3285,6 @@ BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
|
|
|
|
GLOBAL_STATE_CODE();
|
|
|
|
- bdrv_drain_all_begin();
|
|
child = bdrv_attach_child_noperm(parent_bs, child_bs, child_name,
|
|
child_class, child_role, tran, errp);
|
|
if (!child) {
|
|
@@ -3298,7 +3299,6 @@ BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
|
|
|
|
out:
|
|
tran_finalize(tran, ret);
|
|
- bdrv_drain_all_end();
|
|
|
|
bdrv_schedule_unref(child_bs);
|
|
|
|
@@ -3789,10 +3789,12 @@ static BdrvChild *bdrv_open_child_common(const char *filename,
|
|
return NULL;
|
|
}
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
child = bdrv_attach_child(parent, bs, bdref_key, child_class, child_role,
|
|
errp);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
return child;
|
|
}
|
|
diff --git a/block/quorum.c b/block/quorum.c
|
|
index ed8ce801ee..ea17b0ec13 100644
|
|
--- a/block/quorum.c
|
|
+++ b/block/quorum.c
|
|
@@ -1096,8 +1096,10 @@ quorum_add_child(BlockDriverState *bs, BlockDriverState *child_bs, Error **errp)
|
|
/* We can safely add the child now */
|
|
bdrv_ref(child_bs);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
child = bdrv_attach_child(bs, child_bs, indexstr, &child_of_bds,
|
|
BDRV_CHILD_DATA, errp);
|
|
+ bdrv_drain_all_end();
|
|
if (child == NULL) {
|
|
s->next_child_index--;
|
|
return;
|
|
diff --git a/block/replication.c b/block/replication.c
|
|
index 0020f33843..02814578c6 100644
|
|
--- a/block/replication.c
|
|
+++ b/block/replication.c
|
|
@@ -541,6 +541,7 @@ static void replication_start(ReplicationState *rs, ReplicationMode mode,
|
|
return;
|
|
}
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
|
|
bdrv_ref(hidden_disk->bs);
|
|
@@ -550,6 +551,7 @@ static void replication_start(ReplicationState *rs, ReplicationMode mode,
|
|
if (local_err) {
|
|
error_propagate(errp, local_err);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
return;
|
|
}
|
|
|
|
@@ -560,6 +562,7 @@ static void replication_start(ReplicationState *rs, ReplicationMode mode,
|
|
if (local_err) {
|
|
error_propagate(errp, local_err);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
return;
|
|
}
|
|
|
|
@@ -572,12 +575,14 @@ static void replication_start(ReplicationState *rs, ReplicationMode mode,
|
|
!check_top_bs(top_bs, bs)) {
|
|
error_setg(errp, "No top_bs or it is invalid");
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
reopen_backing_file(bs, false, NULL);
|
|
return;
|
|
}
|
|
bdrv_op_block_all(top_bs, s->blocker);
|
|
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
s->backup_job = backup_job_create(
|
|
NULL, s->secondary_disk->bs, s->hidden_disk->bs,
|
|
diff --git a/tests/unit/test-bdrv-drain.c b/tests/unit/test-bdrv-drain.c
|
|
index 4f3057844b..ac76525e5a 100644
|
|
--- a/tests/unit/test-bdrv-drain.c
|
|
+++ b/tests/unit/test-bdrv-drain.c
|
|
@@ -1049,10 +1049,12 @@ static void do_test_delete_by_drain(bool detach_instead_of_delete,
|
|
|
|
null_bs = bdrv_open("null-co://", NULL, NULL, BDRV_O_RDWR | BDRV_O_PROTOCOL,
|
|
&error_abort);
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(bs, null_bs, "null-child", &child_of_bds,
|
|
BDRV_CHILD_DATA, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
/* This child will be the one to pass to requests through to, and
|
|
* it will stall until a drain occurs */
|
|
@@ -1060,21 +1062,25 @@ static void do_test_delete_by_drain(bool detach_instead_of_delete,
|
|
&error_abort);
|
|
child_bs->total_sectors = 65536 >> BDRV_SECTOR_BITS;
|
|
/* Takes our reference to child_bs */
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
tts->wait_child = bdrv_attach_child(bs, child_bs, "wait-child",
|
|
&child_of_bds,
|
|
BDRV_CHILD_DATA | BDRV_CHILD_PRIMARY,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
/* This child is just there to be deleted
|
|
* (for detach_instead_of_delete == true) */
|
|
null_bs = bdrv_open("null-co://", NULL, NULL, BDRV_O_RDWR | BDRV_O_PROTOCOL,
|
|
&error_abort);
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(bs, null_bs, "null-child", &child_of_bds, BDRV_CHILD_DATA,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
|
|
blk_insert_bs(blk, bs, &error_abort);
|
|
@@ -1157,6 +1163,7 @@ static void no_coroutine_fn detach_indirect_bh(void *opaque)
|
|
|
|
bdrv_dec_in_flight(data->child_b->bs);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_unref_child(data->parent_b, data->child_b);
|
|
|
|
@@ -1165,6 +1172,7 @@ static void no_coroutine_fn detach_indirect_bh(void *opaque)
|
|
&child_of_bds, BDRV_CHILD_DATA,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
}
|
|
|
|
static void coroutine_mixed_fn detach_by_parent_aio_cb(void *opaque, int ret)
|
|
@@ -1262,6 +1270,7 @@ static void TSA_NO_TSA test_detach_indirect(bool by_parent_cb)
|
|
/* Set child relationships */
|
|
bdrv_ref(b);
|
|
bdrv_ref(a);
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
child_b = bdrv_attach_child(parent_b, b, "PB-B", &child_of_bds,
|
|
BDRV_CHILD_DATA, &error_abort);
|
|
@@ -1273,6 +1282,7 @@ static void TSA_NO_TSA test_detach_indirect(bool by_parent_cb)
|
|
by_parent_cb ? &child_of_bds : &detach_by_driver_cb_class,
|
|
BDRV_CHILD_DATA, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
g_assert_cmpint(parent_a->refcnt, ==, 1);
|
|
g_assert_cmpint(parent_b->refcnt, ==, 1);
|
|
@@ -1685,6 +1695,7 @@ static void test_drop_intermediate_poll(void)
|
|
* Establish the chain last, so the chain links are the first
|
|
* elements in the BDS.parents lists
|
|
*/
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
for (i = 0; i < 3; i++) {
|
|
if (i) {
|
|
@@ -1694,6 +1705,7 @@ static void test_drop_intermediate_poll(void)
|
|
}
|
|
}
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
job = block_job_create("job", &test_simple_job_driver, NULL, job_node,
|
|
0, BLK_PERM_ALL, 0, 0, NULL, NULL, &error_abort);
|
|
@@ -1940,10 +1952,12 @@ static void do_test_replace_child_mid_drain(int old_drain_count,
|
|
new_child_bs->total_sectors = 1;
|
|
|
|
bdrv_ref(old_child_bs);
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(parent_bs, old_child_bs, "child", &child_of_bds,
|
|
BDRV_CHILD_COW, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
parent_s->setup_completed = true;
|
|
|
|
for (i = 0; i < old_drain_count; i++) {
|
|
diff --git a/tests/unit/test-bdrv-graph-mod.c b/tests/unit/test-bdrv-graph-mod.c
|
|
index d743abb4bb..7b03ebe4b0 100644
|
|
--- a/tests/unit/test-bdrv-graph-mod.c
|
|
+++ b/tests/unit/test-bdrv-graph-mod.c
|
|
@@ -137,10 +137,12 @@ static void test_update_perm_tree(void)
|
|
|
|
blk_insert_bs(root, bs, &error_abort);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(filter, bs, "child", &child_of_bds,
|
|
BDRV_CHILD_DATA, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
ret = bdrv_append(filter, bs, NULL);
|
|
g_assert_cmpint(ret, <, 0);
|
|
@@ -204,11 +206,13 @@ static void test_should_update_child(void)
|
|
|
|
bdrv_set_backing_hd(target, bs, &error_abort);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
g_assert(target->backing->bs == bs);
|
|
bdrv_attach_child(filter, target, "target", &child_of_bds,
|
|
BDRV_CHILD_DATA, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
bdrv_append(filter, bs, &error_abort);
|
|
|
|
bdrv_graph_rdlock_main_loop();
|
|
@@ -244,6 +248,7 @@ static void test_parallel_exclusive_write(void)
|
|
bdrv_ref(base);
|
|
bdrv_ref(fl1);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(top, fl1, "backing", &child_of_bds,
|
|
BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
|
|
@@ -257,6 +262,7 @@ static void test_parallel_exclusive_write(void)
|
|
|
|
bdrv_replace_node(fl1, fl2, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
bdrv_drained_end(fl2);
|
|
bdrv_drained_end(fl1);
|
|
@@ -363,6 +369,7 @@ static void test_parallel_perm_update(void)
|
|
*/
|
|
bdrv_ref(base);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(top, ws, "file", &child_of_bds, BDRV_CHILD_DATA,
|
|
&error_abort);
|
|
@@ -377,6 +384,7 @@ static void test_parallel_perm_update(void)
|
|
BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
/* Select fl1 as first child to be active */
|
|
s->selected = c_fl1;
|
|
@@ -430,11 +438,13 @@ static void test_append_greedy_filter(void)
|
|
BlockDriverState *base = no_perm_node("base");
|
|
BlockDriverState *fl = exclusive_writer_node("fl1");
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
bdrv_attach_child(top, base, "backing", &child_of_bds,
|
|
BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
bdrv_append(fl, base, &error_abort);
|
|
bdrv_unref(fl);
|
|
--
|
|
2.39.3
|
|
|