- kvm-migration-multifd-move-macros-to-multifd-header.patch [RHEL-59697] - kvm-migration-refactor-channel-discovery-mechanism.patch [RHEL-59697] - kvm-migration-Add-save_postcopy_prepare-savevm-handler.patch [RHEL-59697] - kvm-migration-ram-Implement-save_postcopy_prepare.patch [RHEL-59697] - kvm-tests-qtest-migration-consolidate-set-capabilities.patch [RHEL-59697] - kvm-migration-write-zero-pages-when-postcopy-enabled.patch [RHEL-59697] - kvm-migration-enable-multifd-and-postcopy-together.patch [RHEL-59697] - kvm-migration-Add-qtest-for-migration-over-RDMA.patch [RHEL-59697] - kvm-qtest-migration-rdma-Enforce-RLIMIT_MEMLOCK-128MB-re.patch [RHEL-59697] - kvm-qtest-migration-rdma-Add-test-for-rdma-migration-wit.patch [RHEL-59697] - kvm-tests-qtest-migration-add-postcopy-tests-with-multif.patch [RHEL-59697] - kvm-file-posix-Fix-aio-threads-performance-regression-af.patch [RHEL-96854] - kvm-block-remove-outdated-comments-about-AioContext-lock.patch [RHEL-88561] - kvm-block-move-drain-outside-of-read-locked-bdrv_reopen_.patch [RHEL-88561] - kvm-block-snapshot-move-drain-outside-of-read-locked-bdr.patch [RHEL-88561] - kvm-block-move-drain-outside-of-read-locked-bdrv_inactiv.patch [RHEL-88561] - kvm-block-mark-bdrv_parent_change_aio_context-GRAPH_RDLO.patch [RHEL-88561] - kvm-block-mark-change_aio_ctx-callback-and-instances-as-.patch [RHEL-88561] - kvm-block-mark-bdrv_child_change_aio_context-GRAPH_RDLOC.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_change_aio_context-.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_try_change_aio_cont.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_attach_child_common.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_set_backing_hd_drai.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_root_attach_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-bdrv_attach_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-quorum_add_child.patch [RHEL-88561] - 
kvm-block-move-drain-outside-of-bdrv_root_unref_child.patch [RHEL-88561] - kvm-block-move-drain-outside-of-quorum_del_child.patch [RHEL-88561] - kvm-blockdev-drain-while-unlocked-in-internal_snapshot_a.patch [RHEL-88561] - kvm-blockdev-drain-while-unlocked-in-external_snapshot_a.patch [RHEL-88561] - kvm-block-mark-bdrv_drained_begin-and-friends-as-GRAPH_U.patch [RHEL-88561] - kvm-iotests-graph-changes-while-io-remove-image-file-aft.patch [RHEL-88561] - kvm-iotests-graph-changes-while-io-add-test-case-with-re.patch [RHEL-88561] - Resolves: RHEL-59697 (Allow multifd+postcopy features being enabled together, but only use multifd during precopy) - Resolves: RHEL-96854 (Performance Degradation (aio=threads) between Upstream Commit b75c5f9 and 984a32f) - Resolves: RHEL-88561 (qemu graph deadlock during job-dismiss)
284 lines
9.3 KiB
Diff
284 lines
9.3 KiB
Diff
From 4629f2201a220c7775df5a305f22d51ba7a34641 Mon Sep 17 00:00:00 2001
|
|
From: Fiona Ebner <f.ebner@proxmox.com>
|
|
Date: Fri, 30 May 2025 17:10:49 +0200
|
|
Subject: [PATCH 24/33] block: move drain outside of bdrv_root_attach_child()
|
|
|
|
RH-Author: Kevin Wolf <kwolf@redhat.com>
|
|
RH-MergeRequest: 393: block: do not drain while holding the graph lock
|
|
RH-Jira: RHEL-88561
|
|
RH-Acked-by: Stefan Hajnoczi <stefanha@redhat.com>
|
|
RH-Acked-by: Hanna Czenczek <hreitz@redhat.com>
|
|
RH-Commit: [12/21] fa142303dc37b7dc3555900f6e86d5d8241cb36b (kmwolf/centos-qemu-kvm)
|
|
|
|
This is part of resolving the deadlock mentioned in commit "block:
|
|
move draining out of bdrv_change_aio_context() and mark GRAPH_RDLOCK".
|
|
|
|
The function bdrv_root_attach_child() runs under the graph lock, so it
|
|
is not allowed to drain. It is called by:
|
|
1. blk_insert_bs(), where a drained section is introduced.
|
|
2. block_job_add_bdrv(), which holds the graph lock itself.
|
|
|
|
block_job_add_bdrv() is called by:
|
|
1. mirror_start_job()
|
|
2. stream_start()
|
|
3. commit_start()
|
|
4. backup_job_create()
|
|
5. block_job_create()
|
|
6. In the test_blockjob_common_drain_node() unit test
|
|
|
|
In all callers, a drained section is introduced.
|
|
|
|
Signed-off-by: Fiona Ebner <f.ebner@proxmox.com>
|
|
Reviewed-by: Kevin Wolf <kwolf@redhat.com>
|
|
Message-ID: <20250530151125.955508-13-f.ebner@proxmox.com>
|
|
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
|
|
(cherry picked from commit ffdcd081f52544f065020c780a6c522dace6b0af)
|
|
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
|
|
---
|
|
block.c | 4 ++--
|
|
block/backup.c | 2 ++
|
|
block/block-backend.c | 2 ++
|
|
block/commit.c | 4 ++++
|
|
block/mirror.c | 5 +++++
|
|
block/stream.c | 4 ++++
|
|
blockjob.c | 4 ++++
|
|
include/block/blockjob.h | 2 ++
|
|
tests/unit/test-bdrv-drain.c | 2 ++
|
|
9 files changed, 27 insertions(+), 2 deletions(-)
|
|
|
|
diff --git a/block.c b/block.c
|
|
index d84b8ae49e..536a017201 100644
|
|
--- a/block.c
|
|
+++ b/block.c
|
|
@@ -3228,6 +3228,8 @@ bdrv_attach_child_noperm(BlockDriverState *parent_bs,
|
|
*
|
|
* On failure NULL is returned, errp is set and the reference to
|
|
* child_bs is also dropped.
|
|
+ *
|
|
+ * All block nodes must be drained.
|
|
*/
|
|
BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
|
|
const char *child_name,
|
|
@@ -3242,7 +3244,6 @@ BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
|
|
|
|
GLOBAL_STATE_CODE();
|
|
|
|
- bdrv_drain_all_begin();
|
|
child = bdrv_attach_child_common(child_bs, child_name, child_class,
|
|
child_role, perm, shared_perm, opaque,
|
|
tran, errp);
|
|
@@ -3255,7 +3256,6 @@ BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
|
|
|
|
out:
|
|
tran_finalize(tran, ret);
|
|
- bdrv_drain_all_end();
|
|
|
|
bdrv_schedule_unref(child_bs);
|
|
|
|
diff --git a/block/backup.c b/block/backup.c
|
|
index 79652bf57b..9d55e55b79 100644
|
|
--- a/block/backup.c
|
|
+++ b/block/backup.c
|
|
@@ -497,10 +497,12 @@ BlockJob *backup_job_create(const char *job_id, BlockDriverState *bs,
|
|
block_copy_set_speed(bcs, speed);
|
|
|
|
/* Required permissions are taken by copy-before-write filter target */
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
block_job_add_bdrv(&job->common, "target", target, 0, BLK_PERM_ALL,
|
|
&error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
return &job->common;
|
|
|
|
diff --git a/block/block-backend.c b/block/block-backend.c
|
|
index 6a6949edeb..24cae3cb55 100644
|
|
--- a/block/block-backend.c
|
|
+++ b/block/block-backend.c
|
|
@@ -904,6 +904,7 @@ int blk_insert_bs(BlockBackend *blk, BlockDriverState *bs, Error **errp)
|
|
|
|
GLOBAL_STATE_CODE();
|
|
bdrv_ref(bs);
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
|
|
if ((bs->open_flags & BDRV_O_INACTIVE) && blk_can_inactivate(blk)) {
|
|
@@ -919,6 +920,7 @@ int blk_insert_bs(BlockBackend *blk, BlockDriverState *bs, Error **errp)
|
|
BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
|
|
perm, shared_perm, blk, errp);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
if (blk->root == NULL) {
|
|
return -EPERM;
|
|
}
|
|
diff --git a/block/commit.c b/block/commit.c
|
|
index 5df3d05346..6c06b894ff 100644
|
|
--- a/block/commit.c
|
|
+++ b/block/commit.c
|
|
@@ -342,6 +342,7 @@ void commit_start(const char *job_id, BlockDriverState *bs,
|
|
* this is the responsibility of the interface (i.e. whoever calls
|
|
* commit_start()).
|
|
*/
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
s->base_overlay = bdrv_find_overlay(top, base);
|
|
assert(s->base_overlay);
|
|
@@ -374,18 +375,21 @@ void commit_start(const char *job_id, BlockDriverState *bs,
|
|
iter_shared_perms, errp);
|
|
if (ret < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
}
|
|
|
|
if (bdrv_freeze_backing_chain(commit_top_bs, base, errp) < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
s->chain_frozen = true;
|
|
|
|
ret = block_job_add_bdrv(&s->common, "base", base, 0, BLK_PERM_ALL, errp);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
if (ret < 0) {
|
|
goto fail;
|
|
diff --git a/block/mirror.c b/block/mirror.c
|
|
index c2c5099c95..6e8caf4b49 100644
|
|
--- a/block/mirror.c
|
|
+++ b/block/mirror.c
|
|
@@ -2014,6 +2014,7 @@ static BlockJob *mirror_start_job(
|
|
*/
|
|
bdrv_disable_dirty_bitmap(s->dirty_bitmap);
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
ret = block_job_add_bdrv(&s->common, "source", bs, 0,
|
|
BLK_PERM_WRITE_UNCHANGED | BLK_PERM_WRITE |
|
|
@@ -2021,6 +2022,7 @@ static BlockJob *mirror_start_job(
|
|
errp);
|
|
if (ret < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
|
|
@@ -2066,16 +2068,19 @@ static BlockJob *mirror_start_job(
|
|
iter_shared_perms, errp);
|
|
if (ret < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
}
|
|
|
|
if (bdrv_freeze_backing_chain(mirror_top_bs, target, errp) < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
}
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
QTAILQ_INIT(&s->ops_in_flight);
|
|
|
|
diff --git a/block/stream.c b/block/stream.c
|
|
index 6ba49cffd3..f5441f27f4 100644
|
|
--- a/block/stream.c
|
|
+++ b/block/stream.c
|
|
@@ -371,10 +371,12 @@ void stream_start(const char *job_id, BlockDriverState *bs,
|
|
* already have our own plans. Also don't allow resize as the image size is
|
|
* queried only at the job start and then cached.
|
|
*/
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
if (block_job_add_bdrv(&s->common, "active node", bs, 0,
|
|
basic_flags | BLK_PERM_WRITE, errp)) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
|
|
@@ -395,10 +397,12 @@ void stream_start(const char *job_id, BlockDriverState *bs,
|
|
basic_flags, errp);
|
|
if (ret < 0) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
goto fail;
|
|
}
|
|
}
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
s->base_overlay = base_overlay;
|
|
s->above_base = above_base;
|
|
diff --git a/blockjob.c b/blockjob.c
|
|
index 34185d7715..44991e3ff7 100644
|
|
--- a/blockjob.c
|
|
+++ b/blockjob.c
|
|
@@ -496,6 +496,7 @@ void *block_job_create(const char *job_id, const BlockJobDriver *driver,
|
|
int ret;
|
|
GLOBAL_STATE_CODE();
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
|
|
if (job_id == NULL && !(flags & JOB_INTERNAL)) {
|
|
@@ -506,6 +507,7 @@ void *block_job_create(const char *job_id, const BlockJobDriver *driver,
|
|
flags, cb, opaque, errp);
|
|
if (job == NULL) {
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
return NULL;
|
|
}
|
|
|
|
@@ -544,10 +546,12 @@ void *block_job_create(const char *job_id, const BlockJobDriver *driver,
|
|
}
|
|
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
return job;
|
|
|
|
fail:
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
job_early_fail(&job->job);
|
|
return NULL;
|
|
}
|
|
diff --git a/include/block/blockjob.h b/include/block/blockjob.h
|
|
index 7061ab7201..990f3e179a 100644
|
|
--- a/include/block/blockjob.h
|
|
+++ b/include/block/blockjob.h
|
|
@@ -137,6 +137,8 @@ BlockJob *block_job_get_locked(const char *id);
|
|
* Add @bs to the list of BlockDriverState that are involved in
|
|
* @job. This means that all operations will be blocked on @bs while
|
|
* @job exists.
|
|
+ *
|
|
+ * All block nodes must be drained.
|
|
*/
|
|
int GRAPH_WRLOCK
|
|
block_job_add_bdrv(BlockJob *job, const char *name, BlockDriverState *bs,
|
|
diff --git a/tests/unit/test-bdrv-drain.c b/tests/unit/test-bdrv-drain.c
|
|
index 3185f3f429..4f3057844b 100644
|
|
--- a/tests/unit/test-bdrv-drain.c
|
|
+++ b/tests/unit/test-bdrv-drain.c
|
|
@@ -772,9 +772,11 @@ static void test_blockjob_common_drain_node(enum drain_type drain_type,
|
|
tjob->bs = src;
|
|
job = &tjob->common;
|
|
|
|
+ bdrv_drain_all_begin();
|
|
bdrv_graph_wrlock();
|
|
block_job_add_bdrv(job, "target", target, 0, BLK_PERM_ALL, &error_abort);
|
|
bdrv_graph_wrunlock();
|
|
+ bdrv_drain_all_end();
|
|
|
|
switch (result) {
|
|
case TEST_JOB_SUCCESS:
|
|
--
|
|
2.39.3
|
|
|