1
The following changes since commit e47f81b617684c4546af286d307b69014a83538a:
1
The following changes since commit 013a18edbbc59cdad019100c7d03c0494642b74c:
2
2
3
Merge remote-tracking branch 'remotes/thibault/tags/samuel-thibault' into staging (2019-02-07 18:53:25 +0000)
3
Merge remote-tracking branch 'remotes/pmaydell/tags/pull-target-arm-2020051=
4
4' into staging (2020-05-14 16:17:55 +0100)
4
5
5
are available in the Git repository at:
6
are available in the Git repository at:
6
7
7
git://github.com/stefanha/qemu.git tags/block-pull-request
8
https://github.com/stefanha/qemu.git tags/block-pull-request
8
9
9
for you to fetch changes up to 55140166667bb555c5d05165b93b25557d2e6397:
10
for you to fetch changes up to ba607ca8bff4d2c2062902f8355657c865ac7c29:
10
11
11
tests/virtio-blk: add test for WRITE_ZEROES command (2019-02-11 11:58:17 +0800)
12
aio-posix: disable fdmon-io_uring when GSource is used (2020-05-18 18:16:00=
13
+0100)
12
14
13
----------------------------------------------------------------
15
----------------------------------------------------------------
14
Pull request
16
Pull request
15
17
16
User-visible changes:
17
18
* virtio-blk: DISCARD and WRITE_ZEROES support
19
20
----------------------------------------------------------------
18
----------------------------------------------------------------
21
19
22
Peter Xu (1):
20
Philippe Mathieu-Daud=C3=A9 (6):
23
iothread: fix iothread hang when stop too soon
21
tests/fuzz/Makefile: Do not link code using unavailable devices
22
Makefile: List fuzz targets in 'make help'
23
tests/fuzz: Add missing space in test description
24
tests/fuzz: Remove unuseful/unused typedefs
25
tests/fuzz: Extract pciconfig_fuzz_qos() method
26
tests/fuzz: Extract ioport_fuzz_qtest() method
24
27
25
Stefano Garzarella (7):
28
Stefan Hajnoczi (2):
26
virtio-blk: cleanup using VirtIOBlock *s and VirtIODevice *vdev
29
aio-posix: don't duplicate fd handler deletion in
27
virtio-blk: add acct_failed param to virtio_blk_handle_rw_error()
30
fdmon_io_uring_destroy()
28
virtio-blk: add host_features field in VirtIOBlock
31
aio-posix: disable fdmon-io_uring when GSource is used
29
virtio-blk: add "discard" and "write-zeroes" properties
30
virtio-blk: add DISCARD and WRITE_ZEROES features
31
tests/virtio-blk: change assert on data_size in virtio_blk_request()
32
tests/virtio-blk: add test for WRITE_ZEROES command
33
32
34
Vladimir Sementsov-Ogievskiy (1):
33
Makefile | 6 +++-
35
qemugdb/coroutine: fix arch_prctl has unknown return type
34
tests/qtest/fuzz/Makefile.include | 6 ++--
35
include/block/aio.h | 3 ++
36
tests/qtest/fuzz/i440fx_fuzz.c | 47 ++++++++++++++++++++-----------
37
util/aio-posix.c | 13 +++++++++
38
util/aio-win32.c | 4 +++
39
util/async.c | 1 +
40
util/fdmon-io_uring.c | 13 +++++++--
41
8 files changed, 69 insertions(+), 24 deletions(-)
36
42
37
include/hw/virtio/virtio-blk.h | 5 +-
43
--=20
38
hw/block/virtio-blk.c | 236 +++++++++++++++++++++++++++++----
44
2.25.3
39
hw/core/machine.c | 2 +
40
iothread.c | 6 +-
41
tests/virtio-blk-test.c | 75 ++++++++++-
42
scripts/qemugdb/coroutine.py | 2 +-
43
6 files changed, 297 insertions(+), 29 deletions(-)
44
45
45
--
46
2.20.1
47
48
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
If the WRITE_ZEROES feature is enabled, we check this command
3
Some devices availability depends on CONFIG options.
4
in the test_basic().
4
Use these options to only link tests when requested device
5
is available.
5
6
6
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
7
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
7
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
8
Message-id: 20200514143433.18569-2-philmd@redhat.com
8
Acked-by: Thomas Huth <thuth@redhat.com>
9
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
10
Acked-by: Pankaj Gupta <pagupta@redhat.com>
11
Message-id: 20190208134950.187665-7-sgarzare@redhat.com
12
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
9
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
13
---
10
---
14
tests/virtio-blk-test.c | 60 +++++++++++++++++++++++++++++++++++++++++
11
tests/qtest/fuzz/Makefile.include | 6 +++---
15
1 file changed, 60 insertions(+)
12
1 file changed, 3 insertions(+), 3 deletions(-)
16
13
17
diff --git a/tests/virtio-blk-test.c b/tests/virtio-blk-test.c
14
diff --git a/tests/qtest/fuzz/Makefile.include b/tests/qtest/fuzz/Makefile.include
18
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
19
--- a/tests/virtio-blk-test.c
16
--- a/tests/qtest/fuzz/Makefile.include
20
+++ b/tests/virtio-blk-test.c
17
+++ b/tests/qtest/fuzz/Makefile.include
21
@@ -XXX,XX +XXX,XX @@ static void test_basic(QVirtioDevice *dev, QGuestAllocator *alloc,
18
@@ -XXX,XX +XXX,XX @@ fuzz-obj-y += tests/qtest/fuzz/fork_fuzz.o
22
19
fuzz-obj-y += tests/qtest/fuzz/qos_fuzz.o
23
guest_free(alloc, req_addr);
20
24
21
# Targets
25
+ if (features & (1u << VIRTIO_BLK_F_WRITE_ZEROES)) {
22
-fuzz-obj-y += tests/qtest/fuzz/i440fx_fuzz.o
26
+ struct virtio_blk_discard_write_zeroes dwz_hdr;
23
-fuzz-obj-y += tests/qtest/fuzz/virtio_net_fuzz.o
27
+ void *expected;
24
-fuzz-obj-y += tests/qtest/fuzz/virtio_scsi_fuzz.o
28
+
25
+fuzz-obj-$(CONFIG_PCI_I440FX) += tests/qtest/fuzz/i440fx_fuzz.o
29
+ /*
26
+fuzz-obj-$(CONFIG_VIRTIO_NET) += tests/qtest/fuzz/virtio_net_fuzz.o
30
+ * WRITE_ZEROES request on the same sector of previous test where
27
+fuzz-obj-$(CONFIG_SCSI) += tests/qtest/fuzz/virtio_scsi_fuzz.o
31
+ * we wrote "TEST".
28
32
+ */
29
FUZZ_CFLAGS += -I$(SRC_PATH)/tests -I$(SRC_PATH)/tests/qtest
33
+ req.type = VIRTIO_BLK_T_WRITE_ZEROES;
30
34
+ req.data = (char *) &dwz_hdr;
35
+ dwz_hdr.sector = 0;
36
+ dwz_hdr.num_sectors = 1;
37
+ dwz_hdr.flags = 0;
38
+
39
+ req_addr = virtio_blk_request(alloc, dev, &req, sizeof(dwz_hdr));
40
+
41
+ free_head = qvirtqueue_add(vq, req_addr, 16, false, true);
42
+ qvirtqueue_add(vq, req_addr + 16, sizeof(dwz_hdr), false, true);
43
+ qvirtqueue_add(vq, req_addr + 16 + sizeof(dwz_hdr), 1, true, false);
44
+
45
+ qvirtqueue_kick(dev, vq, free_head);
46
+
47
+ qvirtio_wait_used_elem(dev, vq, free_head, NULL,
48
+ QVIRTIO_BLK_TIMEOUT_US);
49
+ status = readb(req_addr + 16 + sizeof(dwz_hdr));
50
+ g_assert_cmpint(status, ==, 0);
51
+
52
+ guest_free(alloc, req_addr);
53
+
54
+ /* Read request to check if the sector contains all zeroes */
55
+ req.type = VIRTIO_BLK_T_IN;
56
+ req.ioprio = 1;
57
+ req.sector = 0;
58
+ req.data = g_malloc0(512);
59
+
60
+ req_addr = virtio_blk_request(alloc, dev, &req, 512);
61
+
62
+ g_free(req.data);
63
+
64
+ free_head = qvirtqueue_add(vq, req_addr, 16, false, true);
65
+ qvirtqueue_add(vq, req_addr + 16, 512, true, true);
66
+ qvirtqueue_add(vq, req_addr + 528, 1, true, false);
67
+
68
+ qvirtqueue_kick(dev, vq, free_head);
69
+
70
+ qvirtio_wait_used_elem(dev, vq, free_head, NULL,
71
+ QVIRTIO_BLK_TIMEOUT_US);
72
+ status = readb(req_addr + 528);
73
+ g_assert_cmpint(status, ==, 0);
74
+
75
+ data = g_malloc(512);
76
+ expected = g_malloc0(512);
77
+ memread(req_addr + 16, data, 512);
78
+ g_assert_cmpmem(data, 512, expected, 512);
79
+ g_free(expected);
80
+ g_free(data);
81
+
82
+ guest_free(alloc, req_addr);
83
+ }
84
+
85
if (features & (1u << VIRTIO_F_ANY_LAYOUT)) {
86
/* Write and read with 2 descriptor layout */
87
/* Write request */
88
--
31
--
89
2.20.1
32
2.25.3
90
33
91
diff view generated by jsdifflib
1
From: Peter Xu <peterx@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
Lukas reported an hard to reproduce QMP iothread hang on s390 that
3
List softmmu fuzz targets in 'make help' output:
4
QEMU might hang at pthread_join() of the QMP monitor iothread before
5
quitting:
6
4
7
Thread 1
5
$ make help
8
#0 0x000003ffad10932c in pthread_join
6
...
9
#1 0x0000000109e95750 in qemu_thread_join
7
Architecture specific targets:
10
at /home/thuth/devel/qemu/util/qemu-thread-posix.c:570
8
aarch64-softmmu/all - Build for aarch64-softmmu
11
#2 0x0000000109c95a1c in iothread_stop
9
aarch64-softmmu/fuzz - Build fuzzer for aarch64-softmmu
12
#3 0x0000000109bb0874 in monitor_cleanup
10
alpha-softmmu/all - Build for alpha-softmmu
13
#4 0x0000000109b55042 in main
11
alpha-softmmu/fuzz - Build fuzzer for alpha-softmmu
12
arm-softmmu/all - Build for arm-softmmu
13
arm-softmmu/fuzz - Build fuzzer for arm-softmmu
14
...
14
15
15
While the iothread is still in the main loop:
16
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
16
17
Message-id: 20200514143433.18569-3-philmd@redhat.com
17
Thread 4
18
#0 0x000003ffad0010e4 in ??
19
#1 0x000003ffad553958 in g_main_context_iterate.isra.19
20
#2 0x000003ffad553d90 in g_main_loop_run
21
#3 0x0000000109c9585a in iothread_run
22
at /home/thuth/devel/qemu/iothread.c:74
23
#4 0x0000000109e94752 in qemu_thread_start
24
at /home/thuth/devel/qemu/util/qemu-thread-posix.c:502
25
#5 0x000003ffad10825a in start_thread
26
#6 0x000003ffad00dcf2 in thread_start
27
28
IMHO it's because there's a race between the main thread and iothread
29
when stopping the thread in following sequence:
30
31
main thread iothread
32
=========== ==============
33
aio_poll()
34
iothread_get_g_main_context
35
set iothread->worker_context
36
iothread_stop
37
schedule iothread_stop_bh
38
execute iothread_stop_bh [1]
39
set iothread->running=false
40
(since main_loop==NULL so
41
skip to quit main loop.
42
Note: although main_loop is
43
NULL but worker_context is
44
not!)
45
atomic_read(&iothread->worker_context) [2]
46
create main_loop object
47
g_main_loop_run() [3]
48
pthread_join() [4]
49
50
We can see that when execute iothread_stop_bh() at [1] it's possible
51
that main_loop is still NULL because it's only created until the first
52
check of the worker_context later at [2]. Then the iothread will hang
53
in the main loop [3] and it'll starve the main thread too [4].
54
55
Here the simple solution should be that we check again the "running"
56
variable before check against worker_context.
57
58
CC: Thomas Huth <thuth@redhat.com>
59
CC: Dr. David Alan Gilbert <dgilbert@redhat.com>
60
CC: Stefan Hajnoczi <stefanha@redhat.com>
61
CC: Lukáš Doktor <ldoktor@redhat.com>
62
CC: Markus Armbruster <armbru@redhat.com>
63
CC: Eric Blake <eblake@redhat.com>
64
CC: Paolo Bonzini <pbonzini@redhat.com>
65
Reported-by: Lukáš Doktor <ldoktor@redhat.com>
66
Signed-off-by: Peter Xu <peterx@redhat.com>
67
Tested-by: Thomas Huth <thuth@redhat.com>
68
Message-id: 20190129051432.22023-1-peterx@redhat.com
69
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
18
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
70
---
19
---
71
iothread.c | 6 +++++-
20
Makefile | 6 +++++-
72
1 file changed, 5 insertions(+), 1 deletion(-)
21
1 file changed, 5 insertions(+), 1 deletion(-)
73
22
74
diff --git a/iothread.c b/iothread.c
23
diff --git a/Makefile b/Makefile
75
index XXXXXXX..XXXXXXX 100644
24
index XXXXXXX..XXXXXXX 100644
76
--- a/iothread.c
25
--- a/Makefile
77
+++ b/iothread.c
26
+++ b/Makefile
78
@@ -XXX,XX +XXX,XX @@ static void *iothread_run(void *opaque)
27
@@ -XXX,XX +XXX,XX @@ endif
79
while (iothread->running) {
28
    @$(if $(TARGET_DIRS), \
80
aio_poll(iothread->ctx, true);
29
        echo 'Architecture specific targets:'; \
81
30
        $(foreach t, $(TARGET_DIRS), \
82
- if (atomic_read(&iothread->worker_context)) {
31
-        $(call print-help-run,$(t)/all,Build for $(t));) \
83
+ /*
32
+        $(call print-help-run,$(t)/all,Build for $(t)); \
84
+ * We must check the running state again in case it was
33
+        $(if $(CONFIG_FUZZ), \
85
+ * changed in previous aio_poll()
34
+            $(if $(findstring softmmu,$(t)), \
86
+ */
35
+                $(call print-help-run,$(t)/fuzz,Build fuzzer for $(t)); \
87
+ if (iothread->running && atomic_read(&iothread->worker_context)) {
36
+        ))) \
88
GMainLoop *loop;
37
        echo '')
89
38
    @$(if $(TOOLS), \
90
g_main_context_push_thread_default(iothread->worker_context);
39
        echo 'Tools targets:'; \
91
--
40
--
92
2.20.1
41
2.25.3
93
42
94
diff view generated by jsdifflib
Deleted patch
1
From: Vladimir Sementsov-Ogievskiy <vsementsov@virtuozzo.com>
2
1
3
qemu coroutine command results in following error output:
4
5
Python Exception <class 'gdb.error'> 'arch_prctl' has unknown return
6
type; cast the call to its declared return type: Error occurred in
7
Python command: 'arch_prctl' has unknown return type; cast the call to
8
its declared return type
9
10
Fix it by giving it what it wants: arch_prctl return type.
11
12
Information on the topic:
13
https://sourceware.org/gdb/onlinedocs/gdb/Calling.html
14
15
Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@virtuozzo.com>
16
Message-id: 20190206151425.105871-1-vsementsov@virtuozzo.com
17
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
18
---
19
scripts/qemugdb/coroutine.py | 2 +-
20
1 file changed, 1 insertion(+), 1 deletion(-)
21
22
diff --git a/scripts/qemugdb/coroutine.py b/scripts/qemugdb/coroutine.py
23
index XXXXXXX..XXXXXXX 100644
24
--- a/scripts/qemugdb/coroutine.py
25
+++ b/scripts/qemugdb/coroutine.py
26
@@ -XXX,XX +XXX,XX @@ def get_fs_base():
27
pthread_self().'''
28
# %rsp - 120 is scratch space according to the SystemV ABI
29
old = gdb.parse_and_eval('*(uint64_t*)($rsp - 120)')
30
- gdb.execute('call arch_prctl(0x1003, $rsp - 120)', False, True)
31
+ gdb.execute('call (int)arch_prctl(0x1003, $rsp - 120)', False, True)
32
fs_base = gdb.parse_and_eval('*(uint64_t*)($rsp - 120)')
33
gdb.execute('set *(uint64_t*)($rsp - 120) = %s' % old, False, True)
34
return fs_base
35
--
36
2.20.1
37
38
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
Since configurable features for virtio-blk are growing, this patch
3
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
4
adds host_features field in the struct VirtIOBlock. (as in virtio-net)
4
Message-id: 20200514143433.18569-4-philmd@redhat.com
5
In this way, we can avoid to add new fields for new properties and
6
we can directly set VIRTIO_BLK_F* flags in the host_features.
7
8
We update "config-wce" and "scsi" property definition to use the new
9
host_features field without change the behaviour.
10
11
Suggested-by: Michael S. Tsirkin <mst@redhat.com>
12
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
13
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
14
Acked-by: Pankaj Gupta <pagupta@redhat.com>
15
Message-id: 20190208134950.187665-3-sgarzare@redhat.com
16
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
5
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
17
---
6
---
18
include/hw/virtio/virtio-blk.h | 3 +--
7
tests/qtest/fuzz/i440fx_fuzz.c | 6 +++---
19
hw/block/virtio-blk.c | 16 +++++++++-------
8
1 file changed, 3 insertions(+), 3 deletions(-)
20
2 files changed, 10 insertions(+), 9 deletions(-)
21
9
22
diff --git a/include/hw/virtio/virtio-blk.h b/include/hw/virtio/virtio-blk.h
10
diff --git a/tests/qtest/fuzz/i440fx_fuzz.c b/tests/qtest/fuzz/i440fx_fuzz.c
23
index XXXXXXX..XXXXXXX 100644
11
index XXXXXXX..XXXXXXX 100644
24
--- a/include/hw/virtio/virtio-blk.h
12
--- a/tests/qtest/fuzz/i440fx_fuzz.c
25
+++ b/include/hw/virtio/virtio-blk.h
13
+++ b/tests/qtest/fuzz/i440fx_fuzz.c
26
@@ -XXX,XX +XXX,XX @@ struct VirtIOBlkConf
14
@@ -XXX,XX +XXX,XX @@ static void register_pci_fuzz_targets(void)
27
BlockConf conf;
15
/* Uses simple qtest commands and reboots to reset state */
28
IOThread *iothread;
16
fuzz_add_target(&(FuzzTarget){
29
char *serial;
17
.name = "i440fx-qtest-reboot-fuzz",
30
- uint32_t scsi;
18
- .description = "Fuzz the i440fx using raw qtest commands and"
31
- uint32_t config_wce;
19
+ .description = "Fuzz the i440fx using raw qtest commands and "
32
uint32_t request_merging;
20
"rebooting after each run",
33
uint16_t num_queues;
21
.get_init_cmdline = i440fx_argv,
34
uint16_t queue_size;
22
.fuzz = i440fx_fuzz_qtest});
35
@@ -XXX,XX +XXX,XX @@ typedef struct VirtIOBlock {
23
@@ -XXX,XX +XXX,XX @@ static void register_pci_fuzz_targets(void)
36
bool dataplane_disabled;
24
/* Uses libqos and forks to prevent state leakage */
37
bool dataplane_started;
25
fuzz_add_qos_target(&(FuzzTarget){
38
struct VirtIOBlockDataPlane *dataplane;
26
.name = "i440fx-qos-fork-fuzz",
39
+ uint64_t host_features;
27
- .description = "Fuzz the i440fx using raw qtest commands and"
40
} VirtIOBlock;
28
+ .description = "Fuzz the i440fx using raw qtest commands and "
41
29
"rebooting after each run",
42
typedef struct VirtIOBlockReq {
30
.pre_vm_init = &fork_init,
43
diff --git a/hw/block/virtio-blk.c b/hw/block/virtio-blk.c
31
.fuzz = i440fx_fuzz_qos_fork,},
44
index XXXXXXX..XXXXXXX 100644
32
@@ -XXX,XX +XXX,XX @@ static void register_pci_fuzz_targets(void)
45
--- a/hw/block/virtio-blk.c
46
+++ b/hw/block/virtio-blk.c
47
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_scsi_req(VirtIOBlockReq *req)
48
*/
33
*/
49
scsi = (void *)elem->in_sg[elem->in_num - 2].iov_base;
34
fuzz_add_qos_target(&(FuzzTarget){
50
35
.name = "i440fx-qos-noreset-fuzz",
51
- if (!blk->conf.scsi) {
36
- .description = "Fuzz the i440fx using raw qtest commands and"
52
+ if (!virtio_has_feature(blk->host_features, VIRTIO_BLK_F_SCSI)) {
37
+ .description = "Fuzz the i440fx using raw qtest commands and "
53
status = VIRTIO_BLK_S_UNSUPP;
38
"rebooting after each run",
54
goto fail;
39
.fuzz = i440fx_fuzz_qos,},
55
}
40
"i440FX-pcihost",
56
@@ -XXX,XX +XXX,XX @@ static uint64_t virtio_blk_get_features(VirtIODevice *vdev, uint64_t features,
57
{
58
VirtIOBlock *s = VIRTIO_BLK(vdev);
59
60
+ /* Firstly sync all virtio-blk possible supported features */
61
+ features |= s->host_features;
62
+
63
virtio_add_feature(&features, VIRTIO_BLK_F_SEG_MAX);
64
virtio_add_feature(&features, VIRTIO_BLK_F_GEOMETRY);
65
virtio_add_feature(&features, VIRTIO_BLK_F_TOPOLOGY);
66
virtio_add_feature(&features, VIRTIO_BLK_F_BLK_SIZE);
67
if (virtio_has_feature(features, VIRTIO_F_VERSION_1)) {
68
- if (s->conf.scsi) {
69
+ if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_SCSI)) {
70
error_setg(errp, "Please set scsi=off for virtio-blk devices in order to use virtio 1.0");
71
return 0;
72
}
73
@@ -XXX,XX +XXX,XX @@ static uint64_t virtio_blk_get_features(VirtIODevice *vdev, uint64_t features,
74
virtio_add_feature(&features, VIRTIO_BLK_F_SCSI);
75
}
76
77
- if (s->conf.config_wce) {
78
- virtio_add_feature(&features, VIRTIO_BLK_F_CONFIG_WCE);
79
- }
80
if (blk_enable_write_cache(s->blk)) {
81
virtio_add_feature(&features, VIRTIO_BLK_F_WCE);
82
}
83
@@ -XXX,XX +XXX,XX @@ static Property virtio_blk_properties[] = {
84
DEFINE_BLOCK_ERROR_PROPERTIES(VirtIOBlock, conf.conf),
85
DEFINE_BLOCK_CHS_PROPERTIES(VirtIOBlock, conf.conf),
86
DEFINE_PROP_STRING("serial", VirtIOBlock, conf.serial),
87
- DEFINE_PROP_BIT("config-wce", VirtIOBlock, conf.config_wce, 0, true),
88
+ DEFINE_PROP_BIT64("config-wce", VirtIOBlock, host_features,
89
+ VIRTIO_BLK_F_CONFIG_WCE, true),
90
#ifdef __linux__
91
- DEFINE_PROP_BIT("scsi", VirtIOBlock, conf.scsi, 0, false),
92
+ DEFINE_PROP_BIT64("scsi", VirtIOBlock, host_features,
93
+ VIRTIO_BLK_F_SCSI, false),
94
#endif
95
DEFINE_PROP_BIT("request-merging", VirtIOBlock, conf.request_merging, 0,
96
true),
97
--
41
--
98
2.20.1
42
2.25.3
99
43
100
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
We add acct_failed param in order to use virtio_blk_handle_rw_error()
3
These typedefs are not used. Use a simple structure,
4
also when is not required to call block_acct_failed(). (eg. a discard
4
remote the typedefs.
5
operation is failed)
6
5
7
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
6
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
8
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
7
Message-id: 20200514143433.18569-5-philmd@redhat.com
9
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
10
Acked-by: Pankaj Gupta <pagupta@redhat.com>
11
Message-id: 20190208134950.187665-2-sgarzare@redhat.com
12
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
8
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
13
---
9
---
14
hw/block/virtio-blk.c | 10 ++++++----
10
tests/qtest/fuzz/i440fx_fuzz.c | 10 ++++------
15
1 file changed, 6 insertions(+), 4 deletions(-)
11
1 file changed, 4 insertions(+), 6 deletions(-)
16
12
17
diff --git a/hw/block/virtio-blk.c b/hw/block/virtio-blk.c
13
diff --git a/tests/qtest/fuzz/i440fx_fuzz.c b/tests/qtest/fuzz/i440fx_fuzz.c
18
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
19
--- a/hw/block/virtio-blk.c
15
--- a/tests/qtest/fuzz/i440fx_fuzz.c
20
+++ b/hw/block/virtio-blk.c
16
+++ b/tests/qtest/fuzz/i440fx_fuzz.c
21
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status)
17
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qtest(QTestState *s,
22
}
18
* loop over the Data, breaking it up into actions. each action has an
23
19
* opcode, address offset and value
24
static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error,
20
*/
25
- bool is_read)
21
- typedef struct QTestFuzzAction {
26
+ bool is_read, bool acct_failed)
22
+ struct {
27
{
23
uint8_t opcode;
28
VirtIOBlock *s = req->dev;
24
uint8_t addr;
29
BlockErrorAction action = blk_get_error_action(s->blk, is_read, error);
25
uint32_t value;
30
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error,
26
- } QTestFuzzAction;
31
s->rq = req;
27
- QTestFuzzAction a;
32
} else if (action == BLOCK_ERROR_ACTION_REPORT) {
28
+ } a;
33
virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR);
29
34
- block_acct_failed(blk_get_stats(s->blk), &req->acct);
30
while (Size >= sizeof(a)) {
35
+ if (acct_failed) {
31
/* make a copy of the action so we can normalize the values in-place */
36
+ block_acct_failed(blk_get_stats(s->blk), &req->acct);
32
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qos(QTestState *s,
37
+ }
33
* Same as i440fx_fuzz_qtest, but using QOS. devfn is incorporated into the
38
virtio_blk_free_request(req);
34
* value written over Port IO
35
*/
36
- typedef struct QOSFuzzAction {
37
+ struct {
38
uint8_t opcode;
39
uint8_t offset;
40
int devfn;
41
uint32_t value;
42
- } QOSFuzzAction;
43
+ } a;
44
45
static QPCIBus *bus;
46
if (!bus) {
47
bus = qpci_new_pc(s, fuzz_qos_alloc);
39
}
48
}
40
49
41
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_rw_complete(void *opaque, int ret)
50
- QOSFuzzAction a;
42
* the memory until the request is completed (which will
51
while (Size >= sizeof(a)) {
43
* happen on the other side of the migration).
52
memcpy(&a, Data, sizeof(a));
44
*/
53
switch (a.opcode % ACTION_MAX) {
45
- if (virtio_blk_handle_rw_error(req, -ret, is_read)) {
46
+ if (virtio_blk_handle_rw_error(req, -ret, is_read, true)) {
47
continue;
48
}
49
}
50
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_flush_complete(void *opaque, int ret)
51
52
aio_context_acquire(blk_get_aio_context(s->conf.conf.blk));
53
if (ret) {
54
- if (virtio_blk_handle_rw_error(req, -ret, 0)) {
55
+ if (virtio_blk_handle_rw_error(req, -ret, 0, true)) {
56
goto out;
57
}
58
}
59
--
54
--
60
2.20.1
55
2.25.3
61
56
62
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
The size of data in the virtio_blk_request must be a multiple
3
Extract the generic pciconfig_fuzz_qos() method from
4
of 512 bytes for IN and OUT requests, or a multiple of the size
4
i440fx_fuzz_qos(). This will help to write tests not
5
of struct virtio_blk_discard_write_zeroes for DISCARD and
5
specific to the i440FX controller.
6
WRITE_ZEROES requests.
7
6
8
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
7
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
9
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
8
Message-id: 20200514143433.18569-6-philmd@redhat.com
10
Reviewed-by: Thomas Huth <thuth@redhat.com>
11
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
12
Acked-by: Pankaj Gupta <pagupta@redhat.com>
13
Message-id: 20190208134950.187665-6-sgarzare@redhat.com
14
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
9
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
15
---
10
---
16
tests/virtio-blk-test.c | 15 ++++++++++++++-
11
tests/qtest/fuzz/i440fx_fuzz.c | 20 ++++++++++++++------
17
1 file changed, 14 insertions(+), 1 deletion(-)
12
1 file changed, 14 insertions(+), 6 deletions(-)
18
13
19
diff --git a/tests/virtio-blk-test.c b/tests/virtio-blk-test.c
14
diff --git a/tests/qtest/fuzz/i440fx_fuzz.c b/tests/qtest/fuzz/i440fx_fuzz.c
20
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
21
--- a/tests/virtio-blk-test.c
16
--- a/tests/qtest/fuzz/i440fx_fuzz.c
22
+++ b/tests/virtio-blk-test.c
17
+++ b/tests/qtest/fuzz/i440fx_fuzz.c
23
@@ -XXX,XX +XXX,XX @@ static uint64_t virtio_blk_request(QGuestAllocator *alloc, QVirtioDevice *d,
18
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qtest(QTestState *s,
24
uint64_t addr;
19
flush_events(s);
25
uint8_t status = 0xFF;
20
}
26
21
27
- g_assert_cmpuint(data_size % 512, ==, 0);
22
-static void i440fx_fuzz_qos(QTestState *s,
28
+ switch (req->type) {
23
+static void pciconfig_fuzz_qos(QTestState *s, QPCIBus *bus,
29
+ case VIRTIO_BLK_T_IN:
24
const unsigned char *Data, size_t Size) {
30
+ case VIRTIO_BLK_T_OUT:
25
/*
31
+ g_assert_cmpuint(data_size % 512, ==, 0);
26
* Same as i440fx_fuzz_qtest, but using QOS. devfn is incorporated into the
32
+ break;
27
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qos(QTestState *s,
33
+ case VIRTIO_BLK_T_DISCARD:
28
uint32_t value;
34
+ case VIRTIO_BLK_T_WRITE_ZEROES:
29
} a;
35
+ g_assert_cmpuint(data_size %
30
36
+ sizeof(struct virtio_blk_discard_write_zeroes), ==, 0);
31
- static QPCIBus *bus;
37
+ break;
32
- if (!bus) {
38
+ default:
33
- bus = qpci_new_pc(s, fuzz_qos_alloc);
39
+ g_assert_cmpuint(data_size, ==, 0);
34
- }
35
-
36
while (Size >= sizeof(a)) {
37
memcpy(&a, Data, sizeof(a));
38
switch (a.opcode % ACTION_MAX) {
39
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qos(QTestState *s,
40
flush_events(s);
41
}
42
43
+static void i440fx_fuzz_qos(QTestState *s,
44
+ const unsigned char *Data,
45
+ size_t Size)
46
+{
47
+ static QPCIBus *bus;
48
+
49
+ if (!bus) {
50
+ bus = qpci_new_pc(s, fuzz_qos_alloc);
40
+ }
51
+ }
41
+
52
+
42
addr = guest_alloc(alloc, sizeof(*req) + data_size);
53
+ pciconfig_fuzz_qos(s, bus, Data, Size);
43
54
+}
44
virtio_blk_fix_request(d, req);
55
+
56
static void i440fx_fuzz_qos_fork(QTestState *s,
57
const unsigned char *Data, size_t Size) {
58
if (fork() == 0) {
45
--
59
--
46
2.20.1
60
2.25.3
47
61
48
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
From: Philippe Mathieu-Daudé <philmd@redhat.com>
2
2
3
In order to avoid migration issues, we enable DISCARD and
3
Extract generic ioport_fuzz_qtest() method from
4
WRITE_ZEROES features only for machine type >= 4.0
4
i440fx_fuzz_qtest(). This will help to write tests
5
not specific to the i440FX controller.
5
6
6
As discussed with Michael S. Tsirkin and Stefan Hajnoczi on the
7
Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com>
7
list [1], DISCARD operation should not have security implications
8
Message-id: 20200514143433.18569-7-philmd@redhat.com
8
(eg. page cache attacks), so we can enable it by default.
9
10
[1] https://lists.gnu.org/archive/html/qemu-devel/2019-02/msg00504.html
11
12
Suggested-by: Dr. David Alan Gilbert <dgilbert@redhat.com>
13
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
14
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
15
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
16
Acked-by: Pankaj Gupta <pagupta@redhat.com>
17
Message-id: 20190208134950.187665-4-sgarzare@redhat.com
18
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
9
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
19
---
10
---
20
hw/block/virtio-blk.c | 4 ++++
11
tests/qtest/fuzz/i440fx_fuzz.c | 11 +++++++++--
21
hw/core/machine.c | 2 ++
12
1 file changed, 9 insertions(+), 2 deletions(-)
22
2 files changed, 6 insertions(+)
23
13
24
diff --git a/hw/block/virtio-blk.c b/hw/block/virtio-blk.c
14
diff --git a/tests/qtest/fuzz/i440fx_fuzz.c b/tests/qtest/fuzz/i440fx_fuzz.c
25
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
26
--- a/hw/block/virtio-blk.c
16
--- a/tests/qtest/fuzz/i440fx_fuzz.c
27
+++ b/hw/block/virtio-blk.c
17
+++ b/tests/qtest/fuzz/i440fx_fuzz.c
28
@@ -XXX,XX +XXX,XX @@ static Property virtio_blk_properties[] = {
18
@@ -XXX,XX +XXX,XX @@ enum action_id {
29
DEFINE_PROP_UINT16("queue-size", VirtIOBlock, conf.queue_size, 128),
19
ACTION_MAX
30
DEFINE_PROP_LINK("iothread", VirtIOBlock, conf.iothread, TYPE_IOTHREAD,
31
IOThread *),
32
+ DEFINE_PROP_BIT64("discard", VirtIOBlock, host_features,
33
+ VIRTIO_BLK_F_DISCARD, true),
34
+ DEFINE_PROP_BIT64("write-zeroes", VirtIOBlock, host_features,
35
+ VIRTIO_BLK_F_WRITE_ZEROES, true),
36
DEFINE_PROP_END_OF_LIST(),
37
};
20
};
38
21
39
diff --git a/hw/core/machine.c b/hw/core/machine.c
22
-static void i440fx_fuzz_qtest(QTestState *s,
40
index XXXXXXX..XXXXXXX 100644
23
+static void ioport_fuzz_qtest(QTestState *s,
41
--- a/hw/core/machine.c
24
const unsigned char *Data, size_t Size) {
42
+++ b/hw/core/machine.c
25
/*
43
@@ -XXX,XX +XXX,XX @@ GlobalProperty hw_compat_3_1[] = {
26
* loop over the Data, breaking it up into actions. each action has an
44
{ "usb-kbd", "serial", "42" },
27
@@ -XXX,XX +XXX,XX @@ static void i440fx_fuzz_qtest(QTestState *s,
45
{ "usb-mouse", "serial", "42" },
28
flush_events(s);
46
{ "usb-kbd", "serial", "42" },
29
}
47
+ { "virtio-blk-device", "discard", "false" },
30
48
+ { "virtio-blk-device", "write-zeroes", "false" },
31
+static void i440fx_fuzz_qtest(QTestState *s,
49
};
32
+ const unsigned char *Data,
50
const size_t hw_compat_3_1_len = G_N_ELEMENTS(hw_compat_3_1);
33
+ size_t Size)
51
34
+{
35
+ ioport_fuzz_qtest(s, Data, Size);
36
+}
37
+
38
static void pciconfig_fuzz_qos(QTestState *s, QPCIBus *bus,
39
const unsigned char *Data, size_t Size) {
40
/*
41
- * Same as i440fx_fuzz_qtest, but using QOS. devfn is incorporated into the
42
+ * Same as ioport_fuzz_qtest, but using QOS. devfn is incorporated into the
43
* value written over Port IO
44
*/
45
struct {
52
--
46
--
53
2.20.1
47
2.25.3
54
48
55
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
The io_uring file descriptor monitoring implementation has an internal
2
list of fd handlers that are pending submission to io_uring.
3
fdmon_io_uring_destroy() deletes all fd handlers on the list.
2
4
3
In several part we still using req->dev or VIRTIO_DEVICE(req->dev)
5
Don't delete fd handlers directly in fdmon_io_uring_destroy() for two
4
when we have already defined s and vdev pointers:
6
reasons:
5
VirtIOBlock *s = req->dev;
7
1. This duplicates the aio-posix.c AioHandler deletion code and could
6
VirtIODevice *vdev = VIRTIO_DEVICE(s);
8
become outdated if the struct changes.
9
2. Only handlers with the FDMON_IO_URING_REMOVE flag set are safe to
10
remove. If the flag is not set then something still has a pointer to
11
the fd handler. Let aio-posix.c and its user worry about that. In
12
practice this isn't an issue because fdmon_io_uring_destroy() is only
13
called when shutting down so all users have removed their fd
14
handlers, but the next patch will need this!
7
15
8
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
16
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
9
Reviewed-by: Liam Merwick <liam.merwick@oracle.com>
17
Tested-by: Oleksandr Natalenko <oleksandr@redhat.com>
10
Message-id: 20190208142347.214815-1-sgarzare@redhat.com
18
Message-id: 20200511183630.279750-2-stefanha@redhat.com
11
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
19
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
12
---
20
---
13
hw/block/virtio-blk.c | 22 +++++++++-------------
21
util/aio-posix.c | 1 +
14
1 file changed, 9 insertions(+), 13 deletions(-)
22
util/fdmon-io_uring.c | 13 ++++++++++---
23
2 files changed, 11 insertions(+), 3 deletions(-)
15
24
16
diff --git a/hw/block/virtio-blk.c b/hw/block/virtio-blk.c
25
diff --git a/util/aio-posix.c b/util/aio-posix.c
17
index XXXXXXX..XXXXXXX 100644
26
index XXXXXXX..XXXXXXX 100644
18
--- a/hw/block/virtio-blk.c
27
--- a/util/aio-posix.c
19
+++ b/hw/block/virtio-blk.c
28
+++ b/util/aio-posix.c
20
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status)
29
@@ -XXX,XX +XXX,XX @@ void aio_context_destroy(AioContext *ctx)
21
static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error,
22
bool is_read)
23
{
30
{
24
- BlockErrorAction action = blk_get_error_action(req->dev->blk,
31
fdmon_io_uring_destroy(ctx);
25
- is_read, error);
32
fdmon_epoll_disable(ctx);
26
VirtIOBlock *s = req->dev;
33
+ aio_free_deleted_handlers(ctx);
27
+ BlockErrorAction action = blk_get_error_action(s->blk, is_read, error);
34
}
28
35
29
if (action == BLOCK_ERROR_ACTION_STOP) {
36
void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
30
/* Break the link as the next request is going to be parsed from the
37
diff --git a/util/fdmon-io_uring.c b/util/fdmon-io_uring.c
31
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_flush_complete(void *opaque, int ret)
38
index XXXXXXX..XXXXXXX 100644
32
}
39
--- a/util/fdmon-io_uring.c
33
40
+++ b/util/fdmon-io_uring.c
34
virtio_blk_req_complete(req, VIRTIO_BLK_S_OK);
41
@@ -XXX,XX +XXX,XX @@ void fdmon_io_uring_destroy(AioContext *ctx)
35
- block_acct_done(blk_get_stats(req->dev->blk), &req->acct);
42
36
+ block_acct_done(blk_get_stats(s->blk), &req->acct);
43
io_uring_queue_exit(&ctx->fdmon_io_uring);
37
virtio_blk_free_request(req);
44
38
45
- /* No need to submit these anymore, just free them. */
39
out:
46
+ /* Move handlers due to be removed onto the deleted list */
40
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
47
while ((node = QSLIST_FIRST_RCU(&ctx->submit_list))) {
41
- sizeof(struct virtio_blk_inhdr);
48
+ unsigned flags = atomic_fetch_and(&node->flags,
42
iov_discard_back(in_iov, &in_num, sizeof(struct virtio_blk_inhdr));
49
+ ~(FDMON_IO_URING_PENDING |
43
50
+ FDMON_IO_URING_ADD |
44
- type = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type);
51
+ FDMON_IO_URING_REMOVE));
45
+ type = virtio_ldl_p(vdev, &req->out.type);
52
+
46
53
+ if (flags & FDMON_IO_URING_REMOVE) {
47
/* VIRTIO_BLK_T_OUT defines the command direction. VIRTIO_BLK_T_BARRIER
54
+ QLIST_INSERT_HEAD_RCU(&ctx->deleted_aio_handlers, node, node_deleted);
48
* is an optional flag. Although a guest should not send this flag if
55
+ }
49
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
56
+
50
case VIRTIO_BLK_T_IN:
57
QSLIST_REMOVE_HEAD_RCU(&ctx->submit_list, node_submitted);
51
{
58
- QLIST_REMOVE(node, node);
52
bool is_write = type & VIRTIO_BLK_T_OUT;
59
- g_free(node);
53
- req->sector_num = virtio_ldq_p(VIRTIO_DEVICE(req->dev),
54
- &req->out.sector);
55
+ req->sector_num = virtio_ldq_p(vdev, &req->out.sector);
56
57
if (is_write) {
58
qemu_iovec_init_external(&req->qiov, out_iov, out_num);
59
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
60
req->qiov.size / BDRV_SECTOR_SIZE);
61
}
60
}
62
61
63
- if (!virtio_blk_sect_range_ok(req->dev, req->sector_num,
62
ctx->fdmon_ops = &fdmon_poll_ops;
64
- req->qiov.size)) {
65
+ if (!virtio_blk_sect_range_ok(s, req->sector_num, req->qiov.size)) {
66
virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR);
67
- block_acct_invalid(blk_get_stats(req->dev->blk),
68
+ block_acct_invalid(blk_get_stats(s->blk),
69
is_write ? BLOCK_ACCT_WRITE : BLOCK_ACCT_READ);
70
virtio_blk_free_request(req);
71
return 0;
72
}
73
74
- block_acct_start(blk_get_stats(req->dev->blk),
75
- &req->acct, req->qiov.size,
76
+ block_acct_start(blk_get_stats(s->blk), &req->acct, req->qiov.size,
77
is_write ? BLOCK_ACCT_WRITE : BLOCK_ACCT_READ);
78
79
/* merge would exceed maximum number of requests or IO direction
80
* changes */
81
if (mrb->num_reqs > 0 && (mrb->num_reqs == VIRTIO_BLK_MAX_MERGE_REQS ||
82
is_write != mrb->is_write ||
83
- !req->dev->conf.request_merging)) {
84
- virtio_blk_submit_multireq(req->dev->blk, mrb);
85
+ !s->conf.request_merging)) {
86
+ virtio_blk_submit_multireq(s->blk, mrb);
87
}
88
89
assert(mrb->num_reqs < VIRTIO_BLK_MAX_MERGE_REQS);
90
--
63
--
91
2.20.1
64
2.25.3
92
65
93
diff view generated by jsdifflib
1
From: Stefano Garzarella <sgarzare@redhat.com>
1
The glib event loop does not call fdmon_io_uring_wait() so fd handlers
2
waiting to be submitted build up in the list. There is no benefit is
3
using io_uring when the glib GSource is being used, so disable it
4
instead of implementing a more complex fix.
2
5
3
This patch adds the support of DISCARD and WRITE_ZEROES commands,
6
This fixes a memory leak where AioHandlers would build up and increasing
4
that have been introduced in the virtio-blk protocol to have
7
amounts of CPU time were spent iterating them in aio_pending(). The
5
better performance when using SSD backend.
8
symptom is that guests become slow when QEMU is built with io_uring
9
support.
6
10
7
We support only one segment per request since multiple segments
11
Buglink: https://bugs.launchpad.net/qemu/+bug/1877716
8
are not widely used and there are no userspace APIs that allow
12
Fixes: 73fd282e7b6dd4e4ea1c3bbb3d302c8db51e4ccf ("aio-posix: add io_uring fd monitoring implementation")
9
applications to submit multiple segments in a single call.
13
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
10
14
Tested-by: Oleksandr Natalenko <oleksandr@redhat.com>
11
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
15
Message-id: 20200511183630.279750-3-stefanha@redhat.com
12
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
13
Signed-off-by: Stefano Garzarella <sgarzare@redhat.com>
14
Acked-by: Pankaj Gupta <pagupta@redhat.com>
15
Message-id: 20190208134950.187665-5-sgarzare@redhat.com
16
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
16
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
17
---
17
---
18
include/hw/virtio/virtio-blk.h | 2 +
18
include/block/aio.h | 3 +++
19
hw/block/virtio-blk.c | 184 +++++++++++++++++++++++++++++++++
19
util/aio-posix.c | 12 ++++++++++++
20
2 files changed, 186 insertions(+)
20
util/aio-win32.c | 4 ++++
21
util/async.c | 1 +
22
4 files changed, 20 insertions(+)
21
23
22
diff --git a/include/hw/virtio/virtio-blk.h b/include/hw/virtio/virtio-blk.h
24
diff --git a/include/block/aio.h b/include/block/aio.h
23
index XXXXXXX..XXXXXXX 100644
25
index XXXXXXX..XXXXXXX 100644
24
--- a/include/hw/virtio/virtio-blk.h
26
--- a/include/block/aio.h
25
+++ b/include/hw/virtio/virtio-blk.h
27
+++ b/include/block/aio.h
26
@@ -XXX,XX +XXX,XX @@ struct VirtIOBlkConf
28
@@ -XXX,XX +XXX,XX @@ void aio_context_setup(AioContext *ctx);
27
uint32_t request_merging;
29
*/
28
uint16_t num_queues;
30
void aio_context_destroy(AioContext *ctx);
29
uint16_t queue_size;
31
30
+ uint32_t max_discard_sectors;
32
+/* Used internally, do not call outside AioContext code */
31
+ uint32_t max_write_zeroes_sectors;
33
+void aio_context_use_g_source(AioContext *ctx);
32
};
34
+
33
35
/**
34
struct VirtIOBlockDataPlane;
36
* aio_context_set_poll_params:
35
diff --git a/hw/block/virtio-blk.c b/hw/block/virtio-blk.c
37
* @ctx: the aio context
38
diff --git a/util/aio-posix.c b/util/aio-posix.c
36
index XXXXXXX..XXXXXXX 100644
39
index XXXXXXX..XXXXXXX 100644
37
--- a/hw/block/virtio-blk.c
40
--- a/util/aio-posix.c
38
+++ b/hw/block/virtio-blk.c
41
+++ b/util/aio-posix.c
39
@@ -XXX,XX +XXX,XX @@ out:
42
@@ -XXX,XX +XXX,XX @@ void aio_context_destroy(AioContext *ctx)
40
aio_context_release(blk_get_aio_context(s->conf.conf.blk));
43
aio_free_deleted_handlers(ctx);
41
}
44
}
42
45
43
+static void virtio_blk_discard_write_zeroes_complete(void *opaque, int ret)
46
+void aio_context_use_g_source(AioContext *ctx)
44
+{
47
+{
45
+ VirtIOBlockReq *req = opaque;
48
+ /*
46
+ VirtIOBlock *s = req->dev;
49
+ * Disable io_uring when the glib main loop is used because it doesn't
47
+ bool is_write_zeroes = (virtio_ldl_p(VIRTIO_DEVICE(s), &req->out.type) &
50
+ * support mixed glib/aio_poll() usage. It relies on aio_poll() being
48
+ ~VIRTIO_BLK_T_BARRIER) == VIRTIO_BLK_T_WRITE_ZEROES;
51
+ * called regularly so that changes to the monitored file descriptors are
49
+
52
+ * submitted, otherwise a list of pending fd handlers builds up.
50
+ aio_context_acquire(blk_get_aio_context(s->conf.conf.blk));
53
+ */
51
+ if (ret) {
54
+ fdmon_io_uring_destroy(ctx);
52
+ if (virtio_blk_handle_rw_error(req, -ret, false, is_write_zeroes)) {
55
+ aio_free_deleted_handlers(ctx);
53
+ goto out;
54
+ }
55
+ }
56
+
57
+ virtio_blk_req_complete(req, VIRTIO_BLK_S_OK);
58
+ if (is_write_zeroes) {
59
+ block_acct_done(blk_get_stats(s->blk), &req->acct);
60
+ }
61
+ virtio_blk_free_request(req);
62
+
63
+out:
64
+ aio_context_release(blk_get_aio_context(s->conf.conf.blk));
65
+}
56
+}
66
+
57
+
67
#ifdef __linux__
58
void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
68
59
int64_t grow, int64_t shrink, Error **errp)
69
typedef struct {
60
{
70
@@ -XXX,XX +XXX,XX @@ static bool virtio_blk_sect_range_ok(VirtIOBlock *dev,
61
diff --git a/util/aio-win32.c b/util/aio-win32.c
71
return true;
62
index XXXXXXX..XXXXXXX 100644
63
--- a/util/aio-win32.c
64
+++ b/util/aio-win32.c
65
@@ -XXX,XX +XXX,XX @@ void aio_context_destroy(AioContext *ctx)
66
{
72
}
67
}
73
68
74
+static uint8_t virtio_blk_handle_discard_write_zeroes(VirtIOBlockReq *req,
69
+void aio_context_use_g_source(AioContext *ctx)
75
+ struct virtio_blk_discard_write_zeroes *dwz_hdr, bool is_write_zeroes)
76
+{
70
+{
77
+ VirtIOBlock *s = req->dev;
78
+ VirtIODevice *vdev = VIRTIO_DEVICE(s);
79
+ uint64_t sector;
80
+ uint32_t num_sectors, flags, max_sectors;
81
+ uint8_t err_status;
82
+ int bytes;
83
+
84
+ sector = virtio_ldq_p(vdev, &dwz_hdr->sector);
85
+ num_sectors = virtio_ldl_p(vdev, &dwz_hdr->num_sectors);
86
+ flags = virtio_ldl_p(vdev, &dwz_hdr->flags);
87
+ max_sectors = is_write_zeroes ? s->conf.max_write_zeroes_sectors :
88
+ s->conf.max_discard_sectors;
89
+
90
+ /*
91
+ * max_sectors is at most BDRV_REQUEST_MAX_SECTORS, this check
92
+ * make us sure that "num_sectors << BDRV_SECTOR_BITS" can fit in
93
+ * the integer variable.
94
+ */
95
+ if (unlikely(num_sectors > max_sectors)) {
96
+ err_status = VIRTIO_BLK_S_IOERR;
97
+ goto err;
98
+ }
99
+
100
+ bytes = num_sectors << BDRV_SECTOR_BITS;
101
+
102
+ if (unlikely(!virtio_blk_sect_range_ok(s, sector, bytes))) {
103
+ err_status = VIRTIO_BLK_S_IOERR;
104
+ goto err;
105
+ }
106
+
107
+ /*
108
+ * The device MUST set the status byte to VIRTIO_BLK_S_UNSUPP for discard
109
+ * and write zeroes commands if any unknown flag is set.
110
+ */
111
+ if (unlikely(flags & ~VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP)) {
112
+ err_status = VIRTIO_BLK_S_UNSUPP;
113
+ goto err;
114
+ }
115
+
116
+ if (is_write_zeroes) { /* VIRTIO_BLK_T_WRITE_ZEROES */
117
+ int blk_aio_flags = 0;
118
+
119
+ if (flags & VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP) {
120
+ blk_aio_flags |= BDRV_REQ_MAY_UNMAP;
121
+ }
122
+
123
+ block_acct_start(blk_get_stats(s->blk), &req->acct, bytes,
124
+ BLOCK_ACCT_WRITE);
125
+
126
+ blk_aio_pwrite_zeroes(s->blk, sector << BDRV_SECTOR_BITS,
127
+ bytes, blk_aio_flags,
128
+ virtio_blk_discard_write_zeroes_complete, req);
129
+ } else { /* VIRTIO_BLK_T_DISCARD */
130
+ /*
131
+ * The device MUST set the status byte to VIRTIO_BLK_S_UNSUPP for
132
+ * discard commands if the unmap flag is set.
133
+ */
134
+ if (unlikely(flags & VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP)) {
135
+ err_status = VIRTIO_BLK_S_UNSUPP;
136
+ goto err;
137
+ }
138
+
139
+ blk_aio_pdiscard(s->blk, sector << BDRV_SECTOR_BITS, bytes,
140
+ virtio_blk_discard_write_zeroes_complete, req);
141
+ }
142
+
143
+ return VIRTIO_BLK_S_OK;
144
+
145
+err:
146
+ if (is_write_zeroes) {
147
+ block_acct_invalid(blk_get_stats(s->blk), BLOCK_ACCT_WRITE);
148
+ }
149
+ return err_status;
150
+}
71
+}
151
+
72
+
152
static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
73
void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
74
int64_t grow, int64_t shrink, Error **errp)
153
{
75
{
154
uint32_t type;
76
diff --git a/util/async.c b/util/async.c
155
@@ -XXX,XX +XXX,XX @@ static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
77
index XXXXXXX..XXXXXXX 100644
156
virtio_blk_free_request(req);
78
--- a/util/async.c
157
break;
79
+++ b/util/async.c
158
}
80
@@ -XXX,XX +XXX,XX @@ static GSourceFuncs aio_source_funcs = {
159
+ /*
81
160
+ * VIRTIO_BLK_T_DISCARD and VIRTIO_BLK_T_WRITE_ZEROES are defined with
82
GSource *aio_get_g_source(AioContext *ctx)
161
+ * VIRTIO_BLK_T_OUT flag set. We masked this flag in the switch statement,
83
{
162
+ * so we must mask it for these requests, then we will check if it is set.
84
+ aio_context_use_g_source(ctx);
163
+ */
85
g_source_ref(&ctx->source);
164
+ case VIRTIO_BLK_T_DISCARD & ~VIRTIO_BLK_T_OUT:
86
return &ctx->source;
165
+ case VIRTIO_BLK_T_WRITE_ZEROES & ~VIRTIO_BLK_T_OUT:
166
+ {
167
+ struct virtio_blk_discard_write_zeroes dwz_hdr;
168
+ size_t out_len = iov_size(out_iov, out_num);
169
+ bool is_write_zeroes = (type & ~VIRTIO_BLK_T_BARRIER) ==
170
+ VIRTIO_BLK_T_WRITE_ZEROES;
171
+ uint8_t err_status;
172
+
173
+ /*
174
+ * Unsupported if VIRTIO_BLK_T_OUT is not set or the request contains
175
+ * more than one segment.
176
+ */
177
+ if (unlikely(!(type & VIRTIO_BLK_T_OUT) ||
178
+ out_len > sizeof(dwz_hdr))) {
179
+ virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP);
180
+ virtio_blk_free_request(req);
181
+ return 0;
182
+ }
183
+
184
+ if (unlikely(iov_to_buf(out_iov, out_num, 0, &dwz_hdr,
185
+ sizeof(dwz_hdr)) != sizeof(dwz_hdr))) {
186
+ virtio_error(vdev, "virtio-blk discard/write_zeroes header"
187
+ " too short");
188
+ return -1;
189
+ }
190
+
191
+ err_status = virtio_blk_handle_discard_write_zeroes(req, &dwz_hdr,
192
+ is_write_zeroes);
193
+ if (err_status != VIRTIO_BLK_S_OK) {
194
+ virtio_blk_req_complete(req, err_status);
195
+ virtio_blk_free_request(req);
196
+ }
197
+
198
+ break;
199
+ }
200
default:
201
virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP);
202
virtio_blk_free_request(req);
203
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config)
204
blkcfg.alignment_offset = 0;
205
blkcfg.wce = blk_enable_write_cache(s->blk);
206
virtio_stw_p(vdev, &blkcfg.num_queues, s->conf.num_queues);
207
+ if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_DISCARD)) {
208
+ virtio_stl_p(vdev, &blkcfg.max_discard_sectors,
209
+ s->conf.max_discard_sectors);
210
+ virtio_stl_p(vdev, &blkcfg.discard_sector_alignment,
211
+ blk_size >> BDRV_SECTOR_BITS);
212
+ /*
213
+ * We support only one segment per request since multiple segments
214
+ * are not widely used and there are no userspace APIs that allow
215
+ * applications to submit multiple segments in a single call.
216
+ */
217
+ virtio_stl_p(vdev, &blkcfg.max_discard_seg, 1);
218
+ }
219
+ if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_WRITE_ZEROES)) {
220
+ virtio_stl_p(vdev, &blkcfg.max_write_zeroes_sectors,
221
+ s->conf.max_write_zeroes_sectors);
222
+ blkcfg.write_zeroes_may_unmap = 1;
223
+ virtio_stl_p(vdev, &blkcfg.max_write_zeroes_seg, 1);
224
+ }
225
memcpy(config, &blkcfg, sizeof(struct virtio_blk_config));
226
}
87
}
227
228
@@ -XXX,XX +XXX,XX @@ static void virtio_blk_device_realize(DeviceState *dev, Error **errp)
229
return;
230
}
231
232
+ if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_DISCARD) &&
233
+ (!conf->max_discard_sectors ||
234
+ conf->max_discard_sectors > BDRV_REQUEST_MAX_SECTORS)) {
235
+ error_setg(errp, "invalid max-discard-sectors property (%" PRIu32 ")"
236
+ ", must be between 1 and %d",
237
+ conf->max_discard_sectors, (int)BDRV_REQUEST_MAX_SECTORS);
238
+ return;
239
+ }
240
+
241
+ if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_WRITE_ZEROES) &&
242
+ (!conf->max_write_zeroes_sectors ||
243
+ conf->max_write_zeroes_sectors > BDRV_REQUEST_MAX_SECTORS)) {
244
+ error_setg(errp, "invalid max-write-zeroes-sectors property (%" PRIu32
245
+ "), must be between 1 and %d",
246
+ conf->max_write_zeroes_sectors,
247
+ (int)BDRV_REQUEST_MAX_SECTORS);
248
+ return;
249
+ }
250
+
251
virtio_init(vdev, "virtio-blk", VIRTIO_ID_BLOCK,
252
sizeof(struct virtio_blk_config));
253
254
@@ -XXX,XX +XXX,XX @@ static Property virtio_blk_properties[] = {
255
VIRTIO_BLK_F_DISCARD, true),
256
DEFINE_PROP_BIT64("write-zeroes", VirtIOBlock, host_features,
257
VIRTIO_BLK_F_WRITE_ZEROES, true),
258
+ DEFINE_PROP_UINT32("max-discard-sectors", VirtIOBlock,
259
+ conf.max_discard_sectors, BDRV_REQUEST_MAX_SECTORS),
260
+ DEFINE_PROP_UINT32("max-write-zeroes-sectors", VirtIOBlock,
261
+ conf.max_write_zeroes_sectors, BDRV_REQUEST_MAX_SECTORS),
262
DEFINE_PROP_END_OF_LIST(),
263
};
264
265
--
88
--
266
2.20.1
89
2.25.3
267
90
268
diff view generated by jsdifflib