Series comparison

-[Qemu-devel] [PULL 0/8] Block patches
+[PULL 0/3] Block patches
-The following changes since commit 812b835fb4d23dd108b2f9802158472d50b73579:
+The following changes since commit 9cf289af47bcfae5c75de37d8e5d6fd23705322c:
-  Merge remote-tracking branch 'remotes/maxreitz/tags/pull-block-2019-05-07' into staging (2019-05-09 16:31:12 +0100)
+  Merge tag 'qga-pull-request' of gitlab.com:marcandre.lureau/qemu into staging (2022-05-04 03:42:49 -0700)
 are available in the Git repository at:
-  https://github.com/stefanha/qemu.git tags/block-pull-request
+  https://gitlab.com/stefanha/qemu.git tags/block-pull-request
-for you to fetch changes up to e84125761f78919fe63616d9888ea45e72dc956f:
+for you to fetch changes up to bef2e050d6a7feb865854c65570c496ac5a8cf53:
-  docs: add Security chapter to the documentation (2019-05-10 10:53:52 +0100)
+  util/event-loop-base: Introduce options to set the thread pool size (2022-05-04 17:02:19 +0100)
 ----------------------------------------------------------------
 Pull request
+Add new thread-pool-min/thread-pool-max parameters to control the thread pool
+used for async I/O.
 ----------------------------------------------------------------
-Andrey Shinkevich (1):
+Nicolas Saenz Julienne (3):
-  block/io.c: fix for the allocation failure
+  Introduce event-loop-base abstract class
   util/main-loop: Introduce the main loop into QOM
   util/event-loop-base: Introduce options to set the thread pool size
-Jules Irenge (3):
+ qapi/qom.json                    |  43 ++++++++--
-  util/readline: add a space to fix errors by checkpatch tool
+ meson.build                      |  26 +++---
-  util: readline: replace tab indent by four spaces to fix checkpatch
+ include/block/aio.h              |  10 +++
-    errors
+ include/block/thread-pool.h      |   3 +
-  util/readline: Add braces to fix checkpatch errors
+ include/qemu/main-loop.h         |  10 +++
+ include/sysemu/event-loop-base.h |  41 +++++++++
-Nikita Alekseev (1):
+ include/sysemu/iothread.h        |   6 +-
-  block: Add coroutine_fn to bdrv_check_co_entry
+ event-loop-base.c                | 140 +++++++++++++++++++++++++++++++
+ iothread.c                       |  68 +++++----------
-Paolo Bonzini (1):
+ util/aio-posix.c                 |   1 +
-  aio-posix: ensure poll mode is left when aio_notify is called
+ util/async.c                     |  20 +++++
+ util/main-loop.c                 |  65 ++++++++++++++
-Stefan Hajnoczi (2):
+ util/thread-pool.c               |  55 +++++++++++-
-  docs: add Secure Coding Practices to developer docs
+files changed, 419 insertions(+), 69 deletions(-)
-  docs: add Security chapter to the documentation
+ create mode 100644 include/sysemu/event-loop-base.h
+ create mode 100644 event-loop-base.c
  Makefile                               |   2 +-
  block.c                                |   2 +-
  block/io.c                             |   2 +-
  util/aio-posix.c                       |  12 +-
  util/readline.c                        | 174 ++++++++++++++-----------
  docs/devel/index.rst                   |   1 +
  docs/devel/secure-coding-practices.rst | 106 +++++++++++++++
  docs/security.texi                     | 131 +++++++++++++++++++
  qemu-doc.texi                          |   3 +
 files changed, 347 insertions(+), 86 deletions(-)
  create mode 100644 docs/devel/secure-coding-practices.rst
  create mode 100644 docs/security.texi
 --
-.21.0
+.35.1

-[Qemu-devel] [PULL 1/8] util/readline: add a space to fix errors by checkpatch tool
+Deleted patch
-From: Jules Irenge <jbi.octave@gmail.com>
-util/readline: add a space to fix errors reported by checkpatch.pl tool
-"ERROR: space required before the open parenthesis"
-"ERROR: space required after that ..."
-within "util/readline.c" file
-Signed-off-by: Jules Irenge <jbi.octave@gmail.com>
-Reviewed-by: Thomas Huth <thuth@redhat.com>
-Message-id: 20190401024406.10819-2-jbi.octave@gmail.com
-Message-Id: <20190401024406.10819-2-jbi.octave@gmail.com>
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
----
- util/readline.c | 34 +++++++++++++++++-----------------
-file changed, 17 insertions(+), 17 deletions(-)
-diff --git a/util/readline.c b/util/readline.c
-index XXXXXXX..XXXXXXX 100644
---- a/util/readline.c
-+++ b/util/readline.c
-@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
-     if (rs->cmd_buf_size != rs->last_cmd_buf_size ||
-         memcmp(rs->cmd_buf, rs->last_cmd_buf, rs->cmd_buf_size) != 0) {
--        for(i = 0; i < rs->last_cmd_buf_index; i++) {
-+        for (i = 0; i < rs->last_cmd_buf_index; i++) {
-             rs->printf_func(rs->opaque, "\033[D");
-         }
-         rs->cmd_buf[rs->cmd_buf_size] = '\0';
-         if (rs->read_password) {
-             len = strlen(rs->cmd_buf);
--            for(i = 0; i < len; i++)
-+            for (i = 0; i < len; i++)
-                 rs->printf_func(rs->opaque, "*");
-         } else {
-             rs->printf_func(rs->opaque, "%s", rs->cmd_buf);
-@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
-     if (rs->cmd_buf_index != rs->last_cmd_buf_index) {
-         delta = rs->cmd_buf_index - rs->last_cmd_buf_index;
-         if (delta > 0) {
--            for(i = 0;i < delta; i++) {
-+            for (i = 0; i < delta; i++) {
-                 rs->printf_func(rs->opaque, "\033[C");
-             }
-         } else {
-             delta = -delta;
--            for(i = 0;i < delta; i++) {
-+            for (i = 0; i < delta; i++) {
-                 rs->printf_func(rs->opaque, "\033[D");
-             }
-         }
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-         return;
-     if (rs->nb_completions == 1) {
-         len = strlen(rs->completions[0]);
--        for(i = rs->completion_index; i < len; i++) {
-+        for (i = rs->completion_index; i < len; i++) {
-             readline_insert_char(rs, rs->completions[0][i]);
-         }
-         /* extra space for next argument. XXX: make it more generic */
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-               completion_comp);
-         rs->printf_func(rs->opaque, "\n");
-         max_width = 0;
--        max_prefix = 0;
--        for(i = 0; i < rs->nb_completions; i++) {
-+        max_prefix = 0;
-+        for (i = 0; i < rs->nb_completions; i++) {
-             len = strlen(rs->completions[i]);
--            if (i==0) {
-+            if (i == 0) {
-                 max_prefix = len;
-             } else {
-                 if (len < max_prefix)
-                     max_prefix = len;
--                for(j=0; j<max_prefix; j++) {
-+                for (j = 0; j < max_prefix; j++) {
-                     if (rs->completions[i][j] != rs->completions[0][j])
-                         max_prefix = j;
-                 }
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-             if (len > max_width)
-                 max_width = len;
-         }
--        if (max_prefix > 0)
--            for(i = rs->completion_index; i < max_prefix; i++) {
-+        if (max_prefix > 0)
-+            for (i = rs->completion_index; i < max_prefix; i++) {
-                 readline_insert_char(rs, rs->completions[0][i]);
-             }
-         max_width += 2;
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-             max_width = 80;
-         nb_cols = 80 / max_width;
-         j = 0;
--        for(i = 0; i < rs->nb_completions; i++) {
-+        for (i = 0; i < rs->nb_completions; i++) {
-             rs->printf_func(rs->opaque, "%-*s", max_width, rs->completions[i]);
-             if (++j == nb_cols || i == (rs->nb_completions - 1)) {
-                 rs->printf_func(rs->opaque, "\n");
-@@ -XXX,XX +XXX,XX @@ static void readline_clear_screen(ReadLineState *rs)
- /* return true if command handled */
- void readline_handle_byte(ReadLineState *rs, int ch)
- {
--    switch(rs->esc_state) {
-+    switch (rs->esc_state) {
-     case IS_NORM:
--        switch(ch) {
-+        switch (ch) {
-         case 1:
-             readline_bol(rs);
-             break;
-@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
-         }
-         break;
-     case IS_CSI:
--        switch(ch) {
-+        switch (ch) {
-     case 'A':
-     case 'F':
-         readline_up_char(rs);
-@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
-             rs->esc_param = rs->esc_param * 10 + (ch - '0');
-             goto the_end;
-         case '~':
--            switch(rs->esc_param) {
-+            switch (rs->esc_param) {
-             case 1:
-                 readline_bol(rs);
-                 break;
-@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
-     the_end:
-         break;
-     case IS_SS3:
--        switch(ch) {
-+        switch (ch) {
-         case 'F':
-             readline_eol(rs);
-             break;
---
-.21.0

-[Qemu-devel] [PULL 8/8] docs: add Security chapter to the documentation
+[PULL 1/3] Introduce event-loop-base abstract class
-This new chapter in the QEMU documentation covers the security
+From: Nicolas Saenz Julienne <nsaenzju@redhat.com>
-requirements that QEMU is designed to meet and principles for securely
-deploying QEMU.
+Introduce the 'event-loop-base' abstract class, it'll hold the
+properties common to all event loops and provide the necessary hooks for
-It is just a starting point that can be extended in the future with more
+their creation and maintenance. Then have iothread inherit from it.
-information.
+EventLoopBaseClass is defined as user creatable and provides a hook for
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
+its children to attach themselves to the user creatable class 'complete'
-Acked-by: Stefano Garzarella <sgarzare@redhat.com>
+function. It also provides an update_params() callback to propagate
-Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
+property changes onto its children.
-Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
-Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
+The new 'event-loop-base' class will live in the root directory. It is
-Reviewed-by: Li Qiang <liq3ea@gmail.com>
+built on its own using the 'link_whole' option (there are no direct
-Message-id: 20190509121820.16294-3-stefanha@redhat.com
+function dependencies between the class and its children, it all happens
-Message-Id: <20190509121820.16294-3-stefanha@redhat.com>
+through 'constructor' magic). And also imposes new compilation
 dependencies:
     qom <- event-loop-base <- blockdev (iothread.c)
 And in subsequent patches:
     qom <- event-loop-base <- qemuutil (util/main-loop.c)
 All this forced some amount of reordering in meson.build:
  - Moved qom build definition before qemuutil. Doing it the other way
    around (i.e. moving qemuutil after qom) isn't possible as a lot of
    core libraries that live in between the two depend on it.
  - Process the 'hw' subdir earlier, as it introduces files into the
    'qom' source set.
 No functional changes intended.
 Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
 Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
 Acked-by: Markus Armbruster <armbru@redhat.com>
 Message-id: 20220425075723.20019-2-nsaenzju@redhat.com
 Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
 ---
- Makefile           |   2 +-
+ qapi/qom.json                    |  22 +++++--
- docs/security.texi | 131 +++++++++++++++++++++++++++++++++++++++++++++
+ meson.build                      |  23 ++++---
- qemu-doc.texi      |   3 ++
+ include/sysemu/event-loop-base.h |  36 +++++++++++
-files changed, 135 insertions(+), 1 deletion(-)
+ include/sysemu/iothread.h        |   6 +-
- create mode 100644 docs/security.texi
+ event-loop-base.c                | 104 +++++++++++++++++++++++++++++++
+ iothread.c                       |  65 ++++++-------------
-diff --git a/Makefile b/Makefile
+files changed, 192 insertions(+), 64 deletions(-)
  create mode 100644 include/sysemu/event-loop-base.h
  create mode 100644 event-loop-base.c
 diff --git a/qapi/qom.json b/qapi/qom.json
 index XXXXXXX..XXXXXXX 100644
---- a/Makefile
+--- a/qapi/qom.json
-+++ b/Makefile
++++ b/qapi/qom.json
-@@ -XXX,XX +XXX,XX @@ qemu-doc.html qemu-doc.info qemu-doc.pdf qemu-doc.txt: \
+@@ -XXX,XX +XXX,XX @@
-     qemu-img.texi qemu-nbd.texi qemu-options.texi qemu-option-trace.texi \
+             '*repeat': 'bool',
-     qemu-deprecated.texi qemu-monitor.texi qemu-img-cmds.texi qemu-ga.texi \
+             '*grab-toggle': 'GrabToggleKeys' } }
-     qemu-monitor-info.texi docs/qemu-block-drivers.texi \
--    docs/qemu-cpu-models.texi
++##
-+    docs/qemu-cpu-models.texi docs/security.texi
++# @EventLoopBaseProperties:
++#
- docs/interop/qemu-ga-ref.dvi docs/interop/qemu-ga-ref.html \
++# Common properties for event loops
-     docs/interop/qemu-ga-ref.info docs/interop/qemu-ga-ref.pdf \
++#
-diff --git a/docs/security.texi b/docs/security.texi
++# @aio-max-batch: maximum number of requests in a batch for the AIO engine,
 +#                 0 means that the engine will use its default.
 +#                 (default: 0)
 +#
 +# Since: 7.1
 +##
 +{ 'struct': 'EventLoopBaseProperties',
 +  'data': { '*aio-max-batch': 'int' } }
 +
  ##
  # @IothreadProperties:
  #
@@ -XXX,XX +XXX,XX @@
  #               algorithm detects it is spending too long polling without
  #               encountering events. 0 selects a default behaviour (default: 0)
  #
 -# @aio-max-batch: maximum number of requests in a batch for the AIO engine,
 -#                 0 means that the engine will use its default
 -#                 (default:0, since 6.1)
 +# The @aio-max-batch option is available since 6.1.
  #
  # Since: 2.0
  ##
  { 'struct': 'IothreadProperties',
 +  'base': 'EventLoopBaseProperties',
    'data': { '*poll-max-ns': 'int',
              '*poll-grow': 'int',
 -            '*poll-shrink': 'int',
 -            '*aio-max-batch': 'int' } }
 +            '*poll-shrink': 'int' } }
  ##
  # @MemoryBackendProperties:
 diff --git a/meson.build b/meson.build
 index XXXXXXX..XXXXXXX 100644
 --- a/meson.build
 +++ b/meson.build
@@ -XXX,XX +XXX,XX @@ subdir('qom')
  subdir('authz')
  subdir('crypto')
  subdir('ui')
 +subdir('hw')
  if enable_modules
@@ -XXX,XX +XXX,XX @@ if enable_modules
    modulecommon = declare_dependency(link_whole: libmodulecommon, compile_args: '-DBUILD_DSO')
  endif
 +qom_ss = qom_ss.apply(config_host, strict: false)
 +libqom = static_library('qom', qom_ss.sources() + genh,
 +                        dependencies: [qom_ss.dependencies()],
 +                        name_suffix: 'fa')
 +qom = declare_dependency(link_whole: libqom)
 +
 +event_loop_base = files('event-loop-base.c')
 +event_loop_base = static_library('event-loop-base', sources: event_loop_base + genh,
 +                                 build_by_default: true)
 +event_loop_base = declare_dependency(link_whole: event_loop_base,
 +                                     dependencies: [qom])
 +
  stub_ss = stub_ss.apply(config_all, strict: false)
  util_ss.add_all(trace_ss)
@@ -XXX,XX +XXX,XX @@ subdir('monitor')
  subdir('net')
  subdir('replay')
  subdir('semihosting')
 -subdir('hw')
  subdir('tcg')
  subdir('fpu')
  subdir('accel')
@@ -XXX,XX +XXX,XX @@ qemu_syms = custom_target('qemu.syms', output: 'qemu.syms',
                               capture: true,
                               command: [undefsym, nm, '@INPUT@'])
 -qom_ss = qom_ss.apply(config_host, strict: false)
 -libqom = static_library('qom', qom_ss.sources() + genh,
 -                        dependencies: [qom_ss.dependencies()],
 -                        name_suffix: 'fa')
 -
 -qom = declare_dependency(link_whole: libqom)
 -
  authz_ss = authz_ss.apply(config_host, strict: false)
  libauthz = static_library('authz', authz_ss.sources() + genh,
                            dependencies: [authz_ss.dependencies()],
@@ -XXX,XX +XXX,XX @@ libblockdev = static_library('blockdev', blockdev_ss.sources() + genh,
                               build_by_default: false)
  blockdev = declare_dependency(link_whole: [libblockdev],
 -                              dependencies: [block])
 +                              dependencies: [block, event_loop_base])
  qmp_ss = qmp_ss.apply(config_host, strict: false)
  libqmp = static_library('qmp', qmp_ss.sources() + genh,
 diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
 new file mode 100644
 index XXXXXXX..XXXXXXX
 --- /dev/null
-+++ b/docs/security.texi
++++ b/include/sysemu/event-loop-base.h
 @@ -XXX,XX +XXX,XX @@
-+@node Security
++/*
-+@chapter Security
++ * QEMU event-loop backend
-+
++ *
-+@section Overview
++ * Copyright (C) 2022 Red Hat Inc
-+
++ *
-+This chapter explains the security requirements that QEMU is designed to meet
++ * Authors:
-+and principles for securely deploying QEMU.
++ *  Nicolas Saenz Julienne <nsaenzju@redhat.com>
-+
++ *
-+@section Security Requirements
++ * This work is licensed under the terms of the GNU GPL, version 2 or later.
-+
++ * See the COPYING file in the top-level directory.
-+QEMU supports many different use cases, some of which have stricter security
++ */
-+requirements than others.  The community has agreed on the overall security
++#ifndef QEMU_EVENT_LOOP_BASE_H
-+requirements that users may depend on.  These requirements define what is
++#define QEMU_EVENT_LOOP_BASE_H
-+considered supported from a security perspective.
++
-+
++#include "qom/object.h"
-+@subsection Virtualization Use Case
++#include "block/aio.h"
-+
++#include "qemu/typedefs.h"
-+The virtualization use case covers cloud and virtual private server (VPS)
++
-+hosting, as well as traditional data center and desktop virtualization.  These
++#define TYPE_EVENT_LOOP_BASE         "event-loop-base"
-+use cases rely on hardware virtualization extensions to execute guest code
++OBJECT_DECLARE_TYPE(EventLoopBase, EventLoopBaseClass,
-+safely on the physical CPU at close-to-native speed.
++                    EVENT_LOOP_BASE)
 +
-+The following entities are untrusted, meaning that they may be buggy or
++struct EventLoopBaseClass {
-+malicious:
++    ObjectClass parent_class;
 +
-+@itemize
++    void (*init)(EventLoopBase *base, Error **errp);
-+@item Guest
++    void (*update_params)(EventLoopBase *base, Error **errp);
-+@item User-facing interfaces (e.g. VNC, SPICE, WebSocket)
++};
-+@item Network protocols (e.g. NBD, live migration)
++
-+@item User-supplied files (e.g. disk images, kernels, device trees)
++struct EventLoopBase {
-+@item Passthrough devices (e.g. PCI, USB)
++    Object parent;
-+@end itemize
++
-+
++    /* AioContext AIO engine parameters */
-+Bugs affecting these entities are evaluated on whether they can cause damage in
++    int64_t aio_max_batch;
-+real-world use cases and treated as security bugs if this is the case.
++};
-+
++#endif
-+@subsection Non-virtualization Use Case
+diff --git a/include/sysemu/iothread.h b/include/sysemu/iothread.h
 +
 +The non-virtualization use case covers emulation using the Tiny Code Generator
 +(TCG).  In principle the TCG and device emulation code used in conjunction with
 +the non-virtualization use case should meet the same security requirements as
 +the virtualization use case.  However, for historical reasons much of the
 +non-virtualization use case code was not written with these security
 +requirements in mind.
 +
 +Bugs affecting the non-virtualization use case are not considered security
 +bugs at this time.  Users with non-virtualization use cases must not rely on
 +QEMU to provide guest isolation or any security guarantees.
 +
 +@section Architecture
 +
 +This section describes the design principles that ensure the security
 +requirements are met.
 +
 +@subsection Guest Isolation
 +
 +Guest isolation is the confinement of guest code to the virtual machine.  When
 +guest code gains control of execution on the host this is called escaping the
 +virtual machine.  Isolation also includes resource limits such as throttling of
 +CPU, memory, disk, or network.  Guests must be unable to exceed their resource
 +limits.
 +
 +QEMU presents an attack surface to the guest in the form of emulated devices.
 +The guest must not be able to gain control of QEMU.  Bugs in emulated devices
 +could allow malicious guests to gain code execution in QEMU.  At this point the
 +guest has escaped the virtual machine and is able to act in the context of the
 +QEMU process on the host.
 +
 +Guests often interact with other guests and share resources with them.  A
 +malicious guest must not gain control of other guests or access their data.
 +Disk image files and network traffic must be protected from other guests unless
 +explicitly shared between them by the user.
 +
 +@subsection Principle of Least Privilege
 +
 +The principle of least privilege states that each component only has access to
 +the privileges necessary for its function.  In the case of QEMU this means that
 +each process only has access to resources belonging to the guest.
 +
 +The QEMU process should not have access to any resources that are inaccessible
 +to the guest.  This way the guest does not gain anything by escaping into the
 +QEMU process since it already has access to those same resources from within
 +the guest.
 +
 +Following the principle of least privilege immediately fulfills guest isolation
 +requirements.  For example, guest A only has access to its own disk image file
 +@code{a.img} and not guest B's disk image file @code{b.img}.
 +
 +In reality certain resources are inaccessible to the guest but must be
 +available to QEMU to perform its function.  For example, host system calls are
 +necessary for QEMU but are not exposed to guests.  A guest that escapes into
 +the QEMU process can then begin invoking host system calls.
 +
 +New features must be designed to follow the principle of least privilege.
 +Should this not be possible for technical reasons, the security risk must be
 +clearly documented so users are aware of the trade-off of enabling the feature.
 +
 +@subsection Isolation mechanisms
 +
 +Several isolation mechanisms are available to realize this architecture of
 +guest isolation and the principle of least privilege.  With the exception of
 +Linux seccomp, these mechanisms are all deployed by management tools that
 +launch QEMU, such as libvirt.  They are also platform-specific so they are only
 +described briefly for Linux here.
 +
 +The fundamental isolation mechanism is that QEMU processes must run as
 +unprivileged users.  Sometimes it seems more convenient to launch QEMU as
 +root to give it access to host devices (e.g. @code{/dev/net/tun}) but this poses a
 +huge security risk.  File descriptor passing can be used to give an otherwise
 +unprivileged QEMU process access to host devices without running QEMU as root.
 +It is also possible to launch QEMU as a non-root user and configure UNIX groups
 +for access to @code{/dev/kvm}, @code{/dev/net/tun}, and other device nodes.
 +Some Linux distros already ship with UNIX groups for these devices by default.
 +
 +@itemize
 +@item SELinux and AppArmor make it possible to confine processes beyond the
 +traditional UNIX process and file permissions model.  They restrict the QEMU
 +process from accessing processes and files on the host system that are not
 +needed by QEMU.
 +
 +@item Resource limits and cgroup controllers provide throughput and utilization
 +limits on key resources such as CPU time, memory, and I/O bandwidth.
 +
 +@item Linux namespaces can be used to make process, file system, and other system
 +resources unavailable to QEMU.  A namespaced QEMU process is restricted to only
 +those resources that were granted to it.
 +
 +@item Linux seccomp is available via the QEMU @option{--sandbox} option.  It disables
 +system calls that are not needed by QEMU, thereby reducing the host kernel
 +attack surface.
 +@end itemize
 diff --git a/qemu-doc.texi b/qemu-doc.texi
 index XXXXXXX..XXXXXXX 100644
---- a/qemu-doc.texi
+--- a/include/sysemu/iothread.h
-+++ b/qemu-doc.texi
++++ b/include/sysemu/iothread.h
 @@ -XXX,XX +XXX,XX @@
- * QEMU Guest Agent::
+ #include "block/aio.h"
- * QEMU User space emulator::
+ #include "qemu/thread.h"
- * System requirements::
+ #include "qom/object.h"
-+* Security::
++#include "sysemu/event-loop-base.h"
- * Implementation notes::
- * Deprecated features::
+ #define TYPE_IOTHREAD "iothread"
- * Supported build platforms::
-@@ -XXX,XX +XXX,XX @@ added with Linux 4.5 which is supported by the major distros. And even
+ struct IOThread {
- if RHEL7 has kernel 3.10, KVM there has the required functionality there
+-    Object parent_obj;
- to make it close to a 4.5 or newer kernel.
++    EventLoopBase parent_obj;
-+@include docs/security.texi
+     QemuThread thread;
-+
+     AioContext *ctx;
- @include qemu-tech.texi
+@@ -XXX,XX +XXX,XX @@ struct IOThread {
+     int64_t poll_max_ns;
- @include qemu-deprecated.texi
+     int64_t poll_grow;
      int64_t poll_shrink;
 -
 -    /* AioContext AIO engine parameters */
 -    int64_t aio_max_batch;
  };
  typedef struct IOThread IOThread;
 diff --git a/event-loop-base.c b/event-loop-base.c
 new file mode 100644
 index XXXXXXX..XXXXXXX
 --- /dev/null
 +++ b/event-loop-base.c
@@ -XXX,XX +XXX,XX @@
 +/*
 + * QEMU event-loop base
 + *
 + * Copyright (C) 2022 Red Hat Inc
 + *
 + * Authors:
 + *  Stefan Hajnoczi <stefanha@redhat.com>
 + *  Nicolas Saenz Julienne <nsaenzju@redhat.com>
 + *
 + * This work is licensed under the terms of the GNU GPL, version 2 or later.
 + * See the COPYING file in the top-level directory.
 + */
 +
 +#include "qemu/osdep.h"
 +#include "qom/object_interfaces.h"
 +#include "qapi/error.h"
 +#include "sysemu/event-loop-base.h"
 +
 +typedef struct {
 +    const char *name;
 +    ptrdiff_t offset; /* field's byte offset in EventLoopBase struct */
 +} EventLoopBaseParamInfo;
 +
 +static EventLoopBaseParamInfo aio_max_batch_info = {
 +    "aio-max-batch", offsetof(EventLoopBase, aio_max_batch),
 +};
 +
 +static void event_loop_base_get_param(Object *obj, Visitor *v,
 +        const char *name, void *opaque, Error **errp)
 +{
 +    EventLoopBase *event_loop_base = EVENT_LOOP_BASE(obj);
 +    EventLoopBaseParamInfo *info = opaque;
 +    int64_t *field = (void *)event_loop_base + info->offset;
 +
 +    visit_type_int64(v, name, field, errp);
 +}
 +
 +static void event_loop_base_set_param(Object *obj, Visitor *v,
 +        const char *name, void *opaque, Error **errp)
 +{
 +    EventLoopBaseClass *bc = EVENT_LOOP_BASE_GET_CLASS(obj);
 +    EventLoopBase *base = EVENT_LOOP_BASE(obj);
 +    EventLoopBaseParamInfo *info = opaque;
 +    int64_t *field = (void *)base + info->offset;
 +    int64_t value;
 +
 +    if (!visit_type_int64(v, name, &value, errp)) {
 +        return;
 +    }
 +
 +    if (value < 0) {
 +        error_setg(errp, "%s value must be in range [0, %" PRId64 "]",
 +                   info->name, INT64_MAX);
 +        return;
 +    }
 +
 +    *field = value;
 +
 +    if (bc->update_params) {
 +        bc->update_params(base, errp);
 +    }
 +
 +    return;
 +}
 +
 +static void event_loop_base_complete(UserCreatable *uc, Error **errp)
 +{
 +    EventLoopBaseClass *bc = EVENT_LOOP_BASE_GET_CLASS(uc);
 +    EventLoopBase *base = EVENT_LOOP_BASE(uc);
 +
 +    if (bc->init) {
 +        bc->init(base, errp);
 +    }
 +}
 +
 +static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
 +{
 +    UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
 +    ucc->complete = event_loop_base_complete;
 +
 +    object_class_property_add(klass, "aio-max-batch", "int",
 +                              event_loop_base_get_param,
 +                              event_loop_base_set_param,
 +                              NULL, &aio_max_batch_info);
 +}
 +
 +static const TypeInfo event_loop_base_info = {
 +    .name = TYPE_EVENT_LOOP_BASE,
 +    .parent = TYPE_OBJECT,
 +    .instance_size = sizeof(EventLoopBase),
 +    .class_size = sizeof(EventLoopBaseClass),
 +    .class_init = event_loop_base_class_init,
 +    .abstract = true,
 +    .interfaces = (InterfaceInfo[]) {
 +        { TYPE_USER_CREATABLE },
 +        { }
 +    }
 +};
 +
 +static void register_types(void)
 +{
 +    type_register_static(&event_loop_base_info);
 +}
 +type_init(register_types);
 diff --git a/iothread.c b/iothread.c
 index XXXXXXX..XXXXXXX 100644
 --- a/iothread.c
 +++ b/iothread.c
@@ -XXX,XX +XXX,XX @@
  #include "qemu/module.h"
  #include "block/aio.h"
  #include "block/block.h"
 +#include "sysemu/event-loop-base.h"
  #include "sysemu/iothread.h"
  #include "qapi/error.h"
  #include "qapi/qapi-commands-misc.h"
@@ -XXX,XX +XXX,XX @@ static void iothread_init_gcontext(IOThread *iothread)
      iothread->main_loop = g_main_loop_new(iothread->worker_context, TRUE);
  }
 -static void iothread_set_aio_context_params(IOThread *iothread, Error **errp)
 +static void iothread_set_aio_context_params(EventLoopBase *base, Error **errp)
  {
 +    IOThread *iothread = IOTHREAD(base);
      ERRP_GUARD();
 +    if (!iothread->ctx) {
 +        return;
 +    }
 +
      aio_context_set_poll_params(iothread->ctx,
                                  iothread->poll_max_ns,
                                  iothread->poll_grow,
@@ -XXX,XX +XXX,XX @@ static void iothread_set_aio_context_params(IOThread *iothread, Error **errp)
      }
      aio_context_set_aio_params(iothread->ctx,
 -                               iothread->aio_max_batch,
 +                               iothread->parent_obj.aio_max_batch,
                                 errp);
  }
 -static void iothread_complete(UserCreatable *obj, Error **errp)
 +
 +static void iothread_init(EventLoopBase *base, Error **errp)
  {
      Error *local_error = NULL;
 -    IOThread *iothread = IOTHREAD(obj);
 +    IOThread *iothread = IOTHREAD(base);
      char *thread_name;
      iothread->stopping = false;
@@ -XXX,XX +XXX,XX @@ static void iothread_complete(UserCreatable *obj, Error **errp)
       */
      iothread_init_gcontext(iothread);
 -    iothread_set_aio_context_params(iothread, &local_error);
 +    iothread_set_aio_context_params(base, &local_error);
      if (local_error) {
          error_propagate(errp, local_error);
          aio_context_unref(iothread->ctx);
@@ -XXX,XX +XXX,XX @@ static void iothread_complete(UserCreatable *obj, Error **errp)
       * to inherit.
       */
      thread_name = g_strdup_printf("IO %s",
 -                        object_get_canonical_path_component(OBJECT(obj)));
 +                        object_get_canonical_path_component(OBJECT(base)));
      qemu_thread_create(&iothread->thread, thread_name, iothread_run,
                         iothread, QEMU_THREAD_JOINABLE);
      g_free(thread_name);
@@ -XXX,XX +XXX,XX @@ static IOThreadParamInfo poll_grow_info = {
  static IOThreadParamInfo poll_shrink_info = {
      "poll-shrink", offsetof(IOThread, poll_shrink),
  };
 -static IOThreadParamInfo aio_max_batch_info = {
 -    "aio-max-batch", offsetof(IOThread, aio_max_batch),
 -};
  static void iothread_get_param(Object *obj, Visitor *v,
          const char *name, IOThreadParamInfo *info, Error **errp)
@@ -XXX,XX +XXX,XX @@ static void iothread_set_poll_param(Object *obj, Visitor *v,
      }
  }
 -static void iothread_get_aio_param(Object *obj, Visitor *v,
 -        const char *name, void *opaque, Error **errp)
 -{
 -    IOThreadParamInfo *info = opaque;
 -
 -    iothread_get_param(obj, v, name, info, errp);
 -}
 -
 -static void iothread_set_aio_param(Object *obj, Visitor *v,
 -        const char *name, void *opaque, Error **errp)
 -{
 -    IOThread *iothread = IOTHREAD(obj);
 -    IOThreadParamInfo *info = opaque;
 -
 -    if (!iothread_set_param(obj, v, name, info, errp)) {
 -        return;
 -    }
 -
 -    if (iothread->ctx) {
 -        aio_context_set_aio_params(iothread->ctx,
 -                                   iothread->aio_max_batch,
 -                                   errp);
 -    }
 -}
 -
  static void iothread_class_init(ObjectClass *klass, void *class_data)
  {
 -    UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
 -    ucc->complete = iothread_complete;
 +    EventLoopBaseClass *bc = EVENT_LOOP_BASE_CLASS(klass);
 +
 +    bc->init = iothread_init;
 +    bc->update_params = iothread_set_aio_context_params;
      object_class_property_add(klass, "poll-max-ns", "int",
                                iothread_get_poll_param,
@@ -XXX,XX +XXX,XX @@ static void iothread_class_init(ObjectClass *klass, void *class_data)
                                iothread_get_poll_param,
                                iothread_set_poll_param,
                                NULL, &poll_shrink_info);
 -    object_class_property_add(klass, "aio-max-batch", "int",
 -                              iothread_get_aio_param,
 -                              iothread_set_aio_param,
 -                              NULL, &aio_max_batch_info);
  }
  static const TypeInfo iothread_info = {
      .name = TYPE_IOTHREAD,
 -    .parent = TYPE_OBJECT,
 +    .parent = TYPE_EVENT_LOOP_BASE,
      .class_init = iothread_class_init,
      .instance_size = sizeof(IOThread),
      .instance_init = iothread_instance_init,
      .instance_finalize = iothread_instance_finalize,
 -    .interfaces = (InterfaceInfo[]) {
 -        {TYPE_USER_CREATABLE},
 -        {}
 -    },
  };
  static void iothread_register_types(void)
@@ -XXX,XX +XXX,XX @@ static int query_one_iothread(Object *object, void *opaque)
      info->poll_max_ns = iothread->poll_max_ns;
      info->poll_grow = iothread->poll_grow;
      info->poll_shrink = iothread->poll_shrink;
 -    info->aio_max_batch = iothread->aio_max_batch;
 +    info->aio_max_batch = iothread->parent_obj.aio_max_batch;
      QAPI_LIST_APPEND(*tail, info);
      return 0;
 --
-.21.0
+.35.1

-[Qemu-devel] [PULL 2/8] util: readline: replace tab indent by four spaces to fix checkpatch errors
+[PULL 2/3] util/main-loop: Introduce the main loop into QOM
-From: Jules Irenge <jbi.octave@gmail.com>
+From: Nicolas Saenz Julienne <nsaenzju@redhat.com>
-Replace tab indent by four spaces to fix errors issued by checkpatch.pl tool
+'event-loop-base' provides basic property handling for all 'AioContext'
-"ERROR: code indent should never use tabs" within "util/readline.c" file.
+based event loops. So let's define a new 'MainLoopClass' that inherits
+from it. This will permit tweaking the main loop's properties through
-Signed-off-by: Jules Irenge <jbi.octave@gmail.com>
+qapi as well as through the command line using the '-object' keyword[1].
-Reviewed-by: Thomas Huth <thuth@redhat.com>
+Only one instance of 'MainLoopClass' may be created at any time.
-Message-id: 20190401024406.10819-3-jbi.octave@gmail.com
-Message-Id: <20190401024406.10819-3-jbi.octave@gmail.com>
+'EventLoopBaseClass' learns a new callback, 'can_be_deleted()' so as to
 mark 'MainLoop' as non-deletable.
 [1] For example:
       -object main-loop,id=main-loop,aio-max-batch=<value>
 Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
 Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
 Acked-by: Markus Armbruster <armbru@redhat.com>
 Message-id: 20220425075723.20019-3-nsaenzju@redhat.com
 Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
 ---
- util/readline.c | 98 ++++++++++++++++++++++++-------------------------
+ qapi/qom.json                    | 13 ++++++++
-file changed, 49 insertions(+), 49 deletions(-)
+ meson.build                      |  3 +-
+ include/qemu/main-loop.h         | 10 ++++++
-diff --git a/util/readline.c b/util/readline.c
+ include/sysemu/event-loop-base.h |  1 +
-index XXXXXXX..XXXXXXX 100644
+ event-loop-base.c                | 13 ++++++++
---- a/util/readline.c
+ util/main-loop.c                 | 56 ++++++++++++++++++++++++++++++++
-+++ b/util/readline.c
+files changed, 95 insertions(+), 1 deletion(-)
-@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
-     int idx;
+diff --git a/qapi/qom.json b/qapi/qom.json
+index XXXXXXX..XXXXXXX 100644
-     if (rs->hist_entry == 0)
+--- a/qapi/qom.json
--    return;
++++ b/qapi/qom.json
-+        return;
+@@ -XXX,XX +XXX,XX @@
-     if (rs->hist_entry == -1) {
+             '*poll-grow': 'int',
--    /* Find latest entry */
+             '*poll-shrink': 'int' } }
--    for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
--        if (rs->history[idx] == NULL)
++##
--        break;
++# @MainLoopProperties:
--    }
++#
--    rs->hist_entry = idx;
++# Properties for the main-loop object.
-+        /* Find latest entry */
++#
-+        for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
++# Since: 7.1
-+            if (rs->history[idx] == NULL)
++##
-+                break;
++{ 'struct': 'MainLoopProperties',
-+        }
++  'base': 'EventLoopBaseProperties',
-+        rs->hist_entry = idx;
++  'data': {} }
-     }
++
-     rs->hist_entry--;
+ ##
-     if (rs->hist_entry >= 0) {
+ # @MemoryBackendProperties:
--    pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
+ #
-+        pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
+@@ -XXX,XX +XXX,XX @@
-                 rs->history[rs->hist_entry]);
+     { 'name': 'input-linux',
--    rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
+       'if': 'CONFIG_LINUX' },
-+        rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
+     'iothread',
 +    'main-loop',
      { 'name': 'memory-backend-epc',
        'if': 'CONFIG_LINUX' },
      'memory-backend-file',
@@ -XXX,XX +XXX,XX @@
        'input-linux':                { 'type': 'InputLinuxProperties',
                                        'if': 'CONFIG_LINUX' },
        'iothread':                   'IothreadProperties',
 +      'main-loop':                  'MainLoopProperties',
        'memory-backend-epc':         { 'type': 'MemoryBackendEpcProperties',
                                        'if': 'CONFIG_LINUX' },
        'memory-backend-file':        'MemoryBackendFileProperties',
 diff --git a/meson.build b/meson.build
 index XXXXXXX..XXXXXXX 100644
 --- a/meson.build
 +++ b/meson.build
@@ -XXX,XX +XXX,XX @@ libqemuutil = static_library('qemuutil',
                               sources: util_ss.sources() + stub_ss.sources() + genh,
                               dependencies: [util_ss.dependencies(), libm, threads, glib, socket, malloc, pixman])
  qemuutil = declare_dependency(link_with: libqemuutil,
 -                              sources: genh + version_res)
 +                              sources: genh + version_res,
 +                              dependencies: [event_loop_base])
  if have_system or have_user
    decodetree = generator(find_program('scripts/decodetree.py'),
 diff --git a/include/qemu/main-loop.h b/include/qemu/main-loop.h
 index XXXXXXX..XXXXXXX 100644
 --- a/include/qemu/main-loop.h
 +++ b/include/qemu/main-loop.h
@@ -XXX,XX +XXX,XX @@
  #define QEMU_MAIN_LOOP_H
  #include "block/aio.h"
 +#include "qom/object.h"
 +#include "sysemu/event-loop-base.h"
  #define SIG_IPI SIGUSR1
 +#define TYPE_MAIN_LOOP  "main-loop"
 +OBJECT_DECLARE_TYPE(MainLoop, MainLoopClass, MAIN_LOOP)
 +
 +struct MainLoop {
 +    EventLoopBase parent_obj;
 +};
 +typedef struct MainLoop MainLoop;
 +
  /**
   * qemu_init_main_loop: Set up the process so that it can run the main loop.
   *
 diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
 index XXXXXXX..XXXXXXX 100644
 --- a/include/sysemu/event-loop-base.h
 +++ b/include/sysemu/event-loop-base.h
@@ -XXX,XX +XXX,XX @@ struct EventLoopBaseClass {
      void (*init)(EventLoopBase *base, Error **errp);
      void (*update_params)(EventLoopBase *base, Error **errp);
 +    bool (*can_be_deleted)(EventLoopBase *base);
  };
  struct EventLoopBase {
 diff --git a/event-loop-base.c b/event-loop-base.c
 index XXXXXXX..XXXXXXX 100644
 --- a/event-loop-base.c
 +++ b/event-loop-base.c
@@ -XXX,XX +XXX,XX @@ static void event_loop_base_complete(UserCreatable *uc, Error **errp)
      }
  }
-@@ -XXX,XX +XXX,XX @@ static void readline_down_char(ReadLineState *rs)
++static bool event_loop_base_can_be_deleted(UserCreatable *uc)
-         return;
++{
-     if (rs->hist_entry < READLINE_MAX_CMDS - 1 &&
++    EventLoopBaseClass *bc = EVENT_LOOP_BASE_GET_CLASS(uc);
-         rs->history[++rs->hist_entry] != NULL) {
++    EventLoopBase *backend = EVENT_LOOP_BASE(uc);
--    pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
++
-+        pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
++    if (bc->can_be_deleted) {
-                 rs->history[rs->hist_entry]);
++        return bc->can_be_deleted(backend);
-     } else {
++    }
-         rs->cmd_buf[0] = 0;
++
--    rs->hist_entry = -1;
++    return true;
-+        rs->hist_entry = -1;
++}
-     }
++
-     rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
+ static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
  {
      UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
      ucc->complete = event_loop_base_complete;
 +    ucc->can_be_deleted = event_loop_base_can_be_deleted;
      object_class_property_add(klass, "aio-max-batch", "int",
                                event_loop_base_get_param,
 diff --git a/util/main-loop.c b/util/main-loop.c
 index XXXXXXX..XXXXXXX 100644
 --- a/util/main-loop.c
 +++ b/util/main-loop.c
@@ -XXX,XX +XXX,XX @@
  #include "qemu/error-report.h"
  #include "qemu/queue.h"
  #include "qemu/compiler.h"
 +#include "qom/object.h"
  #ifndef _WIN32
  #include <sys/wait.h>
@@ -XXX,XX +XXX,XX @@ int qemu_init_main_loop(Error **errp)
      return 0;
  }
-@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
-     int idx;
++static void main_loop_update_params(EventLoopBase *base, Error **errp)
++{
-     if (cmdline[0] == '\0')
++    if (!qemu_aio_context) {
--    return;
++        error_setg(errp, "qemu aio context not ready");
 +        return;
-     new_entry = NULL;
++    }
-     if (rs->hist_entry != -1) {
++
--    /* We were editing an existing history entry: replace it */
++    aio_context_set_aio_params(qemu_aio_context, base->aio_max_batch, errp);
--    hist_entry = rs->history[rs->hist_entry];
++}
--    idx = rs->hist_entry;
++
--    if (strcmp(hist_entry, cmdline) == 0) {
++MainLoop *mloop;
--        goto same_entry;
++
--    }
++static void main_loop_init(EventLoopBase *base, Error **errp)
-+        /* We were editing an existing history entry: replace it */
++{
-+        hist_entry = rs->history[rs->hist_entry];
++    MainLoop *m = MAIN_LOOP(base);
-+        idx = rs->hist_entry;
++
-+        if (strcmp(hist_entry, cmdline) == 0) {
++    if (mloop) {
-+            goto same_entry;
++        error_setg(errp, "only one main-loop instance allowed");
-+        }
++        return;
-     }
++    }
-     /* Search cmdline in history buffers */
++
-     for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
++    main_loop_update_params(base, errp);
--    hist_entry = rs->history[idx];
++
--    if (hist_entry == NULL)
++    mloop = m;
--        break;
++    return;
--    if (strcmp(hist_entry, cmdline) == 0) {
++}
--    same_entry:
++
--        new_entry = hist_entry;
++static bool main_loop_can_be_deleted(EventLoopBase *base)
--        /* Put this entry at the end of history */
++{
--        memmove(&rs->history[idx], &rs->history[idx + 1],
++    return false;
--            (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
++}
--        rs->history[READLINE_MAX_CMDS - 1] = NULL;
++
--        for (; idx < READLINE_MAX_CMDS; idx++) {
++static void main_loop_class_init(ObjectClass *oc, void *class_data)
--        if (rs->history[idx] == NULL)
++{
--            break;
++    EventLoopBaseClass *bc = EVENT_LOOP_BASE_CLASS(oc);
--        }
++
--        break;
++    bc->init = main_loop_init;
--    }
++    bc->update_params = main_loop_update_params;
-+        hist_entry = rs->history[idx];
++    bc->can_be_deleted = main_loop_can_be_deleted;
-+        if (hist_entry == NULL)
++}
-+            break;
++
-+        if (strcmp(hist_entry, cmdline) == 0) {
++static const TypeInfo main_loop_info = {
-+        same_entry:
++    .name = TYPE_MAIN_LOOP,
-+            new_entry = hist_entry;
++    .parent = TYPE_EVENT_LOOP_BASE,
-+            /* Put this entry at the end of history */
++    .class_init = main_loop_class_init,
-+            memmove(&rs->history[idx], &rs->history[idx + 1],
++    .instance_size = sizeof(MainLoop),
-+                    (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
++};
-+            rs->history[READLINE_MAX_CMDS - 1] = NULL;
++
-+            for (; idx < READLINE_MAX_CMDS; idx++) {
++static void main_loop_register_types(void)
-+                if (rs->history[idx] == NULL)
++{
-+                    break;
++    type_register_static(&main_loop_info);
-+            }
++}
-+            break;
++
-+        }
++type_init(main_loop_register_types)
-     }
++
-     if (idx == READLINE_MAX_CMDS) {
+ static int max_priority;
--    /* Need to get one free slot */
-+        /* Need to get one free slot */
+ #ifndef _WIN32
          g_free(rs->history[0]);
 -    memmove(rs->history, &rs->history[1],
 -            (READLINE_MAX_CMDS - 1) * sizeof(char *));
 -    rs->history[READLINE_MAX_CMDS - 1] = NULL;
 -    idx = READLINE_MAX_CMDS - 1;
 +        memmove(rs->history, &rs->history[1],
 +                (READLINE_MAX_CMDS - 1) * sizeof(char *));
 +        rs->history[READLINE_MAX_CMDS - 1] = NULL;
 +        idx = READLINE_MAX_CMDS - 1;
      }
      if (new_entry == NULL)
          new_entry = g_strdup(cmdline);
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
          case 8:
              readline_backspace(rs);
              break;
 -    case 155:
 +        case 155:
              rs->esc_state = IS_CSI;
 -        break;
 +            break;
          default:
              if (ch >= 32) {
                  readline_insert_char(rs, ch);
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
          break;
      case IS_CSI:
          switch (ch) {
 -    case 'A':
 -    case 'F':
 -        readline_up_char(rs);
 -        break;
 -    case 'B':
 -    case 'E':
 -        readline_down_char(rs);
 -        break;
 +        case 'A':
 +        case 'F':
 +            readline_up_char(rs);
 +            break;
 +        case 'B':
 +        case 'E':
 +            readline_down_char(rs);
 +            break;
          case 'D':
              readline_backward_char(rs);
              break;
 --
-.21.0
+.35.1

-[Qemu-devel] [PULL 3/8] util/readline: Add braces to fix checkpatch errors
+Deleted patch
-From: Jules Irenge <jbi.octave@gmail.com>
-Add braces to fix errors issued by checkpatch.pl tool
-"ERROR: braces {} are necessary for all arms of this statement"
-Within "util/readline.c" file
-Message-Id: <20190330112142.14082-1-jbi.octave@gmail.com>
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
----
- util/readline.c | 50 ++++++++++++++++++++++++++++++++-----------------
-file changed, 33 insertions(+), 17 deletions(-)
-diff --git a/util/readline.c b/util/readline.c
-index XXXXXXX..XXXXXXX 100644
---- a/util/readline.c
-+++ b/util/readline.c
-@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
-         rs->cmd_buf[rs->cmd_buf_size] = '\0';
-         if (rs->read_password) {
-             len = strlen(rs->cmd_buf);
--            for (i = 0; i < len; i++)
-+            for (i = 0; i < len; i++) {
-                 rs->printf_func(rs->opaque, "*");
-+            }
-         } else {
-             rs->printf_func(rs->opaque, "%s", rs->cmd_buf);
-         }
-@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
- {
-     int idx;
--    if (rs->hist_entry == 0)
-+    if (rs->hist_entry == 0) {
-         return;
-+    }
-     if (rs->hist_entry == -1) {
-         /* Find latest entry */
-         for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
--            if (rs->history[idx] == NULL)
-+            if (rs->history[idx] == NULL) {
-                 break;
-+            }
-         }
-         rs->hist_entry = idx;
-     }
-@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
- static void readline_down_char(ReadLineState *rs)
- {
--    if (rs->hist_entry == -1)
-+    if (rs->hist_entry == -1) {
-         return;
-+    }
-     if (rs->hist_entry < READLINE_MAX_CMDS - 1 &&
-         rs->history[++rs->hist_entry] != NULL) {
-         pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
-@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
-     char *hist_entry, *new_entry;
-     int idx;
--    if (cmdline[0] == '\0')
-+    if (cmdline[0] == '\0') {
-         return;
-+    }
-     new_entry = NULL;
-     if (rs->hist_entry != -1) {
-         /* We were editing an existing history entry: replace it */
-@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
-     /* Search cmdline in history buffers */
-     for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
-         hist_entry = rs->history[idx];
--        if (hist_entry == NULL)
-+        if (hist_entry == NULL) {
-             break;
-+        }
-         if (strcmp(hist_entry, cmdline) == 0) {
-         same_entry:
-             new_entry = hist_entry;
-@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
-                     (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
-             rs->history[READLINE_MAX_CMDS - 1] = NULL;
-             for (; idx < READLINE_MAX_CMDS; idx++) {
--                if (rs->history[idx] == NULL)
-+                if (rs->history[idx] == NULL) {
-                     break;
-+                }
-             }
-             break;
-         }
-@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
-         rs->history[READLINE_MAX_CMDS - 1] = NULL;
-         idx = READLINE_MAX_CMDS - 1;
-     }
--    if (new_entry == NULL)
-+    if (new_entry == NULL) {
-         new_entry = g_strdup(cmdline);
-+    }
-     rs->history[idx] = new_entry;
-     rs->hist_entry = -1;
- }
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-     g_free(cmdline);
-     /* no completion found */
--    if (rs->nb_completions <= 0)
-+    if (rs->nb_completions <= 0) {
-         return;
-+    }
-     if (rs->nb_completions == 1) {
-         len = strlen(rs->completions[0]);
-         for (i = rs->completion_index; i < len; i++) {
-             readline_insert_char(rs, rs->completions[0][i]);
-         }
-         /* extra space for next argument. XXX: make it more generic */
--        if (len > 0 && rs->completions[0][len - 1] != '/')
-+        if (len > 0 && rs->completions[0][len - 1] != '/') {
-             readline_insert_char(rs, ' ');
-+        }
-     } else {
-         qsort(rs->completions, rs->nb_completions, sizeof(char *),
-               completion_comp);
-@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
-             if (i == 0) {
-                 max_prefix = len;
-             } else {
--                if (len < max_prefix)
-+                if (len < max_prefix) {
-                     max_prefix = len;
-+                }
-                 for (j = 0; j < max_prefix; j++) {
--                    if (rs->completions[i][j] != rs->completions[0][j])
-+                    if (rs->completions[i][j] != rs->completions[0][j]) {
-                         max_prefix = j;
-+                    }
-                 }
-             }
--            if (len > max_width)
-+            if (len > max_width) {
-                 max_width = len;
-+            }
-         }
-         if (max_prefix > 0)
-             for (i = rs->completion_index; i < max_prefix; i++) {
-                 readline_insert_char(rs, rs->completions[0][i]);
-             }
-         max_width += 2;
--        if (max_width < 10)
-+        if (max_width < 10) {
-             max_width = 10;
--        else if (max_width > 80)
-+        } else if (max_width > 80) {
-             max_width = 80;
-+        }
-         nb_cols = 80 / max_width;
-         j = 0;
-         for (i = 0; i < rs->nb_completions; i++) {
-@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
-         case 10:
-         case 13:
-             rs->cmd_buf[rs->cmd_buf_size] = '\0';
--            if (!rs->read_password)
-+            if (!rs->read_password) {
-                 readline_hist_add(rs, rs->cmd_buf);
-+            }
-             rs->printf_func(rs->opaque, "\n");
-             rs->cmd_buf_index = 0;
-             rs->cmd_buf_size = 0;
-@@ -XXX,XX +XXX,XX @@ void readline_restart(ReadLineState *rs)
- const char *readline_get_history(ReadLineState *rs, unsigned int index)
- {
--    if (index >= READLINE_MAX_CMDS)
-+    if (index >= READLINE_MAX_CMDS) {
-         return NULL;
-+    }
-     return rs->history[index];
- }
---
-.21.0

-[Qemu-devel] [PULL 4/8] block: Add coroutine_fn to bdrv_check_co_entry
+Deleted patch
-From: Nikita Alekseev <n.alekseev2104@gmail.com>
-bdrv_check_co_entry calls bdrv_co_check, which is a coroutine function.
-Thus, it also needs to be marked as a coroutine.
-Signed-off-by: Nikita Alekseev <n.alekseev2104@gmail.com>
-Message-id: 20190401093051.16488-1-n.alekseev2104@gmail.com
-Message-Id: <20190401093051.16488-1-n.alekseev2104@gmail.com>
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
----
- block.c | 2 +-
-file changed, 1 insertion(+), 1 deletion(-)
-diff --git a/block.c b/block.c
-index XXXXXXX..XXXXXXX 100644
---- a/block.c
-+++ b/block.c
-@@ -XXX,XX +XXX,XX @@ typedef struct CheckCo {
-     int ret;
- } CheckCo;
--static void bdrv_check_co_entry(void *opaque)
-+static void coroutine_fn bdrv_check_co_entry(void *opaque)
- {
-     CheckCo *cco = opaque;
-     cco->ret = bdrv_co_check(cco->bs, cco->res, cco->fix);
---
-.21.0

-[Qemu-devel] [PULL 5/8] block/io.c: fix for the allocation failure
+Deleted patch
-From: Andrey Shinkevich <andrey.shinkevich@virtuozzo.com>
-On a file system used by the customer, fallocate() returns an error
-if the block is not properly aligned. So, bdrv_co_pwrite_zeroes()
-fails. We can handle that case the same way as it is done for the
-unsupported cases, namely, call to bdrv_driver_pwritev() that writes
-zeroes to an image for the unaligned chunk of the block.
-Suggested-by: Denis V. Lunev <den@openvz.org>
-Signed-off-by: Andrey Shinkevich <andrey.shinkevich@virtuozzo.com>
-Reviewed-by: John Snow <jsnow@redhat.com>
-Message-id: 1554474244-553661-1-git-send-email-andrey.shinkevich@virtuozzo.com
-Message-Id: <1554474244-553661-1-git-send-email-andrey.shinkevich@virtuozzo.com>
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
----
- block/io.c | 2 +-
-file changed, 1 insertion(+), 1 deletion(-)
-diff --git a/block/io.c b/block/io.c
-index XXXXXXX..XXXXXXX 100644
---- a/block/io.c
-+++ b/block/io.c
-@@ -XXX,XX +XXX,XX @@ static int coroutine_fn bdrv_co_do_pwrite_zeroes(BlockDriverState *bs,
-             assert(!bs->supported_zero_flags);
-         }
--        if (ret == -ENOTSUP && !(flags & BDRV_REQ_NO_FALLBACK)) {
-+        if (ret < 0 && !(flags & BDRV_REQ_NO_FALLBACK)) {
-             /* Fall back to bounce buffer if write zeroes is unsupported */
-             BdrvRequestFlags write_flags = flags & ~BDRV_REQ_ZERO_WRITE;
---
-.21.0

-[Qemu-devel] [PULL 6/8] aio-posix: ensure poll mode is left when aio_notify is called
+[PULL 3/3] util/event-loop-base: Introduce options to set the thread pool size
-From: Paolo Bonzini <pbonzini@redhat.com>
+From: Nicolas Saenz Julienne <nsaenzju@redhat.com>
-With aio=thread, adaptive polling makes latency worse rather than
+The thread pool regulates itself: when idle, it kills threads until
-better, because it delays the execution of the ThreadPool's
+empty, when in demand, it creates new threads until full. This behaviour
-completion bottom half.
+doesn't play well with latency sensitive workloads where the price of
 creating a new thread is too high. For example, when paired with qemu's
 '-mlock', or using safety features like SafeStack, creating a new thread
 has been measured to take multiple milliseconds.
-event_notifier_poll() does run while polling, detecting that
+In order to mitigate this let's introduce a new 'EventLoopBase'
-a bottom half was scheduled by a worker thread, but because
+property to set the thread pool size. The threads will be created during
-ctx->notifier is explicitly ignored in run_poll_handlers_once(),
+the pool's initialization or upon updating the property's value, remain
-scheduling the BH does not count as making progress and
+available during its lifetime regardless of demand, and destroyed upon
-run_poll_handlers() keeps running.  Fix this by recomputing
+freeing it. A properly characterized workload will then be able to
-the deadline after *timeout could have changed.
+configure the pool to avoid any latency spikes.
-With this change, ThreadPool still cannot participate in polling
+Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
-but at least it does not suffer from extra latency.
+Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
+Acked-by: Markus Armbruster <armbru@redhat.com>
-Reported-by: Sergio Lopez <slp@redhat.com>
+Message-id: 20220425075723.20019-4-nsaenzju@redhat.com
 Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
 Message-id: 20190409122823.12416-1-pbonzini@redhat.com
 Cc: Stefan Hajnoczi <stefanha@gmail.com>
 Cc: Kevin Wolf <kwolf@redhat.com>
 Cc: qemu-block@nongnu.org
 Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
 Message-Id: <1553692145-86728-1-git-send-email-pbonzini@redhat.com>
 Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
 Message-Id: <20190409122823.12416-1-pbonzini@redhat.com>
 Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
 ---
- util/aio-posix.c | 12 ++++++++----
+ qapi/qom.json                    | 10 +++++-
-file changed, 8 insertions(+), 4 deletions(-)
+ include/block/aio.h              | 10 ++++++
  include/block/thread-pool.h      |  3 ++
  include/sysemu/event-loop-base.h |  4 +++
  event-loop-base.c                | 23 +++++++++++++
  iothread.c                       |  3 ++
  util/aio-posix.c                 |  1 +
  util/async.c                     | 20 ++++++++++++
  util/main-loop.c                 |  9 ++++++
  util/thread-pool.c               | 55 +++++++++++++++++++++++++++++---
 files changed, 133 insertions(+), 5 deletions(-)
+diff --git a/qapi/qom.json b/qapi/qom.json
+index XXXXXXX..XXXXXXX 100644
+--- a/qapi/qom.json
++++ b/qapi/qom.json
+@@ -XXX,XX +XXX,XX @@
+ #                 0 means that the engine will use its default.
+ #                 (default: 0)
+ #
++# @thread-pool-min: minimum number of threads reserved in the thread pool
++#                   (default: 0)
++#
++# @thread-pool-max: maximum number of threads the thread pool can contain
++#                   (default: 64)
++#
+ # Since: 7.1
+ ##
+ { 'struct': 'EventLoopBaseProperties',
+-  'data': { '*aio-max-batch': 'int' } }
++  'data': { '*aio-max-batch': 'int',
++            '*thread-pool-min': 'int',
++            '*thread-pool-max': 'int' } }
+ ##
+ # @IothreadProperties:
+diff --git a/include/block/aio.h b/include/block/aio.h
+index XXXXXXX..XXXXXXX 100644
+--- a/include/block/aio.h
++++ b/include/block/aio.h
+@@ -XXX,XX +XXX,XX @@ struct AioContext {
+     QSLIST_HEAD(, Coroutine) scheduled_coroutines;
+     QEMUBH *co_schedule_bh;
++    int thread_pool_min;
++    int thread_pool_max;
+     /* Thread pool for performing work and receiving completion callbacks.
+      * Has its own locking.
+      */
+@@ -XXX,XX +XXX,XX @@ void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
+ void aio_context_set_aio_params(AioContext *ctx, int64_t max_batch,
+                                 Error **errp);
++/**
++ * aio_context_set_thread_pool_params:
++ * @ctx: the aio context
++ * @min: min number of threads to have readily available in the thread pool
++ * @max: max number of threads the thread pool can contain
++ */
++void aio_context_set_thread_pool_params(AioContext *ctx, int64_t min,
++                                        int64_t max, Error **errp);
+ #endif
+diff --git a/include/block/thread-pool.h b/include/block/thread-pool.h
+index XXXXXXX..XXXXXXX 100644
+--- a/include/block/thread-pool.h
++++ b/include/block/thread-pool.h
+@@ -XXX,XX +XXX,XX @@
+ #include "block/block.h"
++#define THREAD_POOL_MAX_THREADS_DEFAULT         64
++
+ typedef int ThreadPoolFunc(void *opaque);
+ typedef struct ThreadPool ThreadPool;
+@@ -XXX,XX +XXX,XX @@ BlockAIOCB *thread_pool_submit_aio(ThreadPool *pool,
+ int coroutine_fn thread_pool_submit_co(ThreadPool *pool,
+         ThreadPoolFunc *func, void *arg);
+ void thread_pool_submit(ThreadPool *pool, ThreadPoolFunc *func, void *arg);
++void thread_pool_update_params(ThreadPool *pool, struct AioContext *ctx);
+ #endif
+diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
+index XXXXXXX..XXXXXXX 100644
+--- a/include/sysemu/event-loop-base.h
++++ b/include/sysemu/event-loop-base.h
+@@ -XXX,XX +XXX,XX @@ struct EventLoopBase {
+     /* AioContext AIO engine parameters */
+     int64_t aio_max_batch;
++
++    /* AioContext thread pool parameters */
++    int64_t thread_pool_min;
++    int64_t thread_pool_max;
+ };
+ #endif
+diff --git a/event-loop-base.c b/event-loop-base.c
+index XXXXXXX..XXXXXXX 100644
+--- a/event-loop-base.c
++++ b/event-loop-base.c
+@@ -XXX,XX +XXX,XX @@
+ #include "qemu/osdep.h"
+ #include "qom/object_interfaces.h"
+ #include "qapi/error.h"
++#include "block/thread-pool.h"
+ #include "sysemu/event-loop-base.h"
+ typedef struct {
+@@ -XXX,XX +XXX,XX @@ typedef struct {
+     ptrdiff_t offset; /* field's byte offset in EventLoopBase struct */
+ } EventLoopBaseParamInfo;
++static void event_loop_base_instance_init(Object *obj)
++{
++    EventLoopBase *base = EVENT_LOOP_BASE(obj);
++
++    base->thread_pool_max = THREAD_POOL_MAX_THREADS_DEFAULT;
++}
++
+ static EventLoopBaseParamInfo aio_max_batch_info = {
+     "aio-max-batch", offsetof(EventLoopBase, aio_max_batch),
+ };
++static EventLoopBaseParamInfo thread_pool_min_info = {
++    "thread-pool-min", offsetof(EventLoopBase, thread_pool_min),
++};
++static EventLoopBaseParamInfo thread_pool_max_info = {
++    "thread-pool-max", offsetof(EventLoopBase, thread_pool_max),
++};
+ static void event_loop_base_get_param(Object *obj, Visitor *v,
+         const char *name, void *opaque, Error **errp)
+@@ -XXX,XX +XXX,XX @@ static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
+                               event_loop_base_get_param,
+                               event_loop_base_set_param,
+                               NULL, &aio_max_batch_info);
++    object_class_property_add(klass, "thread-pool-min", "int",
++                              event_loop_base_get_param,
++                              event_loop_base_set_param,
++                              NULL, &thread_pool_min_info);
++    object_class_property_add(klass, "thread-pool-max", "int",
++                              event_loop_base_get_param,
++                              event_loop_base_set_param,
++                              NULL, &thread_pool_max_info);
+ }
+ static const TypeInfo event_loop_base_info = {
+     .name = TYPE_EVENT_LOOP_BASE,
+     .parent = TYPE_OBJECT,
+     .instance_size = sizeof(EventLoopBase),
++    .instance_init = event_loop_base_instance_init,
+     .class_size = sizeof(EventLoopBaseClass),
+     .class_init = event_loop_base_class_init,
+     .abstract = true,
+diff --git a/iothread.c b/iothread.c
+index XXXXXXX..XXXXXXX 100644
+--- a/iothread.c
++++ b/iothread.c
+@@ -XXX,XX +XXX,XX @@ static void iothread_set_aio_context_params(EventLoopBase *base, Error **errp)
+     aio_context_set_aio_params(iothread->ctx,
+                                iothread->parent_obj.aio_max_batch,
+                                errp);
++
++    aio_context_set_thread_pool_params(iothread->ctx, base->thread_pool_min,
++                                       base->thread_pool_max, errp);
+ }
 diff --git a/util/aio-posix.c b/util/aio-posix.c
 index XXXXXXX..XXXXXXX 100644
 --- a/util/aio-posix.c
 +++ b/util/aio-posix.c
-@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers_once(AioContext *ctx, int64_t *timeout)
+@@ -XXX,XX +XXX,XX @@
-         if (!node->deleted && node->io_poll &&
-             aio_node_check(ctx, node->is_external) &&
+ #include "qemu/osdep.h"
-             node->io_poll(node->opaque)) {
+ #include "block/block.h"
-+            /*
++#include "block/thread-pool.h"
-+             * Polling was successful, exit try_poll_mode immediately
+ #include "qemu/main-loop.h"
-+             * to adjust the next polling time.
+ #include "qemu/rcu.h"
-+             */
+ #include "qemu/rcu_queue.h"
-             *timeout = 0;
+diff --git a/util/async.c b/util/async.c
-             if (node->opaque != &ctx->notifier) {
+index XXXXXXX..XXXXXXX 100644
-                 progress = true;
+--- a/util/async.c
-@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers(AioContext *ctx, int64_t max_ns, int64_t *timeout)
++++ b/util/async.c
-     do {
+@@ -XXX,XX +XXX,XX @@ AioContext *aio_context_new(Error **errp)
-         progress = run_poll_handlers_once(ctx, timeout);
-         elapsed_time = qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - start_time;
+     ctx->aio_max_batch = 0;
--    } while (!progress && elapsed_time < max_ns
--             && !atomic_read(&ctx->poll_disable_cnt));
++    ctx->thread_pool_min = 0;
-+        max_ns = qemu_soonest_timeout(*timeout, max_ns);
++    ctx->thread_pool_max = THREAD_POOL_MAX_THREADS_DEFAULT;
-+        assert(!(max_ns && progress));
++
-+    } while (elapsed_time < max_ns && !atomic_read(&ctx->poll_disable_cnt));
+     return ctx;
+ fail:
-     /* If time has passed with no successful polling, adjust *timeout to
+     g_source_destroy(&ctx->source);
-      * keep the same ending time.
+@@ -XXX,XX +XXX,XX @@ void qemu_set_current_aio_context(AioContext *ctx)
-@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers(AioContext *ctx, int64_t max_ns, int64_t *timeout)
+     assert(!get_my_aiocontext());
-  */
+     set_my_aiocontext(ctx);
- static bool try_poll_mode(AioContext *ctx, int64_t *timeout)
+ }
 +
 +void aio_context_set_thread_pool_params(AioContext *ctx, int64_t min,
 +                                        int64_t max, Error **errp)
 +{
 +
 +    if (min > max || !max || min > INT_MAX || max > INT_MAX) {
 +        error_setg(errp, "bad thread-pool-min/thread-pool-max values");
 +        return;
 +    }
 +
 +    ctx->thread_pool_min = min;
 +    ctx->thread_pool_max = max;
 +
 +    if (ctx->thread_pool) {
 +        thread_pool_update_params(ctx->thread_pool, ctx);
 +    }
 +}
 diff --git a/util/main-loop.c b/util/main-loop.c
 index XXXXXXX..XXXXXXX 100644
 --- a/util/main-loop.c
 +++ b/util/main-loop.c
@@ -XXX,XX +XXX,XX @@
  #include "sysemu/replay.h"
  #include "qemu/main-loop.h"
  #include "block/aio.h"
 +#include "block/thread-pool.h"
  #include "qemu/error-report.h"
  #include "qemu/queue.h"
  #include "qemu/compiler.h"
@@ -XXX,XX +XXX,XX @@ int qemu_init_main_loop(Error **errp)
  static void main_loop_update_params(EventLoopBase *base, Error **errp)
  {
--    /* See qemu_soonest_timeout() uint64_t hack */
++    ERRP_GUARD();
--    int64_t max_ns = MIN((uint64_t)*timeout, (uint64_t)ctx->poll_ns);
++
-+    int64_t max_ns = qemu_soonest_timeout(*timeout, ctx->poll_ns);
+     if (!qemu_aio_context) {
+         error_setg(errp, "qemu aio context not ready");
-     if (max_ns && !atomic_read(&ctx->poll_disable_cnt)) {
+         return;
-         poll_set_started(ctx, true);
+     }
      aio_context_set_aio_params(qemu_aio_context, base->aio_max_batch, errp);
 +    if (*errp) {
 +        return;
 +    }
 +
 +    aio_context_set_thread_pool_params(qemu_aio_context, base->thread_pool_min,
 +                                       base->thread_pool_max, errp);
  }
  MainLoop *mloop;
 diff --git a/util/thread-pool.c b/util/thread-pool.c
 index XXXXXXX..XXXXXXX 100644
 --- a/util/thread-pool.c
 +++ b/util/thread-pool.c
@@ -XXX,XX +XXX,XX @@ struct ThreadPool {
      QemuMutex lock;
      QemuCond worker_stopped;
      QemuSemaphore sem;
 -    int max_threads;
      QEMUBH *new_thread_bh;
      /* The following variables are only accessed from one AioContext. */
@@ -XXX,XX +XXX,XX @@ struct ThreadPool {
      int new_threads;     /* backlog of threads we need to create */
      int pending_threads; /* threads created but not running yet */
      bool stopping;
 +    int min_threads;
 +    int max_threads;
  };
 +static inline bool back_to_sleep(ThreadPool *pool, int ret)
 +{
 +    /*
 +     * The semaphore timed out, we should exit the loop except when:
 +     *  - There is work to do, we raced with the signal.
 +     *  - The max threads threshold just changed, we raced with the signal.
 +     *  - The thread pool forces a minimum number of readily available threads.
 +     */
 +    if (ret == -1 && (!QTAILQ_EMPTY(&pool->request_list) ||
 +            pool->cur_threads > pool->max_threads ||
 +            pool->cur_threads <= pool->min_threads)) {
 +            return true;
 +    }
 +
 +    return false;
 +}
 +
  static void *worker_thread(void *opaque)
  {
      ThreadPool *pool = opaque;
@@ -XXX,XX +XXX,XX @@ static void *worker_thread(void *opaque)
              ret = qemu_sem_timedwait(&pool->sem, 10000);
              qemu_mutex_lock(&pool->lock);
              pool->idle_threads--;
 -        } while (ret == -1 && !QTAILQ_EMPTY(&pool->request_list));
 -        if (ret == -1 || pool->stopping) {
 +        } while (back_to_sleep(pool, ret));
 +        if (ret == -1 || pool->stopping ||
 +            pool->cur_threads > pool->max_threads) {
              break;
          }
@@ -XXX,XX +XXX,XX @@ void thread_pool_submit(ThreadPool *pool, ThreadPoolFunc *func, void *arg)
      thread_pool_submit_aio(pool, func, arg, NULL, NULL);
  }
 +void thread_pool_update_params(ThreadPool *pool, AioContext *ctx)
 +{
 +    qemu_mutex_lock(&pool->lock);
 +
 +    pool->min_threads = ctx->thread_pool_min;
 +    pool->max_threads = ctx->thread_pool_max;
 +
 +    /*
 +     * We either have to:
 +     *  - Increase the number of available threads until over the min_threads
 +     *    threshold.
 +     *  - Decrease the number of available threads until under the max_threads
 +     *    threshold.
 +     *  - Do nothing. The current number of threads falls between the min and
 +     *    max thresholds. We'll let the pool manage itself.
 +     */
 +    for (int i = pool->cur_threads; i < pool->min_threads; i++) {
 +        spawn_thread(pool);
 +    }
 +
 +    for (int i = pool->cur_threads; i > pool->max_threads; i--) {
 +        qemu_sem_post(&pool->sem);
 +    }
 +
 +    qemu_mutex_unlock(&pool->lock);
 +}
 +
  static void thread_pool_init_one(ThreadPool *pool, AioContext *ctx)
  {
      if (!ctx) {
@@ -XXX,XX +XXX,XX @@ static void thread_pool_init_one(ThreadPool *pool, AioContext *ctx)
      qemu_mutex_init(&pool->lock);
      qemu_cond_init(&pool->worker_stopped);
      qemu_sem_init(&pool->sem, 0);
 -    pool->max_threads = 64;
      pool->new_thread_bh = aio_bh_new(ctx, spawn_thread_bh_fn, pool);
      QLIST_INIT(&pool->head);
      QTAILQ_INIT(&pool->request_list);
 +
 +    thread_pool_update_params(pool, ctx);
  }
  ThreadPool *thread_pool_new(AioContext *ctx)
 --
-.21.0
+.35.1

-[Qemu-devel] [PULL 7/8] docs: add Secure Coding Practices to developer docs
+Deleted patch
-At KVM Forum 2018 I gave a presentation on security in QEMU:
-https://www.youtube.com/watch?v=YAdRf_hwxU8 (video)
-https://vmsplice.net/~stefan/stefanha-kvm-forum-2018.pdf (slides)
-This patch adds a guide to secure coding practices.  This document
-covers things that developers should know about security in QEMU.  It is
-just a starting point that we can expand on later.  I hope it will be
-useful as a resource for new contributors and will save code reviewers
-from explaining the same concepts many times.
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
-Acked-by: Stefano Garzarella <sgarzare@redhat.com>
-Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
-Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
-Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
-Reviewed-by: Li Qiang <liq3ea@gmail.com>
-Message-id: 20190509121820.16294-2-stefanha@redhat.com
-Message-Id: <20190509121820.16294-2-stefanha@redhat.com>
-Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
----
- docs/devel/index.rst                   |   1 +
- docs/devel/secure-coding-practices.rst | 106 +++++++++++++++++++++++++
-files changed, 107 insertions(+)
- create mode 100644 docs/devel/secure-coding-practices.rst
-diff --git a/docs/devel/index.rst b/docs/devel/index.rst
-index XXXXXXX..XXXXXXX 100644
---- a/docs/devel/index.rst
-+++ b/docs/devel/index.rst
-@@ -XXX,XX +XXX,XX @@ Contents:
-    stable-process
-    testing
-    decodetree
-+   secure-coding-practices
-diff --git a/docs/devel/secure-coding-practices.rst b/docs/devel/secure-coding-practices.rst
-new file mode 100644
-index XXXXXXX..XXXXXXX
---- /dev/null
-+++ b/docs/devel/secure-coding-practices.rst
-@@ -XXX,XX +XXX,XX @@
-+=======================
-+Secure Coding Practices
-+=======================
-+This document covers topics that both developers and security researchers must
-+be aware of so that they can develop safe code and audit existing code
-+properly.
-+
-+Reporting Security Bugs
-+-----------------------
-+For details on how to report security bugs or ask questions about potential
-+security bugs, see the `Security Process wiki page
-+<https://wiki.qemu.org/SecurityProcess>`_.
-+
-+General Secure C Coding Practices
-+---------------------------------
-+Most CVEs (security bugs) reported against QEMU are not specific to
-+virtualization or emulation.  They are simply C programming bugs.  Therefore
-+it's critical to be aware of common classes of security bugs.
-+
-+There is a wide selection of resources available covering secure C coding.  For
-+example, the `CERT C Coding Standard
-+<https://wiki.sei.cmu.edu/confluence/display/c/SEI+CERT+C+Coding+Standard>`_
-+covers the most important classes of security bugs.
-+
-+Instead of describing them in detail here, only the names of the most important
-+classes of security bugs are mentioned:
-+
-+* Buffer overflows
-+* Use-after-free and double-free
-+* Integer overflows
-+* Format string vulnerabilities
-+
-+Some of these classes of bugs can be detected by analyzers.  Static analysis is
-+performed regularly by Coverity and the most obvious of these bugs are even
-+reported by compilers.  Dynamic analysis is possible with valgrind, tsan, and
-+asan.
-+
-+Input Validation
-+----------------
-+Inputs from the guest or external sources (e.g. network, files) cannot be
-+trusted and may be invalid.  Inputs must be checked before using them in a way
-+that could crash the program, expose host memory to the guest, or otherwise be
-+exploitable by an attacker.
-+
-+The most sensitive attack surface is device emulation.  All hardware register
-+accesses and data read from guest memory must be validated.  A typical example
-+is a device that contains multiple units that are selectable by the guest via
-+an index register::
-+
-+  typedef struct {
-+      ProcessingUnit unit[2];
-+      ...
-+  } MyDeviceState;
-+
-+  static void mydev_writel(void *opaque, uint32_t addr, uint32_t val)
-+  {
-+      MyDeviceState *mydev = opaque;
-+      ProcessingUnit *unit;
-+
-+      switch (addr) {
-+      case MYDEV_SELECT_UNIT:
-+          unit = &mydev->unit[val];   <-- this input wasn't validated!
-+          ...
-+      }
-+  }
-+
-+If ``val`` is not in range [0, 1] then an out-of-bounds memory access will take
-+place when ``unit`` is dereferenced.  The code must check that ``val`` is 0 or
-+1 and handle the case where it is invalid.
-+
-+Unexpected Device Accesses
-+--------------------------
-+The guest may access device registers in unusual orders or at unexpected
-+moments.  Device emulation code must not assume that the guest follows the
-+typical "theory of operation" presented in driver writer manuals.  The guest
-+may make nonsense accesses to device registers such as starting operations
-+before the device has been fully initialized.
-+
-+A related issue is that device emulation code must be prepared for unexpected
-+device register accesses while asynchronous operations are in progress.  A
-+well-behaved guest might wait for a completion interrupt before accessing
-+certain device registers.  Device emulation code must handle the case where the
-+guest overwrites registers or submits further requests before an ongoing
-+request completes.  Unexpected accesses must not cause memory corruption or
-+leaks in QEMU.
-+
-+Invalid device register accesses can be reported with
-+``qemu_log_mask(LOG_GUEST_ERROR, ...)``.  The ``-d guest_errors`` command-line
-+option enables these log messages.
-+
-+Live Migration
-+--------------
-+Device state can be saved to disk image files and shared with other users.
-+Live migration code must validate inputs when loading device state so an
-+attacker cannot gain control by crafting invalid device states.  Device state
-+is therefore considered untrusted even though it is typically generated by QEMU
-+itself.
-+
-+Guest Memory Access Races
-+-------------------------
-+Guests with multiple vCPUs may modify guest RAM while device emulation code is
-+running.  Device emulation code must copy in descriptors and other guest RAM
-+structures and only process the local copy.  This prevents
-+time-of-check-to-time-of-use (TOCTOU) race conditions that could cause QEMU to
-+crash when a vCPU thread modifies guest RAM while device emulation is
-+processing it.
---
-.21.0

The following changes since commit 812b835fb4d23dd108b2f9802158472d50b73579:

Merge remote-tracking branch 'remotes/maxreitz/tags/pull-block-2019-05-07' into staging (2019-05-09 16:31:12 +0100)

are available in the Git repository at:

https://github.com/stefanha/qemu.git tags/block-pull-request

for you to fetch changes up to e84125761f78919fe63616d9888ea45e72dc956f:

docs: add Security chapter to the documentation (2019-05-10 10:53:52 +0100)

----------------------------------------------------------------
Pull request

----------------------------------------------------------------

Andrey Shinkevich (1):
  block/io.c: fix for the allocation failure

Jules Irenge (3):
  util/readline: add a space to fix errors by checkpatch tool
  util: readline: replace tab indent by four spaces to fix checkpatch
    errors
  util/readline: Add braces to fix checkpatch errors

Nikita Alekseev (1):
  block: Add coroutine_fn to bdrv_check_co_entry

Paolo Bonzini (1):
  aio-posix: ensure poll mode is left when aio_notify is called

Stefan Hajnoczi (2):
  docs: add Secure Coding Practices to developer docs
  docs: add Security chapter to the documentation

-- 
2.21.0

From: Jules Irenge <jbi.octave@gmail.com>

util/readline: add a space to fix errors reported by checkpatch.pl tool
"ERROR: space required before the open parenthesis"
"ERROR: space required after that ..."
within "util/readline.c" file

Signed-off-by: Jules Irenge <jbi.octave@gmail.com>
Reviewed-by: Thomas Huth <thuth@redhat.com>
Message-id: 20190401024406.10819-2-jbi.octave@gmail.com
Message-Id: <20190401024406.10819-2-jbi.octave@gmail.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 util/readline.c | 34 +++++++++++++++++-----------------
 1 file changed, 17 insertions(+), 17 deletions(-)

diff --git a/util/readline.c b/util/readline.c
index XXXXXXX..XXXXXXX 100644
--- a/util/readline.c
+++ b/util/readline.c
@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
 
     if (rs->cmd_buf_size != rs->last_cmd_buf_size ||
         memcmp(rs->cmd_buf, rs->last_cmd_buf, rs->cmd_buf_size) != 0) {
-        for(i = 0; i < rs->last_cmd_buf_index; i++) {
+        for (i = 0; i < rs->last_cmd_buf_index; i++) {
             rs->printf_func(rs->opaque, "\033[D");
         }
         rs->cmd_buf[rs->cmd_buf_size] = '\0';
         if (rs->read_password) {
             len = strlen(rs->cmd_buf);
-            for(i = 0; i < len; i++)
+            for (i = 0; i < len; i++)
                 rs->printf_func(rs->opaque, "*");
         } else {
             rs->printf_func(rs->opaque, "%s", rs->cmd_buf);
@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
     if (rs->cmd_buf_index != rs->last_cmd_buf_index) {
         delta = rs->cmd_buf_index - rs->last_cmd_buf_index;
         if (delta > 0) {
-            for(i = 0;i < delta; i++) {
+            for (i = 0; i < delta; i++) {
                 rs->printf_func(rs->opaque, "\033[C");
             }
         } else {
             delta = -delta;
-            for(i = 0;i < delta; i++) {
+            for (i = 0; i < delta; i++) {
                 rs->printf_func(rs->opaque, "\033[D");
             }
         }
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
         return;
     if (rs->nb_completions == 1) {
         len = strlen(rs->completions[0]);
-        for(i = rs->completion_index; i < len; i++) {
+        for (i = rs->completion_index; i < len; i++) {
             readline_insert_char(rs, rs->completions[0][i]);
         }
         /* extra space for next argument. XXX: make it more generic */
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
               completion_comp);
         rs->printf_func(rs->opaque, "\n");
         max_width = 0;
-        max_prefix = 0;	
-        for(i = 0; i < rs->nb_completions; i++) {
+        max_prefix = 0;
+        for (i = 0; i < rs->nb_completions; i++) {
             len = strlen(rs->completions[i]);
-            if (i==0) {
+            if (i == 0) {
                 max_prefix = len;
             } else {
                 if (len < max_prefix)
                     max_prefix = len;
-                for(j=0; j<max_prefix; j++) {
+                for (j = 0; j < max_prefix; j++) {
                     if (rs->completions[i][j] != rs->completions[0][j])
                         max_prefix = j;
                 }
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
             if (len > max_width)
                 max_width = len;
         }
-        if (max_prefix > 0) 
-            for(i = rs->completion_index; i < max_prefix; i++) {
+        if (max_prefix > 0)
+            for (i = rs->completion_index; i < max_prefix; i++) {
                 readline_insert_char(rs, rs->completions[0][i]);
             }
         max_width += 2;
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
             max_width = 80;
         nb_cols = 80 / max_width;
         j = 0;
-        for(i = 0; i < rs->nb_completions; i++) {
+        for (i = 0; i < rs->nb_completions; i++) {
             rs->printf_func(rs->opaque, "%-*s", max_width, rs->completions[i]);
             if (++j == nb_cols || i == (rs->nb_completions - 1)) {
                 rs->printf_func(rs->opaque, "\n");
@@ -XXX,XX +XXX,XX @@ static void readline_clear_screen(ReadLineState *rs)
 /* return true if command handled */
 void readline_handle_byte(ReadLineState *rs, int ch)
 {
-    switch(rs->esc_state) {
+    switch (rs->esc_state) {
     case IS_NORM:
-        switch(ch) {
+        switch (ch) {
         case 1:
             readline_bol(rs);
             break;
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
         }
         break;
     case IS_CSI:
-        switch(ch) {
+        switch (ch) {
 	case 'A':
 	case 'F':
 	    readline_up_char(rs);
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
             rs->esc_param = rs->esc_param * 10 + (ch - '0');
             goto the_end;
         case '~':
-            switch(rs->esc_param) {
+            switch (rs->esc_param) {
             case 1:
                 readline_bol(rs);
                 break;
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
     the_end:
         break;
     case IS_SS3:
-        switch(ch) {
+        switch (ch) {
         case 'F':
             readline_eol(rs);
             break;
-- 
2.21.0

From: Jules Irenge <jbi.octave@gmail.com>

Replace tab indent by four spaces to fix errors issued by checkpatch.pl tool
"ERROR: code indent should never use tabs" within "util/readline.c" file.

Signed-off-by: Jules Irenge <jbi.octave@gmail.com>
Reviewed-by: Thomas Huth <thuth@redhat.com>
Message-id: 20190401024406.10819-3-jbi.octave@gmail.com
Message-Id: <20190401024406.10819-3-jbi.octave@gmail.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 util/readline.c | 98 ++++++++++++++++++++++++-------------------------
 1 file changed, 49 insertions(+), 49 deletions(-)

diff --git a/util/readline.c b/util/readline.c
index XXXXXXX..XXXXXXX 100644
--- a/util/readline.c
+++ b/util/readline.c
@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
     int idx;
 
     if (rs->hist_entry == 0)
-	return;
+        return;
     if (rs->hist_entry == -1) {
-	/* Find latest entry */
-	for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
-	    if (rs->history[idx] == NULL)
-		break;
-	}
-	rs->hist_entry = idx;
+        /* Find latest entry */
+        for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
+            if (rs->history[idx] == NULL)
+                break;
+        }
+        rs->hist_entry = idx;
     }
     rs->hist_entry--;
     if (rs->hist_entry >= 0) {
-	pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
+        pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
                 rs->history[rs->hist_entry]);
-	rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
+        rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
     }
 }
 
@@ -XXX,XX +XXX,XX @@ static void readline_down_char(ReadLineState *rs)
         return;
     if (rs->hist_entry < READLINE_MAX_CMDS - 1 &&
         rs->history[++rs->hist_entry] != NULL) {
-	pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
+        pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
                 rs->history[rs->hist_entry]);
     } else {
         rs->cmd_buf[0] = 0;
-	rs->hist_entry = -1;
+        rs->hist_entry = -1;
     }
     rs->cmd_buf_index = rs->cmd_buf_size = strlen(rs->cmd_buf);
 }
@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
     int idx;
 
     if (cmdline[0] == '\0')
-	return;
+        return;
     new_entry = NULL;
     if (rs->hist_entry != -1) {
-	/* We were editing an existing history entry: replace it */
-	hist_entry = rs->history[rs->hist_entry];
-	idx = rs->hist_entry;
-	if (strcmp(hist_entry, cmdline) == 0) {
-	    goto same_entry;
-	}
+        /* We were editing an existing history entry: replace it */
+        hist_entry = rs->history[rs->hist_entry];
+        idx = rs->hist_entry;
+        if (strcmp(hist_entry, cmdline) == 0) {
+            goto same_entry;
+        }
     }
     /* Search cmdline in history buffers */
     for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
-	hist_entry = rs->history[idx];
-	if (hist_entry == NULL)
-	    break;
-	if (strcmp(hist_entry, cmdline) == 0) {
-	same_entry:
-	    new_entry = hist_entry;
-	    /* Put this entry at the end of history */
-	    memmove(&rs->history[idx], &rs->history[idx + 1],
-		    (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
-	    rs->history[READLINE_MAX_CMDS - 1] = NULL;
-	    for (; idx < READLINE_MAX_CMDS; idx++) {
-		if (rs->history[idx] == NULL)
-		    break;
-	    }
-	    break;
-	}
+        hist_entry = rs->history[idx];
+        if (hist_entry == NULL)
+            break;
+        if (strcmp(hist_entry, cmdline) == 0) {
+        same_entry:
+            new_entry = hist_entry;
+            /* Put this entry at the end of history */
+            memmove(&rs->history[idx], &rs->history[idx + 1],
+                    (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
+            rs->history[READLINE_MAX_CMDS - 1] = NULL;
+            for (; idx < READLINE_MAX_CMDS; idx++) {
+                if (rs->history[idx] == NULL)
+                    break;
+            }
+            break;
+        }
     }
     if (idx == READLINE_MAX_CMDS) {
-	/* Need to get one free slot */
+        /* Need to get one free slot */
         g_free(rs->history[0]);
-	memmove(rs->history, &rs->history[1],
-	        (READLINE_MAX_CMDS - 1) * sizeof(char *));
-	rs->history[READLINE_MAX_CMDS - 1] = NULL;
-	idx = READLINE_MAX_CMDS - 1;
+        memmove(rs->history, &rs->history[1],
+                (READLINE_MAX_CMDS - 1) * sizeof(char *));
+        rs->history[READLINE_MAX_CMDS - 1] = NULL;
+        idx = READLINE_MAX_CMDS - 1;
     }
     if (new_entry == NULL)
         new_entry = g_strdup(cmdline);
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
         case 8:
             readline_backspace(rs);
             break;
-	case 155:
+        case 155:
             rs->esc_state = IS_CSI;
-	    break;
+            break;
         default:
             if (ch >= 32) {
                 readline_insert_char(rs, ch);
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
         break;
     case IS_CSI:
         switch (ch) {
-	case 'A':
-	case 'F':
-	    readline_up_char(rs);
-	    break;
-	case 'B':
-	case 'E':
-	    readline_down_char(rs);
-	    break;
+        case 'A':
+        case 'F':
+            readline_up_char(rs);
+            break;
+        case 'B':
+        case 'E':
+            readline_down_char(rs);
+            break;
         case 'D':
             readline_backward_char(rs);
             break;
-- 
2.21.0

From: Jules Irenge <jbi.octave@gmail.com>

Add braces to fix errors issued by checkpatch.pl tool
"ERROR: braces {} are necessary for all arms of this statement"
Within "util/readline.c" file
Message-Id: <20190330112142.14082-1-jbi.octave@gmail.com>

Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 util/readline.c | 50 ++++++++++++++++++++++++++++++++-----------------
 1 file changed, 33 insertions(+), 17 deletions(-)

diff --git a/util/readline.c b/util/readline.c
index XXXXXXX..XXXXXXX 100644
--- a/util/readline.c
+++ b/util/readline.c
@@ -XXX,XX +XXX,XX @@ static void readline_update(ReadLineState *rs)
         rs->cmd_buf[rs->cmd_buf_size] = '\0';
         if (rs->read_password) {
             len = strlen(rs->cmd_buf);
-            for (i = 0; i < len; i++)
+            for (i = 0; i < len; i++) {
                 rs->printf_func(rs->opaque, "*");
+            }
         } else {
             rs->printf_func(rs->opaque, "%s", rs->cmd_buf);
         }
@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
 {
     int idx;
 
-    if (rs->hist_entry == 0)
+    if (rs->hist_entry == 0) {
         return;
+    }
     if (rs->hist_entry == -1) {
         /* Find latest entry */
         for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
-            if (rs->history[idx] == NULL)
+            if (rs->history[idx] == NULL) {
                 break;
+            }
         }
         rs->hist_entry = idx;
     }
@@ -XXX,XX +XXX,XX @@ static void readline_up_char(ReadLineState *rs)
 
 static void readline_down_char(ReadLineState *rs)
 {
-    if (rs->hist_entry == -1)
+    if (rs->hist_entry == -1) {
         return;
+    }
     if (rs->hist_entry < READLINE_MAX_CMDS - 1 &&
         rs->history[++rs->hist_entry] != NULL) {
         pstrcpy(rs->cmd_buf, sizeof(rs->cmd_buf),
@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
     char *hist_entry, *new_entry;
     int idx;
 
-    if (cmdline[0] == '\0')
+    if (cmdline[0] == '\0') {
         return;
+    }
     new_entry = NULL;
     if (rs->hist_entry != -1) {
         /* We were editing an existing history entry: replace it */
@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
     /* Search cmdline in history buffers */
     for (idx = 0; idx < READLINE_MAX_CMDS; idx++) {
         hist_entry = rs->history[idx];
-        if (hist_entry == NULL)
+        if (hist_entry == NULL) {
             break;
+        }
         if (strcmp(hist_entry, cmdline) == 0) {
         same_entry:
             new_entry = hist_entry;
@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
                     (READLINE_MAX_CMDS - (idx + 1)) * sizeof(char *));
             rs->history[READLINE_MAX_CMDS - 1] = NULL;
             for (; idx < READLINE_MAX_CMDS; idx++) {
-                if (rs->history[idx] == NULL)
+                if (rs->history[idx] == NULL) {
                     break;
+                }
             }
             break;
         }
@@ -XXX,XX +XXX,XX @@ static void readline_hist_add(ReadLineState *rs, const char *cmdline)
         rs->history[READLINE_MAX_CMDS - 1] = NULL;
         idx = READLINE_MAX_CMDS - 1;
     }
-    if (new_entry == NULL)
+    if (new_entry == NULL) {
         new_entry = g_strdup(cmdline);
+    }
     rs->history[idx] = new_entry;
     rs->hist_entry = -1;
 }
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
     g_free(cmdline);
 
     /* no completion found */
-    if (rs->nb_completions <= 0)
+    if (rs->nb_completions <= 0) {
         return;
+    }
     if (rs->nb_completions == 1) {
         len = strlen(rs->completions[0]);
         for (i = rs->completion_index; i < len; i++) {
             readline_insert_char(rs, rs->completions[0][i]);
         }
         /* extra space for next argument. XXX: make it more generic */
-        if (len > 0 && rs->completions[0][len - 1] != '/')
+        if (len > 0 && rs->completions[0][len - 1] != '/') {
             readline_insert_char(rs, ' ');
+        }
     } else {
         qsort(rs->completions, rs->nb_completions, sizeof(char *),
               completion_comp);
@@ -XXX,XX +XXX,XX @@ static void readline_completion(ReadLineState *rs)
             if (i == 0) {
                 max_prefix = len;
             } else {
-                if (len < max_prefix)
+                if (len < max_prefix) {
                     max_prefix = len;
+                }
                 for (j = 0; j < max_prefix; j++) {
-                    if (rs->completions[i][j] != rs->completions[0][j])
+                    if (rs->completions[i][j] != rs->completions[0][j]) {
                         max_prefix = j;
+                    }
                 }
             }
-            if (len > max_width)
+            if (len > max_width) {
                 max_width = len;
+            }
         }
         if (max_prefix > 0)
             for (i = rs->completion_index; i < max_prefix; i++) {
                 readline_insert_char(rs, rs->completions[0][i]);
             }
         max_width += 2;
-        if (max_width < 10)
+        if (max_width < 10) {
             max_width = 10;
-        else if (max_width > 80)
+        } else if (max_width > 80) {
             max_width = 80;
+        }
         nb_cols = 80 / max_width;
         j = 0;
         for (i = 0; i < rs->nb_completions; i++) {
@@ -XXX,XX +XXX,XX @@ void readline_handle_byte(ReadLineState *rs, int ch)
         case 10:
         case 13:
             rs->cmd_buf[rs->cmd_buf_size] = '\0';
-            if (!rs->read_password)
+            if (!rs->read_password) {
                 readline_hist_add(rs, rs->cmd_buf);
+            }
             rs->printf_func(rs->opaque, "\n");
             rs->cmd_buf_index = 0;
             rs->cmd_buf_size = 0;
@@ -XXX,XX +XXX,XX @@ void readline_restart(ReadLineState *rs)
 
 const char *readline_get_history(ReadLineState *rs, unsigned int index)
 {
-    if (index >= READLINE_MAX_CMDS)
+    if (index >= READLINE_MAX_CMDS) {
         return NULL;
+    }
     return rs->history[index];
 }
 
-- 
2.21.0

From: Andrey Shinkevich <andrey.shinkevich@virtuozzo.com>

On a file system used by the customer, fallocate() returns an error
if the block is not properly aligned. So, bdrv_co_pwrite_zeroes()
fails. We can handle that case the same way as it is done for the
unsupported cases, namely, call to bdrv_driver_pwritev() that writes
zeroes to an image for the unaligned chunk of the block.

Suggested-by: Denis V. Lunev <den@openvz.org>
Signed-off-by: Andrey Shinkevich <andrey.shinkevich@virtuozzo.com>
Reviewed-by: John Snow <jsnow@redhat.com>
Message-id: 1554474244-553661-1-git-send-email-andrey.shinkevich@virtuozzo.com
Message-Id: <1554474244-553661-1-git-send-email-andrey.shinkevich@virtuozzo.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 block/io.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/block/io.c b/block/io.c
index XXXXXXX..XXXXXXX 100644
--- a/block/io.c
+++ b/block/io.c
@@ -XXX,XX +XXX,XX @@ static int coroutine_fn bdrv_co_do_pwrite_zeroes(BlockDriverState *bs,
             assert(!bs->supported_zero_flags);
         }
 
-        if (ret == -ENOTSUP && !(flags & BDRV_REQ_NO_FALLBACK)) {
+        if (ret < 0 && !(flags & BDRV_REQ_NO_FALLBACK)) {
             /* Fall back to bounce buffer if write zeroes is unsupported */
             BdrvRequestFlags write_flags = flags & ~BDRV_REQ_ZERO_WRITE;
 
-- 
2.21.0

From: Paolo Bonzini <pbonzini@redhat.com>

With aio=thread, adaptive polling makes latency worse rather than
better, because it delays the execution of the ThreadPool's
completion bottom half.

event_notifier_poll() does run while polling, detecting that
a bottom half was scheduled by a worker thread, but because
ctx->notifier is explicitly ignored in run_poll_handlers_once(),
scheduling the BH does not count as making progress and
run_poll_handlers() keeps running.  Fix this by recomputing
the deadline after *timeout could have changed.

With this change, ThreadPool still cannot participate in polling
but at least it does not suffer from extra latency.

Reported-by: Sergio Lopez <slp@redhat.com>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
Message-id: 20190409122823.12416-1-pbonzini@redhat.com
Cc: Stefan Hajnoczi <stefanha@gmail.com>
Cc: Kevin Wolf <kwolf@redhat.com>
Cc: qemu-block@nongnu.org
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
Message-Id: <1553692145-86728-1-git-send-email-pbonzini@redhat.com>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
Message-Id: <20190409122823.12416-1-pbonzini@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 util/aio-posix.c | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/util/aio-posix.c b/util/aio-posix.c
index XXXXXXX..XXXXXXX 100644
--- a/util/aio-posix.c
+++ b/util/aio-posix.c
@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers_once(AioContext *ctx, int64_t *timeout)
         if (!node->deleted && node->io_poll &&
             aio_node_check(ctx, node->is_external) &&
             node->io_poll(node->opaque)) {
+            /*
+             * Polling was successful, exit try_poll_mode immediately
+             * to adjust the next polling time.
+             */
             *timeout = 0;
             if (node->opaque != &ctx->notifier) {
                 progress = true;
@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers(AioContext *ctx, int64_t max_ns, int64_t *timeout)
     do {
         progress = run_poll_handlers_once(ctx, timeout);
         elapsed_time = qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - start_time;
-    } while (!progress && elapsed_time < max_ns
-             && !atomic_read(&ctx->poll_disable_cnt));
+        max_ns = qemu_soonest_timeout(*timeout, max_ns);
+        assert(!(max_ns && progress));
+    } while (elapsed_time < max_ns && !atomic_read(&ctx->poll_disable_cnt));
 
     /* If time has passed with no successful polling, adjust *timeout to
      * keep the same ending time.
@@ -XXX,XX +XXX,XX @@ static bool run_poll_handlers(AioContext *ctx, int64_t max_ns, int64_t *timeout)
  */
 static bool try_poll_mode(AioContext *ctx, int64_t *timeout)
 {
-    /* See qemu_soonest_timeout() uint64_t hack */
-    int64_t max_ns = MIN((uint64_t)*timeout, (uint64_t)ctx->poll_ns);
+    int64_t max_ns = qemu_soonest_timeout(*timeout, ctx->poll_ns);
 
     if (max_ns && !atomic_read(&ctx->poll_disable_cnt)) {
         poll_set_started(ctx, true);
-- 
2.21.0

At KVM Forum 2018 I gave a presentation on security in QEMU:
https://www.youtube.com/watch?v=YAdRf_hwxU8 (video)
https://vmsplice.net/~stefan/stefanha-kvm-forum-2018.pdf (slides)

This patch adds a guide to secure coding practices.  This document
covers things that developers should know about security in QEMU.  It is
just a starting point that we can expand on later.  I hope it will be
useful as a resource for new contributors and will save code reviewers
from explaining the same concepts many times.

Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Acked-by: Stefano Garzarella <sgarzare@redhat.com>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Li Qiang <liq3ea@gmail.com>
Message-id: 20190509121820.16294-2-stefanha@redhat.com
Message-Id: <20190509121820.16294-2-stefanha@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 docs/devel/index.rst                   |   1 +
 docs/devel/secure-coding-practices.rst | 106 +++++++++++++++++++++++++
 2 files changed, 107 insertions(+)
 create mode 100644 docs/devel/secure-coding-practices.rst

diff --git a/docs/devel/index.rst b/docs/devel/index.rst
index XXXXXXX..XXXXXXX 100644
--- a/docs/devel/index.rst
+++ b/docs/devel/index.rst
@@ -XXX,XX +XXX,XX @@ Contents:
    stable-process
    testing
    decodetree
+   secure-coding-practices
diff --git a/docs/devel/secure-coding-practices.rst b/docs/devel/secure-coding-practices.rst
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/docs/devel/secure-coding-practices.rst
@@ -XXX,XX +XXX,XX @@
+=======================
+Secure Coding Practices
+=======================
+This document covers topics that both developers and security researchers must
+be aware of so that they can develop safe code and audit existing code
+properly.
+
+Reporting Security Bugs
+-----------------------
+For details on how to report security bugs or ask questions about potential
+security bugs, see the `Security Process wiki page
+<https://wiki.qemu.org/SecurityProcess>`_.
+
+General Secure C Coding Practices
+---------------------------------
+Most CVEs (security bugs) reported against QEMU are not specific to
+virtualization or emulation.  They are simply C programming bugs.  Therefore
+it's critical to be aware of common classes of security bugs.
+
+There is a wide selection of resources available covering secure C coding.  For
+example, the `CERT C Coding Standard
+<https://wiki.sei.cmu.edu/confluence/display/c/SEI+CERT+C+Coding+Standard>`_
+covers the most important classes of security bugs.
+
+Instead of describing them in detail here, only the names of the most important
+classes of security bugs are mentioned:
+
+* Buffer overflows
+* Use-after-free and double-free
+* Integer overflows
+* Format string vulnerabilities
+
+Some of these classes of bugs can be detected by analyzers.  Static analysis is
+performed regularly by Coverity and the most obvious of these bugs are even
+reported by compilers.  Dynamic analysis is possible with valgrind, tsan, and
+asan.
+
+Input Validation
+----------------
+Inputs from the guest or external sources (e.g. network, files) cannot be
+trusted and may be invalid.  Inputs must be checked before using them in a way
+that could crash the program, expose host memory to the guest, or otherwise be
+exploitable by an attacker.
+
+The most sensitive attack surface is device emulation.  All hardware register
+accesses and data read from guest memory must be validated.  A typical example
+is a device that contains multiple units that are selectable by the guest via
+an index register::
+
+  typedef struct {
+      ProcessingUnit unit[2];
+      ...
+  } MyDeviceState;
+
+  static void mydev_writel(void *opaque, uint32_t addr, uint32_t val)
+  {
+      MyDeviceState *mydev = opaque;
+      ProcessingUnit *unit;
+
+      switch (addr) {
+      case MYDEV_SELECT_UNIT:
+          unit = &mydev->unit[val];   <-- this input wasn't validated!
+          ...
+      }
+  }
+
+If ``val`` is not in range [0, 1] then an out-of-bounds memory access will take
+place when ``unit`` is dereferenced.  The code must check that ``val`` is 0 or
+1 and handle the case where it is invalid.
+
+Unexpected Device Accesses
+--------------------------
+The guest may access device registers in unusual orders or at unexpected
+moments.  Device emulation code must not assume that the guest follows the
+typical "theory of operation" presented in driver writer manuals.  The guest
+may make nonsense accesses to device registers such as starting operations
+before the device has been fully initialized.
+
+A related issue is that device emulation code must be prepared for unexpected
+device register accesses while asynchronous operations are in progress.  A
+well-behaved guest might wait for a completion interrupt before accessing
+certain device registers.  Device emulation code must handle the case where the
+guest overwrites registers or submits further requests before an ongoing
+request completes.  Unexpected accesses must not cause memory corruption or
+leaks in QEMU.
+
+Invalid device register accesses can be reported with
+``qemu_log_mask(LOG_GUEST_ERROR, ...)``.  The ``-d guest_errors`` command-line
+option enables these log messages.
+
+Live Migration
+--------------
+Device state can be saved to disk image files and shared with other users.
+Live migration code must validate inputs when loading device state so an
+attacker cannot gain control by crafting invalid device states.  Device state
+is therefore considered untrusted even though it is typically generated by QEMU
+itself.
+
+Guest Memory Access Races
+-------------------------
+Guests with multiple vCPUs may modify guest RAM while device emulation code is
+running.  Device emulation code must copy in descriptors and other guest RAM
+structures and only process the local copy.  This prevents
+time-of-check-to-time-of-use (TOCTOU) race conditions that could cause QEMU to
+crash when a vCPU thread modifies guest RAM while device emulation is
+processing it.
-- 
2.21.0

This new chapter in the QEMU documentation covers the security
requirements that QEMU is designed to meet and principles for securely
deploying QEMU.

It is just a starting point that can be extended in the future with more
information.

Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Acked-by: Stefano Garzarella <sgarzare@redhat.com>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Li Qiang <liq3ea@gmail.com>
Message-id: 20190509121820.16294-3-stefanha@redhat.com
Message-Id: <20190509121820.16294-3-stefanha@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 Makefile           |   2 +-
 docs/security.texi | 131 +++++++++++++++++++++++++++++++++++++++++++++
 qemu-doc.texi      |   3 ++
 3 files changed, 135 insertions(+), 1 deletion(-)
 create mode 100644 docs/security.texi

diff --git a/Makefile b/Makefile
index XXXXXXX..XXXXXXX 100644
--- a/Makefile
+++ b/Makefile
@@ -XXX,XX +XXX,XX @@ qemu-doc.html qemu-doc.info qemu-doc.pdf qemu-doc.txt: \
 	qemu-img.texi qemu-nbd.texi qemu-options.texi qemu-option-trace.texi \
 	qemu-deprecated.texi qemu-monitor.texi qemu-img-cmds.texi qemu-ga.texi \
 	qemu-monitor-info.texi docs/qemu-block-drivers.texi \
-	docs/qemu-cpu-models.texi
+	docs/qemu-cpu-models.texi docs/security.texi
 
 docs/interop/qemu-ga-ref.dvi docs/interop/qemu-ga-ref.html \
     docs/interop/qemu-ga-ref.info docs/interop/qemu-ga-ref.pdf \
diff --git a/docs/security.texi b/docs/security.texi
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/docs/security.texi
@@ -XXX,XX +XXX,XX @@
+@node Security
+@chapter Security
+
+@section Overview
+
+This chapter explains the security requirements that QEMU is designed to meet
+and principles for securely deploying QEMU.
+
+@section Security Requirements
+
+QEMU supports many different use cases, some of which have stricter security
+requirements than others.  The community has agreed on the overall security
+requirements that users may depend on.  These requirements define what is
+considered supported from a security perspective.
+
+@subsection Virtualization Use Case
+
+The virtualization use case covers cloud and virtual private server (VPS)
+hosting, as well as traditional data center and desktop virtualization.  These
+use cases rely on hardware virtualization extensions to execute guest code
+safely on the physical CPU at close-to-native speed.
+
+The following entities are untrusted, meaning that they may be buggy or
+malicious:
+
+@itemize
+@item Guest
+@item User-facing interfaces (e.g. VNC, SPICE, WebSocket)
+@item Network protocols (e.g. NBD, live migration)
+@item User-supplied files (e.g. disk images, kernels, device trees)
+@item Passthrough devices (e.g. PCI, USB)
+@end itemize
+
+Bugs affecting these entities are evaluated on whether they can cause damage in
+real-world use cases and treated as security bugs if this is the case.
+
+@subsection Non-virtualization Use Case
+
+The non-virtualization use case covers emulation using the Tiny Code Generator
+(TCG).  In principle the TCG and device emulation code used in conjunction with
+the non-virtualization use case should meet the same security requirements as
+the virtualization use case.  However, for historical reasons much of the
+non-virtualization use case code was not written with these security
+requirements in mind.
+
+Bugs affecting the non-virtualization use case are not considered security
+bugs at this time.  Users with non-virtualization use cases must not rely on
+QEMU to provide guest isolation or any security guarantees.
+
+@section Architecture
+
+This section describes the design principles that ensure the security
+requirements are met.
+
+@subsection Guest Isolation
+
+Guest isolation is the confinement of guest code to the virtual machine.  When
+guest code gains control of execution on the host this is called escaping the
+virtual machine.  Isolation also includes resource limits such as throttling of
+CPU, memory, disk, or network.  Guests must be unable to exceed their resource
+limits.
+
+QEMU presents an attack surface to the guest in the form of emulated devices.
+The guest must not be able to gain control of QEMU.  Bugs in emulated devices
+could allow malicious guests to gain code execution in QEMU.  At this point the
+guest has escaped the virtual machine and is able to act in the context of the
+QEMU process on the host.
+
+Guests often interact with other guests and share resources with them.  A
+malicious guest must not gain control of other guests or access their data.
+Disk image files and network traffic must be protected from other guests unless
+explicitly shared between them by the user.
+
+@subsection Principle of Least Privilege
+
+The principle of least privilege states that each component only has access to
+the privileges necessary for its function.  In the case of QEMU this means that
+each process only has access to resources belonging to the guest.
+
+The QEMU process should not have access to any resources that are inaccessible
+to the guest.  This way the guest does not gain anything by escaping into the
+QEMU process since it already has access to those same resources from within
+the guest.
+
+Following the principle of least privilege immediately fulfills guest isolation
+requirements.  For example, guest A only has access to its own disk image file
+@code{a.img} and not guest B's disk image file @code{b.img}.
+
+In reality certain resources are inaccessible to the guest but must be
+available to QEMU to perform its function.  For example, host system calls are
+necessary for QEMU but are not exposed to guests.  A guest that escapes into
+the QEMU process can then begin invoking host system calls.
+
+New features must be designed to follow the principle of least privilege.
+Should this not be possible for technical reasons, the security risk must be
+clearly documented so users are aware of the trade-off of enabling the feature.
+
+@subsection Isolation mechanisms
+
+Several isolation mechanisms are available to realize this architecture of
+guest isolation and the principle of least privilege.  With the exception of
+Linux seccomp, these mechanisms are all deployed by management tools that
+launch QEMU, such as libvirt.  They are also platform-specific so they are only
+described briefly for Linux here.
+
+The fundamental isolation mechanism is that QEMU processes must run as
+unprivileged users.  Sometimes it seems more convenient to launch QEMU as
+root to give it access to host devices (e.g. @code{/dev/net/tun}) but this poses a
+huge security risk.  File descriptor passing can be used to give an otherwise
+unprivileged QEMU process access to host devices without running QEMU as root.
+It is also possible to launch QEMU as a non-root user and configure UNIX groups
+for access to @code{/dev/kvm}, @code{/dev/net/tun}, and other device nodes.
+Some Linux distros already ship with UNIX groups for these devices by default.
+
+@itemize
+@item SELinux and AppArmor make it possible to confine processes beyond the
+traditional UNIX process and file permissions model.  They restrict the QEMU
+process from accessing processes and files on the host system that are not
+needed by QEMU.
+
+@item Resource limits and cgroup controllers provide throughput and utilization
+limits on key resources such as CPU time, memory, and I/O bandwidth.
+
+@item Linux namespaces can be used to make process, file system, and other system
+resources unavailable to QEMU.  A namespaced QEMU process is restricted to only
+those resources that were granted to it.
+
+@item Linux seccomp is available via the QEMU @option{--sandbox} option.  It disables
+system calls that are not needed by QEMU, thereby reducing the host kernel
+attack surface.
+@end itemize
diff --git a/qemu-doc.texi b/qemu-doc.texi
index XXXXXXX..XXXXXXX 100644
--- a/qemu-doc.texi
+++ b/qemu-doc.texi
@@ -XXX,XX +XXX,XX @@
 * QEMU Guest Agent::
 * QEMU User space emulator::
 * System requirements::
+* Security::
 * Implementation notes::
 * Deprecated features::
 * Supported build platforms::
@@ -XXX,XX +XXX,XX @@ added with Linux 4.5 which is supported by the major distros. And even
 if RHEL7 has kernel 3.10, KVM there has the required functionality there
 to make it close to a 4.5 or newer kernel.
 
+@include docs/security.texi
+
 @include qemu-tech.texi
 
 @include qemu-deprecated.texi
-- 
2.21.0

The following changes since commit 9cf289af47bcfae5c75de37d8e5d6fd23705322c:

Merge tag 'qga-pull-request' of gitlab.com:marcandre.lureau/qemu into staging (2022-05-04 03:42:49 -0700)

are available in the Git repository at:

https://gitlab.com/stefanha/qemu.git tags/block-pull-request

for you to fetch changes up to bef2e050d6a7feb865854c65570c496ac5a8cf53:

util/event-loop-base: Introduce options to set the thread pool size (2022-05-04 17:02:19 +0100)

----------------------------------------------------------------
Pull request

Add new thread-pool-min/thread-pool-max parameters to control the thread pool
used for async I/O.

----------------------------------------------------------------

Nicolas Saenz Julienne (3):
  Introduce event-loop-base abstract class
  util/main-loop: Introduce the main loop into QOM
  util/event-loop-base: Introduce options to set the thread pool size

-- 
2.35.1

From: Nicolas Saenz Julienne <nsaenzju@redhat.com>

Introduce the 'event-loop-base' abstract class. It will hold the
properties common to all event loops and provide the necessary hooks for
their creation and maintenance. Then have iothread inherit from it.

EventLoopBaseClass is defined as user creatable and provides a hook for
its children to attach themselves to the user creatable class's 'complete'
function. It also provides an update_params() callback to propagate
property changes onto its children.

The new 'event-loop-base' class will live in the root directory. It is
built on its own using the 'link_whole' option (there are no direct
function dependencies between the class and its children, it all happens
through 'constructor' magic). It also imposes new compilation
dependencies:

qom <- event-loop-base <- blockdev (iothread.c)

And in subsequent patches:

qom <- event-loop-base <- qemuutil (util/main-loop.c)

All this forced some amount of reordering in meson.build:

- Moved qom build definition before qemuutil. Doing it the other way
   around (i.e. moving qemuutil after qom) isn't possible as a lot of
   core libraries that live in between the two depend on it.

- Process the 'hw' subdir earlier, as it introduces files into the
   'qom' source set.

No functional changes intended.

Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Acked-by: Markus Armbruster <armbru@redhat.com>
Message-id: 20220425075723.20019-2-nsaenzju@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 qapi/qom.json                    |  22 +++++--
 meson.build                      |  23 ++++---
 include/sysemu/event-loop-base.h |  36 +++++++++++
 include/sysemu/iothread.h        |   6 +-
 event-loop-base.c                | 104 +++++++++++++++++++++++++++++++
 iothread.c                       |  65 ++++++-------------
 6 files changed, 192 insertions(+), 64 deletions(-)
 create mode 100644 include/sysemu/event-loop-base.h
 create mode 100644 event-loop-base.c

diff --git a/qapi/qom.json b/qapi/qom.json
index XXXXXXX..XXXXXXX 100644
--- a/qapi/qom.json
+++ b/qapi/qom.json
@@ -XXX,XX +XXX,XX @@
             '*repeat': 'bool',
             '*grab-toggle': 'GrabToggleKeys' } }
 
+##
+# @EventLoopBaseProperties:
+#
+# Common properties for event loops
+#
+# @aio-max-batch: maximum number of requests in a batch for the AIO engine,
+#                 0 means that the engine will use its default.
+#                 (default: 0)
+#
+# Since: 7.1
+##
+{ 'struct': 'EventLoopBaseProperties',
+  'data': { '*aio-max-batch': 'int' } }
+
 ##
 # @IothreadProperties:
 #
@@ -XXX,XX +XXX,XX @@
 #               algorithm detects it is spending too long polling without
 #               encountering events. 0 selects a default behaviour (default: 0)
 #
-# @aio-max-batch: maximum number of requests in a batch for the AIO engine,
-#                 0 means that the engine will use its default
-#                 (default:0, since 6.1)
+# The @aio-max-batch option is available since 6.1.
 #
 # Since: 2.0
 ##
 { 'struct': 'IothreadProperties',
+  'base': 'EventLoopBaseProperties',
   'data': { '*poll-max-ns': 'int',
             '*poll-grow': 'int',
-            '*poll-shrink': 'int',
-            '*aio-max-batch': 'int' } }
+            '*poll-shrink': 'int' } }
 
 ##
 # @MemoryBackendProperties:
diff --git a/meson.build b/meson.build
index XXXXXXX..XXXXXXX 100644
--- a/meson.build
+++ b/meson.build
@@ -XXX,XX +XXX,XX @@ subdir('qom')
 subdir('authz')
 subdir('crypto')
 subdir('ui')
+subdir('hw')
 
 
 if enable_modules
@@ -XXX,XX +XXX,XX @@ if enable_modules
   modulecommon = declare_dependency(link_whole: libmodulecommon, compile_args: '-DBUILD_DSO')
 endif
 
+qom_ss = qom_ss.apply(config_host, strict: false)
+libqom = static_library('qom', qom_ss.sources() + genh,
+                        dependencies: [qom_ss.dependencies()],
+                        name_suffix: 'fa')
+qom = declare_dependency(link_whole: libqom)
+
+event_loop_base = files('event-loop-base.c')
+event_loop_base = static_library('event-loop-base', sources: event_loop_base + genh,
+                                 build_by_default: true)
+event_loop_base = declare_dependency(link_whole: event_loop_base,
+                                     dependencies: [qom])
+
 stub_ss = stub_ss.apply(config_all, strict: false)
 
 util_ss.add_all(trace_ss)
@@ -XXX,XX +XXX,XX @@ subdir('monitor')
 subdir('net')
 subdir('replay')
 subdir('semihosting')
-subdir('hw')
 subdir('tcg')
 subdir('fpu')
 subdir('accel')
@@ -XXX,XX +XXX,XX @@ qemu_syms = custom_target('qemu.syms', output: 'qemu.syms',
                              capture: true,
                              command: [undefsym, nm, '@INPUT@'])
 
-qom_ss = qom_ss.apply(config_host, strict: false)
-libqom = static_library('qom', qom_ss.sources() + genh,
-                        dependencies: [qom_ss.dependencies()],
-                        name_suffix: 'fa')
-
-qom = declare_dependency(link_whole: libqom)
-
 authz_ss = authz_ss.apply(config_host, strict: false)
 libauthz = static_library('authz', authz_ss.sources() + genh,
                           dependencies: [authz_ss.dependencies()],
@@ -XXX,XX +XXX,XX @@ libblockdev = static_library('blockdev', blockdev_ss.sources() + genh,
                              build_by_default: false)
 
 blockdev = declare_dependency(link_whole: [libblockdev],
-                              dependencies: [block])
+                              dependencies: [block, event_loop_base])
 
 qmp_ss = qmp_ss.apply(config_host, strict: false)
 libqmp = static_library('qmp', qmp_ss.sources() + genh,
diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/include/sysemu/event-loop-base.h
@@ -XXX,XX +XXX,XX @@
+/*
+ * QEMU event-loop backend
+ *
+ * Copyright (C) 2022 Red Hat Inc
+ *
+ * Authors:
+ *  Nicolas Saenz Julienne <nsaenzju@redhat.com>
+ *
+ * This work is licensed under the terms of the GNU GPL, version 2 or later.
+ * See the COPYING file in the top-level directory.
+ */
+#ifndef QEMU_EVENT_LOOP_BASE_H
+#define QEMU_EVENT_LOOP_BASE_H
+
+#include "qom/object.h"
+#include "block/aio.h"
+#include "qemu/typedefs.h"
+
+#define TYPE_EVENT_LOOP_BASE         "event-loop-base"
+OBJECT_DECLARE_TYPE(EventLoopBase, EventLoopBaseClass,
+                    EVENT_LOOP_BASE)
+
+struct EventLoopBaseClass {
+    ObjectClass parent_class;
+
+    void (*init)(EventLoopBase *base, Error **errp);
+    void (*update_params)(EventLoopBase *base, Error **errp);
+};
+
+struct EventLoopBase {
+    Object parent;
+
+    /* AioContext AIO engine parameters */
+    int64_t aio_max_batch;
+};
+#endif
diff --git a/include/sysemu/iothread.h b/include/sysemu/iothread.h
index XXXXXXX..XXXXXXX 100644
--- a/include/sysemu/iothread.h
+++ b/include/sysemu/iothread.h
@@ -XXX,XX +XXX,XX @@
 #include "block/aio.h"
 #include "qemu/thread.h"
 #include "qom/object.h"
+#include "sysemu/event-loop-base.h"
 
 #define TYPE_IOTHREAD "iothread"
 
 struct IOThread {
-    Object parent_obj;
+    EventLoopBase parent_obj;
 
     QemuThread thread;
     AioContext *ctx;
@@ -XXX,XX +XXX,XX @@ struct IOThread {
     int64_t poll_max_ns;
     int64_t poll_grow;
     int64_t poll_shrink;
-
-    /* AioContext AIO engine parameters */
-    int64_t aio_max_batch;
 };
 typedef struct IOThread IOThread;
 
diff --git a/event-loop-base.c b/event-loop-base.c
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/event-loop-base.c
@@ -XXX,XX +XXX,XX @@
+/*
+ * QEMU event-loop base
+ *
+ * Copyright (C) 2022 Red Hat Inc
+ *
+ * Authors:
+ *  Stefan Hajnoczi <stefanha@redhat.com>
+ *  Nicolas Saenz Julienne <nsaenzju@redhat.com>
+ *
+ * This work is licensed under the terms of the GNU GPL, version 2 or later.
+ * See the COPYING file in the top-level directory.
+ */
+
+#include "qemu/osdep.h"
+#include "qom/object_interfaces.h"
+#include "qapi/error.h"
+#include "sysemu/event-loop-base.h"
+
+typedef struct {
+    const char *name;
+    ptrdiff_t offset; /* field's byte offset in EventLoopBase struct */
+} EventLoopBaseParamInfo;
+
+static EventLoopBaseParamInfo aio_max_batch_info = {
+    "aio-max-batch", offsetof(EventLoopBase, aio_max_batch),
+};
+
+static void event_loop_base_get_param(Object *obj, Visitor *v,
+        const char *name, void *opaque, Error **errp)
+{
+    EventLoopBase *event_loop_base = EVENT_LOOP_BASE(obj);
+    EventLoopBaseParamInfo *info = opaque;
+    int64_t *field = (void *)event_loop_base + info->offset;
+
+    visit_type_int64(v, name, field, errp);
+}
+
+static void event_loop_base_set_param(Object *obj, Visitor *v,
+        const char *name, void *opaque, Error **errp)
+{
+    EventLoopBaseClass *bc = EVENT_LOOP_BASE_GET_CLASS(obj);
+    EventLoopBase *base = EVENT_LOOP_BASE(obj);
+    EventLoopBaseParamInfo *info = opaque;
+    int64_t *field = (void *)base + info->offset;
+    int64_t value;
+
+    if (!visit_type_int64(v, name, &value, errp)) {
+        return;
+    }
+
+    if (value < 0) {
+        error_setg(errp, "%s value must be in range [0, %" PRId64 "]",
+                   info->name, INT64_MAX);
+        return;
+    }
+
+    *field = value;
+
+    if (bc->update_params) {
+        bc->update_params(base, errp);
+    }
+
+    return;
+}
+
+static void event_loop_base_complete(UserCreatable *uc, Error **errp)
+{
+    EventLoopBaseClass *bc = EVENT_LOOP_BASE_GET_CLASS(uc);
+    EventLoopBase *base = EVENT_LOOP_BASE(uc);
+
+    if (bc->init) {
+        bc->init(base, errp);
+    }
+}
+
+static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
+{
+    UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
+    ucc->complete = event_loop_base_complete;
+
+    object_class_property_add(klass, "aio-max-batch", "int",
+                              event_loop_base_get_param,
+                              event_loop_base_set_param,
+                              NULL, &aio_max_batch_info);
+}
+
+static const TypeInfo event_loop_base_info = {
+    .name = TYPE_EVENT_LOOP_BASE,
+    .parent = TYPE_OBJECT,
+    .instance_size = sizeof(EventLoopBase),
+    .class_size = sizeof(EventLoopBaseClass),
+    .class_init = event_loop_base_class_init,
+    .abstract = true,
+    .interfaces = (InterfaceInfo[]) {
+        { TYPE_USER_CREATABLE },
+        { }
+    }
+};
+
+static void register_types(void)
+{
+    type_register_static(&event_loop_base_info);
+}
+type_init(register_types);
diff --git a/iothread.c b/iothread.c
index XXXXXXX..XXXXXXX 100644
--- a/iothread.c
+++ b/iothread.c
@@ -XXX,XX +XXX,XX @@
 #include "qemu/module.h"
 #include "block/aio.h"
 #include "block/block.h"
+#include "sysemu/event-loop-base.h"
 #include "sysemu/iothread.h"
 #include "qapi/error.h"
 #include "qapi/qapi-commands-misc.h"
@@ -XXX,XX +XXX,XX @@ static void iothread_init_gcontext(IOThread *iothread)
     iothread->main_loop = g_main_loop_new(iothread->worker_context, TRUE);
 }
 
-static void iothread_set_aio_context_params(IOThread *iothread, Error **errp)
+static void iothread_set_aio_context_params(EventLoopBase *base, Error **errp)
 {
+    IOThread *iothread = IOTHREAD(base);
     ERRP_GUARD();
 
+    if (!iothread->ctx) {
+        return;
+    }
+
     aio_context_set_poll_params(iothread->ctx,
                                 iothread->poll_max_ns,
                                 iothread->poll_grow,
@@ -XXX,XX +XXX,XX @@ static void iothread_set_aio_context_params(IOThread *iothread, Error **errp)
     }
 
     aio_context_set_aio_params(iothread->ctx,
-                               iothread->aio_max_batch,
+                               iothread->parent_obj.aio_max_batch,
                                errp);
 }
 
-static void iothread_complete(UserCreatable *obj, Error **errp)
+
+static void iothread_init(EventLoopBase *base, Error **errp)
 {
     Error *local_error = NULL;
-    IOThread *iothread = IOTHREAD(obj);
+    IOThread *iothread = IOTHREAD(base);
     char *thread_name;
 
     iothread->stopping = false;
@@ -XXX,XX +XXX,XX @@ static void iothread_complete(UserCreatable *obj, Error **errp)
      */
     iothread_init_gcontext(iothread);
 
-    iothread_set_aio_context_params(iothread, &local_error);
+    iothread_set_aio_context_params(base, &local_error);
     if (local_error) {
         error_propagate(errp, local_error);
         aio_context_unref(iothread->ctx);
@@ -XXX,XX +XXX,XX @@ static void iothread_complete(UserCreatable *obj, Error **errp)
      * to inherit.
      */
     thread_name = g_strdup_printf("IO %s",
-                        object_get_canonical_path_component(OBJECT(obj)));
+                        object_get_canonical_path_component(OBJECT(base)));
     qemu_thread_create(&iothread->thread, thread_name, iothread_run,
                        iothread, QEMU_THREAD_JOINABLE);
     g_free(thread_name);
@@ -XXX,XX +XXX,XX @@ static IOThreadParamInfo poll_grow_info = {
 static IOThreadParamInfo poll_shrink_info = {
     "poll-shrink", offsetof(IOThread, poll_shrink),
 };
-static IOThreadParamInfo aio_max_batch_info = {
-    "aio-max-batch", offsetof(IOThread, aio_max_batch),
-};
 
 static void iothread_get_param(Object *obj, Visitor *v,
         const char *name, IOThreadParamInfo *info, Error **errp)
@@ -XXX,XX +XXX,XX @@ static void iothread_set_poll_param(Object *obj, Visitor *v,
     }
 }
 
-static void iothread_get_aio_param(Object *obj, Visitor *v,
-        const char *name, void *opaque, Error **errp)
-{
-    IOThreadParamInfo *info = opaque;
-
-    iothread_get_param(obj, v, name, info, errp);
-}
-
-static void iothread_set_aio_param(Object *obj, Visitor *v,
-        const char *name, void *opaque, Error **errp)
-{
-    IOThread *iothread = IOTHREAD(obj);
-    IOThreadParamInfo *info = opaque;
-
-    if (!iothread_set_param(obj, v, name, info, errp)) {
-        return;
-    }
-
-    if (iothread->ctx) {
-        aio_context_set_aio_params(iothread->ctx,
-                                   iothread->aio_max_batch,
-                                   errp);
-    }
-}
-
 static void iothread_class_init(ObjectClass *klass, void *class_data)
 {
-    UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
-    ucc->complete = iothread_complete;
+    EventLoopBaseClass *bc = EVENT_LOOP_BASE_CLASS(klass);
+
+    bc->init = iothread_init;
+    bc->update_params = iothread_set_aio_context_params;
 
     object_class_property_add(klass, "poll-max-ns", "int",
                               iothread_get_poll_param,
@@ -XXX,XX +XXX,XX @@ static void iothread_class_init(ObjectClass *klass, void *class_data)
                               iothread_get_poll_param,
                               iothread_set_poll_param,
                               NULL, &poll_shrink_info);
-    object_class_property_add(klass, "aio-max-batch", "int",
-                              iothread_get_aio_param,
-                              iothread_set_aio_param,
-                              NULL, &aio_max_batch_info);
 }
 
 static const TypeInfo iothread_info = {
     .name = TYPE_IOTHREAD,
-    .parent = TYPE_OBJECT,
+    .parent = TYPE_EVENT_LOOP_BASE,
     .class_init = iothread_class_init,
     .instance_size = sizeof(IOThread),
     .instance_init = iothread_instance_init,
     .instance_finalize = iothread_instance_finalize,
-    .interfaces = (InterfaceInfo[]) {
-        {TYPE_USER_CREATABLE},
-        {}
-    },
 };
 
 static void iothread_register_types(void)
@@ -XXX,XX +XXX,XX @@ static int query_one_iothread(Object *object, void *opaque)
     info->poll_max_ns = iothread->poll_max_ns;
     info->poll_grow = iothread->poll_grow;
     info->poll_shrink = iothread->poll_shrink;
-    info->aio_max_batch = iothread->aio_max_batch;
+    info->aio_max_batch = iothread->parent_obj.aio_max_batch;
 
     QAPI_LIST_APPEND(*tail, info);
     return 0;
-- 
2.35.1

From: Nicolas Saenz Julienne <nsaenzju@redhat.com>

'event-loop-base' provides basic property handling for all 'AioContext'
based event loops. So let's define a new 'MainLoopClass' that inherits
from it. This will permit tweaking the main loop's properties through
qapi as well as through the command line using the '-object' keyword[1].
Only one instance of 'MainLoopClass' may be created at any time.

'EventLoopBaseClass' learns a new callback, 'can_be_deleted()', so as to
mark 'MainLoop' as non-deletable.

[1] For example:
      -object main-loop,id=main-loop,aio-max-batch=<value>

Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Acked-by: Markus Armbruster <armbru@redhat.com>
Message-id: 20220425075723.20019-3-nsaenzju@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 qapi/qom.json                    | 13 ++++++++
 meson.build                      |  3 +-
 include/qemu/main-loop.h         | 10 ++++++
 include/sysemu/event-loop-base.h |  1 +
 event-loop-base.c                | 13 ++++++++
 util/main-loop.c                 | 56 ++++++++++++++++++++++++++++++++
 6 files changed, 95 insertions(+), 1 deletion(-)

diff --git a/qapi/qom.json b/qapi/qom.json
index XXXXXXX..XXXXXXX 100644
--- a/qapi/qom.json
+++ b/qapi/qom.json
@@ -XXX,XX +XXX,XX @@
             '*poll-grow': 'int',
             '*poll-shrink': 'int' } }
 
+##
+# @MainLoopProperties:
+#
+# Properties for the main-loop object.
+#
+# Since: 7.1
+##
+{ 'struct': 'MainLoopProperties',
+  'base': 'EventLoopBaseProperties',
+  'data': {} }
+
 ##
 # @MemoryBackendProperties:
 #
@@ -XXX,XX +XXX,XX @@
     { 'name': 'input-linux',
       'if': 'CONFIG_LINUX' },
     'iothread',
+    'main-loop',
     { 'name': 'memory-backend-epc',
       'if': 'CONFIG_LINUX' },
     'memory-backend-file',
@@ -XXX,XX +XXX,XX @@
       'input-linux':                { 'type': 'InputLinuxProperties',
                                       'if': 'CONFIG_LINUX' },
       'iothread':                   'IothreadProperties',
+      'main-loop':                  'MainLoopProperties',
       'memory-backend-epc':         { 'type': 'MemoryBackendEpcProperties',
                                       'if': 'CONFIG_LINUX' },
       'memory-backend-file':        'MemoryBackendFileProperties',
diff --git a/meson.build b/meson.build
index XXXXXXX..XXXXXXX 100644
--- a/meson.build
+++ b/meson.build
@@ -XXX,XX +XXX,XX @@ libqemuutil = static_library('qemuutil',
                              sources: util_ss.sources() + stub_ss.sources() + genh,
                              dependencies: [util_ss.dependencies(), libm, threads, glib, socket, malloc, pixman])
 qemuutil = declare_dependency(link_with: libqemuutil,
-                              sources: genh + version_res)
+                              sources: genh + version_res,
+                              dependencies: [event_loop_base])
 
 if have_system or have_user
   decodetree = generator(find_program('scripts/decodetree.py'),
diff --git a/include/qemu/main-loop.h b/include/qemu/main-loop.h
index XXXXXXX..XXXXXXX 100644
--- a/include/qemu/main-loop.h
+++ b/include/qemu/main-loop.h
@@ -XXX,XX +XXX,XX @@
 #define QEMU_MAIN_LOOP_H
 
 #include "block/aio.h"
+#include "qom/object.h"
+#include "sysemu/event-loop-base.h"
 
 #define SIG_IPI SIGUSR1
 
+#define TYPE_MAIN_LOOP  "main-loop"
+OBJECT_DECLARE_TYPE(MainLoop, MainLoopClass, MAIN_LOOP)
+
+/*
+ * Instance state of the "main-loop" QOM object. It adds no fields of its own
+ * on top of the EventLoopBase parent.
+ */
+struct MainLoop {
+    EventLoopBase parent_obj;
+};
+typedef struct MainLoop MainLoop;
+
 /**
  * qemu_init_main_loop: Set up the process so that it can run the main loop.
  *
diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
index XXXXXXX..XXXXXXX 100644
--- a/include/sysemu/event-loop-base.h
+++ b/include/sysemu/event-loop-base.h
@@ -XXX,XX +XXX,XX @@ struct EventLoopBaseClass {
 
     void (*init)(EventLoopBase *base, Error **errp);
     void (*update_params)(EventLoopBase *base, Error **errp);
+    bool (*can_be_deleted)(EventLoopBase *base);
 };
 
 struct EventLoopBase {
diff --git a/event-loop-base.c b/event-loop-base.c
index XXXXXXX..XXXXXXX 100644
--- a/event-loop-base.c
+++ b/event-loop-base.c
@@ -XXX,XX +XXX,XX @@ static void event_loop_base_complete(UserCreatable *uc, Error **errp)
     }
 }
 
+/*
+ * UserCreatable 'can_be_deleted' hook shared by all event loop objects.
+ *
+ * Defers the decision to the subclass' optional can_be_deleted() callback;
+ * objects whose class does not provide one are always deletable.
+ */
+static bool event_loop_base_can_be_deleted(UserCreatable *uc)
+{
+    EventLoopBase *base = EVENT_LOOP_BASE(uc);
+    EventLoopBaseClass *klass = EVENT_LOOP_BASE_GET_CLASS(uc);
+
+    /* No veto callback installed: nothing prevents deletion. */
+    if (!klass->can_be_deleted) {
+        return true;
+    }
+
+    return klass->can_be_deleted(base);
+}
+
 static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
 {
     UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
     ucc->complete = event_loop_base_complete;
+    ucc->can_be_deleted = event_loop_base_can_be_deleted;
 
     object_class_property_add(klass, "aio-max-batch", "int",
                               event_loop_base_get_param,
diff --git a/util/main-loop.c b/util/main-loop.c
index XXXXXXX..XXXXXXX 100644
--- a/util/main-loop.c
+++ b/util/main-loop.c
@@ -XXX,XX +XXX,XX @@
 #include "qemu/error-report.h"
 #include "qemu/queue.h"
 #include "qemu/compiler.h"
+#include "qom/object.h"
 
 #ifndef _WIN32
 #include <sys/wait.h>
@@ -XXX,XX +XXX,XX @@ int qemu_init_main_loop(Error **errp)
     return 0;
 }
 
+static void main_loop_update_params(EventLoopBase *base, Error **errp)
+{
+    if (!qemu_aio_context) {
+        error_setg(errp, "qemu aio context not ready");
+        return;
+    }
+
+    aio_context_set_aio_params(qemu_aio_context, base->aio_max_batch, errp);
+}
+
+MainLoop *mloop;
+
+/*
+ * EventLoopBase 'init' hook for the "main-loop" object.
+ *
+ * Rejects a second instance, applies the object's parameters to the main
+ * loop's AioContext and, only once that has succeeded, records the object as
+ * the single main-loop instance.
+ *
+ * @base: the object being initialized
+ * @errp: set when an instance already exists or the parameters are rejected
+ */
+static void main_loop_init(EventLoopBase *base, Error **errp)
+{
+    ERRP_GUARD();
+    MainLoop *m = MAIN_LOOP(base);
+
+    if (mloop) {
+        error_setg(errp, "only one main-loop instance allowed");
+        return;
+    }
+
+    main_loop_update_params(base, errp);
+    if (*errp) {
+        /*
+         * Do not claim the singleton slot for an object whose parameters
+         * were rejected: leaving 'mloop' unset lets a later attempt with
+         * valid parameters succeed.
+         */
+        return;
+    }
+
+    mloop = m;
+}
+
+/*
+ * EventLoopBase 'can_be_deleted' hook: unconditionally refuses deletion of
+ * the "main-loop" object. @base is not inspected.
+ */
+static bool main_loop_can_be_deleted(EventLoopBase *base)
+{
+    return false;
+}
+
+/*
+ * Class initializer for TYPE_MAIN_LOOP: installs the main loop's
+ * implementations of the EventLoopBaseClass callbacks.
+ */
+static void main_loop_class_init(ObjectClass *oc, void *class_data)
+{
+    EventLoopBaseClass *bc = EVENT_LOOP_BASE_CLASS(oc);
+
+    bc->init = main_loop_init;
+    bc->update_params = main_loop_update_params;
+    /* The main loop object refuses deletion, see main_loop_can_be_deleted() */
+    bc->can_be_deleted = main_loop_can_be_deleted;
+}
+
+/* Type description of "main-loop", a child of the event-loop-base type. */
+static const TypeInfo main_loop_info = {
+    .name = TYPE_MAIN_LOOP,
+    .parent = TYPE_EVENT_LOOP_BASE,
+    .class_init = main_loop_class_init,
+    .instance_size = sizeof(MainLoop),
+};
+
+/* Registers main_loop_info; hooked up through type_init() below. */
+static void main_loop_register_types(void)
+{
+    type_register_static(&main_loop_info);
+}
+
+type_init(main_loop_register_types)
+
 static int max_priority;
 
 #ifndef _WIN32
-- 
2.35.1

From: Nicolas Saenz Julienne <nsaenzju@redhat.com>

The thread pool regulates itself: when idle, it kills threads until
empty; when in demand, it creates new threads until full. This behaviour
doesn't play well with latency sensitive workloads where the price of
creating a new thread is too high. For example, when paired with qemu's
'-mlock', or using safety features like SafeStack, creating a new thread
has been measured to take multiple milliseconds.

In order to mitigate this let's introduce a new 'EventLoopBase'
property to set the thread pool size. The threads will be created during
the pool's initialization or upon updating the property's value, remain
available during its lifetime regardless of demand, and destroyed upon
freeing it. A properly characterized workload will then be able to
configure the pool to avoid any latency spikes.

Signed-off-by: Nicolas Saenz Julienne <nsaenzju@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Acked-by: Markus Armbruster <armbru@redhat.com>
Message-id: 20220425075723.20019-4-nsaenzju@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
 qapi/qom.json                    | 10 +++++-
 include/block/aio.h              | 10 ++++++
 include/block/thread-pool.h      |  3 ++
 include/sysemu/event-loop-base.h |  4 +++
 event-loop-base.c                | 23 +++++++++++++
 iothread.c                       |  3 ++
 util/aio-posix.c                 |  1 +
 util/async.c                     | 20 ++++++++++++
 util/main-loop.c                 |  9 ++++++
 util/thread-pool.c               | 55 +++++++++++++++++++++++++++++---
 10 files changed, 133 insertions(+), 5 deletions(-)

diff --git a/qapi/qom.json b/qapi/qom.json
index XXXXXXX..XXXXXXX 100644
--- a/qapi/qom.json
+++ b/qapi/qom.json
@@ -XXX,XX +XXX,XX @@
 #                 0 means that the engine will use its default.
 #                 (default: 0)
 #
+# @thread-pool-min: minimum number of threads reserved in the thread pool
+#                   (default: 0)
+#
+# @thread-pool-max: maximum number of threads the thread pool can contain
+#                   (default: 64)
+#
 # Since: 7.1
 ##
 { 'struct': 'EventLoopBaseProperties',
-  'data': { '*aio-max-batch': 'int' } }
+  'data': { '*aio-max-batch': 'int',
+            '*thread-pool-min': 'int',
+            '*thread-pool-max': 'int' } }
 
 ##
 # @IothreadProperties:
diff --git a/include/block/aio.h b/include/block/aio.h
index XXXXXXX..XXXXXXX 100644
--- a/include/block/aio.h
+++ b/include/block/aio.h
@@ -XXX,XX +XXX,XX @@ struct AioContext {
     QSLIST_HEAD(, Coroutine) scheduled_coroutines;
     QEMUBH *co_schedule_bh;
 
+    int thread_pool_min;
+    int thread_pool_max;
     /* Thread pool for performing work and receiving completion callbacks.
      * Has its own locking.
      */
@@ -XXX,XX +XXX,XX @@ void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
 void aio_context_set_aio_params(AioContext *ctx, int64_t max_batch,
                                 Error **errp);
 
+/**
+ * aio_context_set_thread_pool_params:
+ * @ctx: the aio context
+ * @min: min number of threads to have readily available in the thread pool
+ * @max: max number of threads the thread pool can contain
+ * @errp: set when the values are rejected (for example @min greater than
+ *        @max, or @max equal to zero); @ctx is left untouched in that case
+ */
+void aio_context_set_thread_pool_params(AioContext *ctx, int64_t min,
+                                        int64_t max, Error **errp);
 #endif
diff --git a/include/block/thread-pool.h b/include/block/thread-pool.h
index XXXXXXX..XXXXXXX 100644
--- a/include/block/thread-pool.h
+++ b/include/block/thread-pool.h
@@ -XXX,XX +XXX,XX @@
 
 #include "block/block.h"
 
+#define THREAD_POOL_MAX_THREADS_DEFAULT         64
+
 typedef int ThreadPoolFunc(void *opaque);
 
 typedef struct ThreadPool ThreadPool;
@@ -XXX,XX +XXX,XX @@ BlockAIOCB *thread_pool_submit_aio(ThreadPool *pool,
 int coroutine_fn thread_pool_submit_co(ThreadPool *pool,
         ThreadPoolFunc *func, void *arg);
 void thread_pool_submit(ThreadPool *pool, ThreadPoolFunc *func, void *arg);
+void thread_pool_update_params(ThreadPool *pool, struct AioContext *ctx);
 
 #endif
diff --git a/include/sysemu/event-loop-base.h b/include/sysemu/event-loop-base.h
index XXXXXXX..XXXXXXX 100644
--- a/include/sysemu/event-loop-base.h
+++ b/include/sysemu/event-loop-base.h
@@ -XXX,XX +XXX,XX @@ struct EventLoopBase {
 
     /* AioContext AIO engine parameters */
     int64_t aio_max_batch;
+
+    /* AioContext thread pool parameters */
+    int64_t thread_pool_min;
+    int64_t thread_pool_max;
 };
 #endif
diff --git a/event-loop-base.c b/event-loop-base.c
index XXXXXXX..XXXXXXX 100644
--- a/event-loop-base.c
+++ b/event-loop-base.c
@@ -XXX,XX +XXX,XX @@
 #include "qemu/osdep.h"
 #include "qom/object_interfaces.h"
 #include "qapi/error.h"
+#include "block/thread-pool.h"
 #include "sysemu/event-loop-base.h"
 
 typedef struct {
@@ -XXX,XX +XXX,XX @@ typedef struct {
     ptrdiff_t offset; /* field's byte offset in EventLoopBase struct */
 } EventLoopBaseParamInfo;
 
+/*
+ * Instance initializer: seeds the only parameter whose default is not zero.
+ * A thread-pool-max of 0 would be rejected by
+ * aio_context_set_thread_pool_params().
+ */
+static void event_loop_base_instance_init(Object *obj)
+{
+    EventLoopBase *base = EVENT_LOOP_BASE(obj);
+
+    base->thread_pool_max = THREAD_POOL_MAX_THREADS_DEFAULT;
+}
+
 static EventLoopBaseParamInfo aio_max_batch_info = {
     "aio-max-batch", offsetof(EventLoopBase, aio_max_batch),
 };
+static EventLoopBaseParamInfo thread_pool_min_info = {
+    "thread-pool-min", offsetof(EventLoopBase, thread_pool_min),
+};
+static EventLoopBaseParamInfo thread_pool_max_info = {
+    "thread-pool-max", offsetof(EventLoopBase, thread_pool_max),
+};
 
 static void event_loop_base_get_param(Object *obj, Visitor *v,
         const char *name, void *opaque, Error **errp)
@@ -XXX,XX +XXX,XX @@ static void event_loop_base_class_init(ObjectClass *klass, void *class_data)
                               event_loop_base_get_param,
                               event_loop_base_set_param,
                               NULL, &aio_max_batch_info);
+    object_class_property_add(klass, "thread-pool-min", "int",
+                              event_loop_base_get_param,
+                              event_loop_base_set_param,
+                              NULL, &thread_pool_min_info);
+    object_class_property_add(klass, "thread-pool-max", "int",
+                              event_loop_base_get_param,
+                              event_loop_base_set_param,
+                              NULL, &thread_pool_max_info);
 }
 
 static const TypeInfo event_loop_base_info = {
     .name = TYPE_EVENT_LOOP_BASE,
     .parent = TYPE_OBJECT,
     .instance_size = sizeof(EventLoopBase),
+    .instance_init = event_loop_base_instance_init,
     .class_size = sizeof(EventLoopBaseClass),
     .class_init = event_loop_base_class_init,
     .abstract = true,
diff --git a/iothread.c b/iothread.c
index XXXXXXX..XXXXXXX 100644
--- a/iothread.c
+++ b/iothread.c
@@ -XXX,XX +XXX,XX @@ static void iothread_set_aio_context_params(EventLoopBase *base, Error **errp)
     aio_context_set_aio_params(iothread->ctx,
                                iothread->parent_obj.aio_max_batch,
                                errp);
+
+    aio_context_set_thread_pool_params(iothread->ctx, base->thread_pool_min,
+                                       base->thread_pool_max, errp);
 }
 
 
diff --git a/util/aio-posix.c b/util/aio-posix.c
index XXXXXXX..XXXXXXX 100644
--- a/util/aio-posix.c
+++ b/util/aio-posix.c
@@ -XXX,XX +XXX,XX @@
 
 #include "qemu/osdep.h"
 #include "block/block.h"
+#include "block/thread-pool.h"
 #include "qemu/main-loop.h"
 #include "qemu/rcu.h"
 #include "qemu/rcu_queue.h"
diff --git a/util/async.c b/util/async.c
index XXXXXXX..XXXXXXX 100644
--- a/util/async.c
+++ b/util/async.c
@@ -XXX,XX +XXX,XX @@ AioContext *aio_context_new(Error **errp)
 
     ctx->aio_max_batch = 0;
 
+    ctx->thread_pool_min = 0;
+    ctx->thread_pool_max = THREAD_POOL_MAX_THREADS_DEFAULT;
+
     return ctx;
 fail:
     g_source_destroy(&ctx->source);
@@ -XXX,XX +XXX,XX @@ void qemu_set_current_aio_context(AioContext *ctx)
     assert(!get_my_aiocontext());
     set_my_aiocontext(ctx);
 }
+
+/*
+ * Validate and apply new thread pool limits to @ctx.
+ *
+ * @ctx:  the aio context
+ * @min:  number of threads to keep readily available, 0 <= @min <= @max
+ * @max:  upper bound on the number of threads, 1 <= @max <= INT_MAX
+ * @errp: set when the values are out of range; @ctx is then left untouched
+ *
+ * If @ctx already owns a thread pool, the pool is updated right away.
+ */
+void aio_context_set_thread_pool_params(AioContext *ctx, int64_t min,
+                                        int64_t max, Error **errp)
+{
+    /*
+     * The limits end up in 'int' fields and are used as thread counts, so
+     * negative values must be refused as well as values above INT_MAX.
+     * min <= max <= INT_MAX also bounds min from above.
+     */
+    if (min < 0 || max <= 0 || min > max || max > INT_MAX) {
+        error_setg(errp, "bad thread-pool-min/thread-pool-max values");
+        return;
+    }
+
+    ctx->thread_pool_min = min;
+    ctx->thread_pool_max = max;
+
+    if (ctx->thread_pool) {
+        thread_pool_update_params(ctx->thread_pool, ctx);
+    }
+}
diff --git a/util/main-loop.c b/util/main-loop.c
index XXXXXXX..XXXXXXX 100644
--- a/util/main-loop.c
+++ b/util/main-loop.c
@@ -XXX,XX +XXX,XX @@
 #include "sysemu/replay.h"
 #include "qemu/main-loop.h"
 #include "block/aio.h"
+#include "block/thread-pool.h"
 #include "qemu/error-report.h"
 #include "qemu/queue.h"
 #include "qemu/compiler.h"
@@ -XXX,XX +XXX,XX @@ int qemu_init_main_loop(Error **errp)
 
 static void main_loop_update_params(EventLoopBase *base, Error **errp)
 {
+    ERRP_GUARD();
+
     if (!qemu_aio_context) {
         error_setg(errp, "qemu aio context not ready");
         return;
     }
 
     aio_context_set_aio_params(qemu_aio_context, base->aio_max_batch, errp);
+    if (*errp) {
+        return;
+    }
+
+    aio_context_set_thread_pool_params(qemu_aio_context, base->thread_pool_min,
+                                       base->thread_pool_max, errp);
 }
 
 MainLoop *mloop;
diff --git a/util/thread-pool.c b/util/thread-pool.c
index XXXXXXX..XXXXXXX 100644
--- a/util/thread-pool.c
+++ b/util/thread-pool.c
@@ -XXX,XX +XXX,XX @@ struct ThreadPool {
     QemuMutex lock;
     QemuCond worker_stopped;
     QemuSemaphore sem;
-    int max_threads;
     QEMUBH *new_thread_bh;
 
     /* The following variables are only accessed from one AioContext. */
@@ -XXX,XX +XXX,XX @@ struct ThreadPool {
     int new_threads;     /* backlog of threads we need to create */
     int pending_threads; /* threads created but not running yet */
     bool stopping;
+    int min_threads;
+    int max_threads;
 };
 
+/*
+ * Decide whether a worker whose semaphore wait returned @ret should wait
+ * again instead of leaving its idle loop.
+ */
+static inline bool back_to_sleep(ThreadPool *pool, int ret)
+{
+    /* Only a timed out wait (-1) is a candidate for going back to sleep. */
+    if (ret != -1) {
+        return false;
+    }
+
+    /*
+     * The semaphore timed out, which normally ends the loop. Keep waiting if:
+     *  - There is work to do, we raced with the signal.
+     *  - The max threads threshold just changed, we raced with the signal.
+     *  - The thread pool forces a minimum number of readily available threads.
+     */
+    return !QTAILQ_EMPTY(&pool->request_list) ||
+           pool->cur_threads > pool->max_threads ||
+           pool->cur_threads <= pool->min_threads;
+}
+
 static void *worker_thread(void *opaque)
 {
     ThreadPool *pool = opaque;
@@ -XXX,XX +XXX,XX @@ static void *worker_thread(void *opaque)
             ret = qemu_sem_timedwait(&pool->sem, 10000);
             qemu_mutex_lock(&pool->lock);
             pool->idle_threads--;
-        } while (ret == -1 && !QTAILQ_EMPTY(&pool->request_list));
-        if (ret == -1 || pool->stopping) {
+        } while (back_to_sleep(pool, ret));
+        if (ret == -1 || pool->stopping ||
+            pool->cur_threads > pool->max_threads) {
             break;
         }
 
@@ -XXX,XX +XXX,XX @@ void thread_pool_submit(ThreadPool *pool, ThreadPoolFunc *func, void *arg)
     thread_pool_submit_aio(pool, func, arg, NULL, NULL);
 }
 
+/*
+ * Refresh @pool's min/max thread limits from @ctx and nudge the pool towards
+ * them. The whole update runs with pool->lock held.
+ */
+void thread_pool_update_params(ThreadPool *pool, AioContext *ctx)
+{
+    qemu_mutex_lock(&pool->lock);
+
+    pool->min_threads = ctx->thread_pool_min;
+    pool->max_threads = ctx->thread_pool_max;
+
+    /*
+     * We either have to:
+     *  - Increase the number of available threads until the min_threads
+     *    threshold is reached.
+     *  - Wake up one worker per thread above the max_threads threshold, so
+     *    that the excess threads can exit.
+     *  - Do nothing. The current number of threads falls in between the min
+     *    and max thresholds. We'll let the pool manage itself.
+     */
+    for (int i = pool->cur_threads; i < pool->min_threads; i++) {
+        spawn_thread(pool);
+    }
+
+    for (int i = pool->cur_threads; i > pool->max_threads; i--) {
+        qemu_sem_post(&pool->sem);
+    }
+
+    qemu_mutex_unlock(&pool->lock);
+}
+
 static void thread_pool_init_one(ThreadPool *pool, AioContext *ctx)
 {
     if (!ctx) {
@@ -XXX,XX +XXX,XX @@ static void thread_pool_init_one(ThreadPool *pool, AioContext *ctx)
     qemu_mutex_init(&pool->lock);
     qemu_cond_init(&pool->worker_stopped);
     qemu_sem_init(&pool->sem, 0);
-    pool->max_threads = 64;
     pool->new_thread_bh = aio_bh_new(ctx, spawn_thread_bh_fn, pool);
 
     QLIST_INIT(&pool->head);
     QTAILQ_INIT(&pool->request_list);
+
+    thread_pool_update_params(pool, ctx);
 }
 
 ThreadPool *thread_pool_new(AioContext *ctx)
-- 
2.35.1