Series comparison

-[PULL 00/26] target-arm queue
+[PULL 00/36] target-arm queue
-The following changes since commit 64ada298b98a51eb2512607f6e6180cb330c47b1:
+Hi; here's another arm pullreq; by volume most of this is
 refactoring from me, but there are also some bugfixes and
 other bits and pieces here.
-  Merge remote-tracking branch 'remotes/legoater/tags/pull-ppc-20220302' into staging (2022-03-02 12:38:46 +0000)
+thanks
 -- PMM
 The following changes since commit ed734377ab3f3f3cc15d7aa301a87ab6370f2eed:
   Merge tag 'linux-user-fix-gupnp-pull-request' of https://github.com/hdeller/qemu-hppa into staging (2025-01-24 14:43:07 -0500)
 are available in the Git repository at:
-  https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20220302
+  https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20250128-1
-for you to fetch changes up to 268c11984e67867c22f53beb3c7f8b98900d66b2:
+for you to fetch changes up to 664280abddcb3cacc9c6204706bb739fcc1316f7:
-  ui/cocoa.m: Remove unnecessary NSAutoreleasePools (2022-03-02 19:27:37 +0000)
+  hw/usb/canokey: Fix buffer overflow for OUT packet (2025-01-28 18:40:19 +0000)
 ----------------------------------------------------------------
 target-arm queue:
- * mps3-an547: Add missing user ahb interfaces
+ * hw/arm: Remove various uses of first_cpu global
- * hw/arm/mps2-tz.c: Update AN547 documentation URL
+ * hw/char/imx_serial: Fix reset value of UFCR register
- * hw/input/tsc210x: Don't abort on bad SPI word widths
+ * hw/char/imx_serial: Update all state before restarting ageing timer
- * hw/i2c: flatten pca954x mux device
+ * hw/pci-host/designware: Expose MSI IRQ
- * target/arm: Support PSCI 1.1 and SMCCC 1.0
+ * hw/arm/stellaris: refactoring, cleanup
- * target/arm: Fix early free of TCG temp in handle_simd_shift_fpint_conv()
+ * hw/arm/stellaris: map both I2C controllers
- * tests/qtest: add qtests for npcm7xx sdhci
+ * tests/functional: Add a test for the arm microbit machine
- * Implement FEAT_LVA
+ * target/arm: arm_reset_sve_state() should set FPSR, not FPCR
- * Implement FEAT_LPA
+ * target/arm: refactorings preparatory to FEAT_AFP implementation
- * Implement FEAT_LPA2 (but do not enable it yet)
+ * fpu: Rename float_flag_input_denormal to float_flag_input_denormal_flushed
- * Report KVM's actual PSCI version to guest in dtb
+ * fpu: Rename float_flag_output_denormal to float_flag_output_denormal_flushed
- * ui/cocoa.m: Fix updateUIInfo threading issues
+ * hw/usb/canokey: Fix buffer overflow for OUT packet
  * ui/cocoa.m: Remove unnecessary NSAutoreleasePools
 ----------------------------------------------------------------
-Akihiko Odaki (1):
+Bernhard Beschow (3):
-      target/arm: Support PSCI 1.1 and SMCCC 1.0
+      hw/char/imx_serial: Fix reset value of UFCR register
       hw/char/imx_serial: Update all state before restarting ageing timer
       hw/pci-host/designware: Expose MSI IRQ
-Jimmy Brisson (1):
+Hongren Zheng (1):
-      mps3-an547: Add missing user ahb interfaces
+      hw/usb/canokey: Fix buffer overflow for OUT packet
-Patrick Venture (1):
+Peter Maydell (22):
-      hw/i2c: flatten pca954x mux device
+      target/arm: arm_reset_sve_state() should set FPSR, not FPCR
       target/arm: Use FPSR_ constants in vfp_exceptbits_from_host()
       target/arm: Use uint32_t in vfp_exceptbits_from_host()
       target/arm: Define new fp_status_a32 and fp_status_a64
       target/arm: Use vfp.fp_status_a64 in A64-only helper functions
       target/arm: Use fp_status_a64 or fp_status_a32 in is_ebf()
       target/arm: Use fp_status_a32 in vjvct helper
       target/arm: Use fp_status_a32 in vfp_cmp helpers
       target/arm: Use FPST_A32 in A32 decoder
       target/arm: Use FPST_A64 in A64 decoder
       target/arm: Remove now-unused vfp.fp_status and FPST_FPCR
       target/arm: Define new fp_status_f16_a32 and fp_status_f16_a64
       target/arm: Use fp_status_f16_a32 in AArch32-only helpers
       target/arm: Use fp_status_f16_a64 in AArch64-only helpers
       target/arm: Use FPST_A32_F16 in A32 decoder
       target/arm: Use FPST_A64_F16 in A64 decoder
       target/arm: Remove now-unused vfp.fp_status_f16 and FPST_FPCR_F16
       fpu: Rename float_flag_input_denormal to float_flag_input_denormal_flushed
       fpu: Rename float_flag_output_denormal to float_flag_output_denormal_flushed
       fpu: Fix a comment in softfloat-types.h
       target/arm: Remove redundant advsimd float16 helpers
       target/arm: Use FPST_A64_F16 for halfprec-to-other conversions
-Peter Maydell (5):
+Philippe Mathieu-Daudé (9):
-      hw/arm/mps2-tz.c: Update AN547 documentation URL
+      hw/arm/nrf51: Rename ARMv7MState 'cpu' -> 'armv7m'
-      hw/input/tsc210x: Don't abort on bad SPI word widths
+      hw/arm/stellaris: Add 'armv7m' local variable
-      target/arm: Report KVM's actual PSCI version to guest in dtb
+      hw/arm/v7m: Remove use of &first_cpu in machine_init()
-      ui/cocoa.m: Fix updateUIInfo threading issues
+      hw/arm/stellaris: Link each board schematic
-      ui/cocoa.m: Remove unnecessary NSAutoreleasePools
+      hw/arm/stellaris: Constify read-only arrays
       hw/arm/stellaris: Remove incorrect unimplemented i2c-0 at 0x40002000
       hw/arm/stellaris: Replace magic numbers by definitions
       hw/arm/stellaris: Use DEVCAP macro to access DeviceCapability registers
       hw/arm/stellaris: Map both I2C controllers
-Richard Henderson (16):
+Thomas Huth (1):
-      hw/registerfields: Add FIELD_SEX<N> and FIELD_SDP<N>
+      tests/functional: Add a test for the arm microbit machine
       target/arm: Set TCR_EL1.TSZ for user-only
       target/arm: Fault on invalid TCR_ELx.TxSZ
       target/arm: Move arm_pamax out of line
       target/arm: Pass outputsize down to check_s2_mmu_setup
       target/arm: Use MAKE_64BIT_MASK to compute indexmask
       target/arm: Honor TCR_ELx.{I}PS
       target/arm: Prepare DBGBVR and DBGWVR for FEAT_LVA
       target/arm: Implement FEAT_LVA
       target/arm: Implement FEAT_LPA
       target/arm: Extend arm_fi_to_lfsc to level -1
       target/arm: Introduce tlbi_aa64_get_range
       target/arm: Fix TLBIRange.base for 16k and 64k pages
       target/arm: Validate tlbi TG matches translation granule in use
       target/arm: Advertise all page sizes for -cpu max
       target/arm: Implement FEAT_LPA2
-Shengtan Mao (1):
+ MAINTAINERS                           |   1 +
-      tests/qtest: add qtests for npcm7xx sdhci
+ hw/usb/canokey.h                      |   4 --
  include/fpu/softfloat-types.h         |  10 +--
  include/hw/arm/fsl-imx6.h             |   4 +-
  include/hw/arm/fsl-imx7.h             |   4 +-
  include/hw/arm/nrf51_soc.h            |   2 +-
  include/hw/char/imx_serial.h          |   2 +-
  include/hw/pci-host/designware.h      |   1 +
  target/arm/cpu.h                      |  12 ++--
  target/arm/tcg/helper-a64.h           |   8 ---
  target/arm/tcg/translate.h            |  32 ++++++---
  fpu/softfloat.c                       |   6 +-
  hw/arm/b-l475e-iot01a.c               |   2 +-
  hw/arm/fsl-imx6.c                     |  13 +++-
  hw/arm/fsl-imx7.c                     |  13 +++-
  hw/arm/microbit.c                     |   2 +-
  hw/arm/mps2-tz.c                      |   2 +-
  hw/arm/mps2.c                         |   2 +-
  hw/arm/msf2-som.c                     |   2 +-
  hw/arm/musca.c                        |   2 +-
  hw/arm/netduino2.c                    |   2 +-
  hw/arm/netduinoplus2.c                |   2 +-
  hw/arm/nrf51_soc.c                    |  18 ++---
  hw/arm/olimex-stm32-h405.c            |   2 +-
  hw/arm/stellaris.c                    | 118 +++++++++++++++++++-----------
  hw/arm/stm32vldiscovery.c             |   2 +-
  hw/char/imx_serial.c                  |   7 +-
  hw/pci-host/designware.c              |   7 +-
  hw/usb/canokey.c                      |   6 +-
  target/arm/cpu.c                      |   6 +-
  target/arm/helper.c                   |   2 +-
  target/arm/tcg/helper-a64.c           |   9 ---
  target/arm/tcg/sme_helper.c           |   6 +-
  target/arm/tcg/sve_helper.c           |   6 +-
  target/arm/tcg/translate-a64.c        | 103 ++++++++++++++-------------
  target/arm/tcg/translate-sme.c        |   4 +-
  target/arm/tcg/translate-sve.c        | 130 +++++++++++++++++-----------------
  target/arm/tcg/translate-vfp.c        |  78 ++++++++++----------
  target/arm/tcg/vec_helper.c           |  22 +++---
  target/arm/vfp_helper.c               |  73 +++++++++++--------
  target/i386/tcg/fpu_helper.c          |   8 +--
  target/m68k/fpu_helper.c              |   2 +-
  target/mips/tcg/msa_helper.c          |   4 +-
  target/rx/op_helper.c                 |   4 +-
  target/tricore/fpu_helper.c           |   6 +-
  fpu/softfloat-parts.c.inc             |   4 +-
  hw/arm/Kconfig                        |   2 +
  tests/functional/meson.build          |   1 +
  tests/functional/test_arm_microbit.py |  31 ++++++++
 files changed, 452 insertions(+), 337 deletions(-)
  create mode 100755 tests/functional/test_arm_microbit.py
-Wentao_Liang (1):
-      target/arm: Fix early free of TCG temp in handle_simd_shift_fpint_conv()
- docs/system/arm/emulation.rst    |   3 +
- include/hw/registerfields.h      |  48 +++++-
- target/arm/cpu-param.h           |   4 +-
- target/arm/cpu.h                 |  27 ++++
- target/arm/internals.h           |  58 ++++---
- target/arm/kvm-consts.h          |  14 +-
- hw/arm/boot.c                    |  11 +-
- hw/arm/mps2-tz.c                 |   6 +-
- hw/i2c/i2c_mux_pca954x.c         |  77 ++-------
- hw/input/tsc210x.c               |   8 +-
- target/arm/cpu.c                 |   8 +-
- target/arm/cpu64.c               |   7 +-
- target/arm/helper.c              | 332 ++++++++++++++++++++++++++++++---------
- target/arm/hvf/hvf.c             |  27 +++-
- target/arm/kvm64.c               |  14 +-
- target/arm/psci.c                |  35 ++++-
- target/arm/translate-a64.c       |   2 +-
- tests/qtest/npcm7xx_sdhci-test.c | 215 +++++++++++++++++++++++++
- tests/qtest/meson.build          |   1 +
- ui/cocoa.m                       |  31 ++--
-files changed, 736 insertions(+), 192 deletions(-)
- create mode 100644 tests/qtest/npcm7xx_sdhci-test.c

-[PULL 13/26] target/arm: Use MAKE_64BIT_MASK to compute indexmask
+[PULL 01/36] hw/arm/nrf51: Rename ARMv7MState 'cpu' -> 'armv7m'
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-The macro is a bit more readable than the inlined computation.
+The ARMv7MState object is not simply a CPU, it also
 contains the NVIC, SysTick timer, and various MemoryRegions.
-Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
+Rename the field as 'armv7m', like other Cortex-M boards.
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-7-richard.henderson@linaro.org
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
 Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
 Message-id: 20250112225614.33723-2-philmd@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/helper.c | 4 ++--
+ include/hw/arm/nrf51_soc.h |  2 +-
-file changed, 2 insertions(+), 2 deletions(-)
+ hw/arm/nrf51_soc.c         | 18 +++++++++---------
 files changed, 10 insertions(+), 10 deletions(-)
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+diff --git a/include/hw/arm/nrf51_soc.h b/include/hw/arm/nrf51_soc.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/include/hw/arm/nrf51_soc.h
-+++ b/target/arm/helper.c
++++ b/include/hw/arm/nrf51_soc.h
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
+@@ -XXX,XX +XXX,XX @@ struct NRF51State {
-         level = startlevel;
+     SysBusDevice parent_obj;
      /*< public >*/
 -    ARMv7MState cpu;
 +    ARMv7MState armv7m;
      NRF51UARTState uart;
      NRF51RNGState rng;
 diff --git a/hw/arm/nrf51_soc.c b/hw/arm/nrf51_soc.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/nrf51_soc.c
 +++ b/hw/arm/nrf51_soc.c
@@ -XXX,XX +XXX,XX @@ static void nrf51_soc_realize(DeviceState *dev_soc, Error **errp)
      }
+     /* This clock doesn't need migration because it is fixed-frequency */
--    indexmask_grainsize = (1ULL << (stride + 3)) - 1;
+     clock_set_hz(s->sysclk, HCLK_FRQ);
--    indexmask = (1ULL << (inputsize - (stride * (4 - level)))) - 1;
+-    qdev_connect_clock_in(DEVICE(&s->cpu), "cpuclk", s->sysclk);
-+    indexmask_grainsize = MAKE_64BIT_MASK(0, stride + 3);
++    qdev_connect_clock_in(DEVICE(&s->armv7m), "cpuclk", s->sysclk);
-+    indexmask = MAKE_64BIT_MASK(0, inputsize - (stride * (4 - level)));
+     /*
+      * This SoC has no systick device, so don't connect refclk.
-     /* Now we can extract the actual base address from the TTBR */
+      * TODO: model the lack of systick (currently the armv7m object
-     descaddr = extract64(ttbr, 0, 48);
+      * will always provide one).
       */
 -    object_property_set_link(OBJECT(&s->cpu), "memory", OBJECT(&s->container),
 +    object_property_set_link(OBJECT(&s->armv7m), "memory", OBJECT(&s->container),
                               &error_abort);
 -    if (!sysbus_realize(SYS_BUS_DEVICE(&s->cpu), errp)) {
 +    if (!sysbus_realize(SYS_BUS_DEVICE(&s->armv7m), errp)) {
          return;
      }
@@ -XXX,XX +XXX,XX @@ static void nrf51_soc_realize(DeviceState *dev_soc, Error **errp)
      mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->uart), 0);
      memory_region_add_subregion_overlap(&s->container, NRF51_UART_BASE, mr, 0);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->uart), 0,
 -                       qdev_get_gpio_in(DEVICE(&s->cpu),
 +                       qdev_get_gpio_in(DEVICE(&s->armv7m),
                         BASE_TO_IRQ(NRF51_UART_BASE)));
      /* RNG */
@@ -XXX,XX +XXX,XX @@ static void nrf51_soc_realize(DeviceState *dev_soc, Error **errp)
      mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->rng), 0);
      memory_region_add_subregion_overlap(&s->container, NRF51_RNG_BASE, mr, 0);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->rng), 0,
 -                       qdev_get_gpio_in(DEVICE(&s->cpu),
 +                       qdev_get_gpio_in(DEVICE(&s->armv7m),
                         BASE_TO_IRQ(NRF51_RNG_BASE)));
      /* UICR, FICR, NVMC, FLASH */
@@ -XXX,XX +XXX,XX @@ static void nrf51_soc_realize(DeviceState *dev_soc, Error **errp)
          sysbus_mmio_map(SYS_BUS_DEVICE(&s->timer[i]), 0, base_addr);
          sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer[i]), 0,
 -                           qdev_get_gpio_in(DEVICE(&s->cpu),
 +                           qdev_get_gpio_in(DEVICE(&s->armv7m),
                                              BASE_TO_IRQ(base_addr)));
      }
@@ -XXX,XX +XXX,XX @@ static void nrf51_soc_init(Object *obj)
      memory_region_init(&s->container, obj, "nrf51-container", UINT64_MAX);
 -    object_initialize_child(OBJECT(s), "armv6m", &s->cpu, TYPE_ARMV7M);
 -    qdev_prop_set_string(DEVICE(&s->cpu), "cpu-type",
 +    object_initialize_child(OBJECT(s), "armv6m", &s->armv7m, TYPE_ARMV7M);
 +    qdev_prop_set_string(DEVICE(&s->armv7m), "cpu-type",
                           ARM_CPU_TYPE_NAME("cortex-m0"));
 -    qdev_prop_set_uint32(DEVICE(&s->cpu), "num-irq", 32);
 +    qdev_prop_set_uint32(DEVICE(&s->armv7m), "num-irq", 32);
      object_initialize_child(obj, "uart", &s->uart, TYPE_NRF51_UART);
      object_property_add_alias(obj, "serial0", OBJECT(&s->uart), "chardev");
 --
-.25.1
+.34.1

-[PULL 08/26] hw/registerfields: Add FIELD_SEX<N> and FIELD_SDP<N>
+[PULL 02/36] hw/arm/stellaris: Add 'armv7m' local variable
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-Add new macros to manipulate signed fields within the register.
+While the TYPE_ARMV7M object forwards its NVIC interrupt lines,
 it is somewhat misleading to name it 'nvic'. Add the 'armv7m'
 local variable for clarity, but also keep the 'nvic' variable
 behaving like before when used for wiring IRQ lines.
-Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
+Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
-Message-id: 20220301215958.157011-2-richard.henderson@linaro.org
+Message-id: 20250112225614.33723-3-philmd@linaro.org
 Suggested-by: Peter Maydell <peter.maydell@linaro.org>
 Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- include/hw/registerfields.h | 48 ++++++++++++++++++++++++++++++++++++-
+ hw/arm/stellaris.c | 21 +++++++++++----------
-file changed, 47 insertions(+), 1 deletion(-)
+file changed, 11 insertions(+), 10 deletions(-)
-diff --git a/include/hw/registerfields.h b/include/hw/registerfields.h
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/include/hw/registerfields.h
+--- a/hw/arm/stellaris.c
-+++ b/include/hw/registerfields.h
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-     extract64((storage), R_ ## reg ## _ ## field ## _SHIFT,               \
+      */
-               R_ ## reg ## _ ## field ## _LENGTH)
+     Object *soc_container;
-+#define FIELD_SEX8(storage, reg, field)                                   \
+-    DeviceState *gpio_dev[7], *nvic;
-+    sextract8((storage), R_ ## reg ## _ ## field ## _SHIFT,               \
++    DeviceState *gpio_dev[7], *armv7m, *nvic;
-+              R_ ## reg ## _ ## field ## _LENGTH)
+     qemu_irq gpio_in[7][8];
-+#define FIELD_SEX16(storage, reg, field)                                  \
+     qemu_irq gpio_out[7][8];
-+    sextract16((storage), R_ ## reg ## _ ## field ## _SHIFT,              \
+     qemu_irq adc;
-+               R_ ## reg ## _ ## field ## _LENGTH)
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-+#define FIELD_SEX32(storage, reg, field)                                  \
+     qdev_prop_set_uint32(ssys_dev, "dc4", board->dc4);
-+    sextract32((storage), R_ ## reg ## _ ## field ## _SHIFT,              \
+     sysbus_realize_and_unref(SYS_BUS_DEVICE(ssys_dev), &error_fatal);
-+               R_ ## reg ## _ ## field ## _LENGTH)
-+#define FIELD_SEX64(storage, reg, field)                                  \
+-    nvic = qdev_new(TYPE_ARMV7M);
-+    sextract64((storage), R_ ## reg ## _ ## field ## _SHIFT,              \
+-    object_property_add_child(soc_container, "v7m", OBJECT(nvic));
-+               R_ ## reg ## _ ## field ## _LENGTH)
+-    qdev_prop_set_uint32(nvic, "num-irq", NUM_IRQ_LINES);
-+
+-    qdev_prop_set_uint8(nvic, "num-prio-bits", NUM_PRIO_BITS);
- /* Extract a field from an array of registers */
+-    qdev_prop_set_string(nvic, "cpu-type", ms->cpu_type);
- #define ARRAY_FIELD_EX32(regs, reg, field)                                \
+-    qdev_prop_set_bit(nvic, "enable-bitband", true);
-     FIELD_EX32((regs)[R_ ## reg], reg, field)
+-    qdev_connect_clock_in(nvic, "cpuclk",
-@@ -XXX,XX +XXX,XX @@
++    armv7m = qdev_new(TYPE_ARMV7M);
-     _d; })
++    object_property_add_child(soc_container, "v7m", OBJECT(armv7m));
- #define FIELD_DP64(storage, reg, field, val) ({                           \
++    qdev_prop_set_uint32(armv7m, "num-irq", NUM_IRQ_LINES);
-     struct {                                                              \
++    qdev_prop_set_uint8(armv7m, "num-prio-bits", NUM_PRIO_BITS);
--        uint64_t v:R_ ## reg ## _ ## field ## _LENGTH;                \
++    qdev_prop_set_string(armv7m, "cpu-type", ms->cpu_type);
-+        uint64_t v:R_ ## reg ## _ ## field ## _LENGTH;                    \
++    qdev_prop_set_bit(armv7m, "enable-bitband", true);
-+    } _v = { .v = val };                                                  \
++    qdev_connect_clock_in(armv7m, "cpuclk",
-+    uint64_t _d;                                                          \
+                           qdev_get_clock_out(ssys_dev, "SYSCLK"));
-+    _d = deposit64((storage), R_ ## reg ## _ ## field ## _SHIFT,          \
+     /* This SoC does not connect the systick reference clock */
-+                  R_ ## reg ## _ ## field ## _LENGTH, _v.v);              \
+-    object_property_set_link(OBJECT(nvic), "memory",
-+    _d; })
++    object_property_set_link(OBJECT(armv7m), "memory",
-+
+                              OBJECT(get_system_memory()), &error_abort);
-+#define FIELD_SDP8(storage, reg, field, val) ({                           \
+     /* This will exit with an error if the user passed us a bad cpu_type */
-+    struct {                                                              \
+-    sysbus_realize_and_unref(SYS_BUS_DEVICE(nvic), &error_fatal);
-+        signed int v:R_ ## reg ## _ ## field ## _LENGTH;                  \
++    sysbus_realize_and_unref(SYS_BUS_DEVICE(armv7m), &error_fatal);
-+    } _v = { .v = val };                                                  \
++    nvic = armv7m;
-+    uint8_t _d;                                                           \
-+    _d = deposit32((storage), R_ ## reg ## _ ## field ## _SHIFT,          \
+     /* Now we can wire up the IRQ and MMIO of the system registers */
-+                  R_ ## reg ## _ ## field ## _LENGTH, _v.v);              \
+     sysbus_mmio_map(SYS_BUS_DEVICE(ssys_dev), 0, 0x400fe000);
 +    _d; })
 +#define FIELD_SDP16(storage, reg, field, val) ({                          \
 +    struct {                                                              \
 +        signed int v:R_ ## reg ## _ ## field ## _LENGTH;                  \
 +    } _v = { .v = val };                                                  \
 +    uint16_t _d;                                                          \
 +    _d = deposit32((storage), R_ ## reg ## _ ## field ## _SHIFT,          \
 +                  R_ ## reg ## _ ## field ## _LENGTH, _v.v);              \
 +    _d; })
 +#define FIELD_SDP32(storage, reg, field, val) ({                          \
 +    struct {                                                              \
 +        signed int v:R_ ## reg ## _ ## field ## _LENGTH;                  \
 +    } _v = { .v = val };                                                  \
 +    uint32_t _d;                                                          \
 +    _d = deposit32((storage), R_ ## reg ## _ ## field ## _SHIFT,          \
 +                  R_ ## reg ## _ ## field ## _LENGTH, _v.v);              \
 +    _d; })
 +#define FIELD_SDP64(storage, reg, field, val) ({                          \
 +    struct {                                                              \
 +        int64_t v:R_ ## reg ## _ ## field ## _LENGTH;                     \
      } _v = { .v = val };                                                  \
      uint64_t _d;                                                          \
      _d = deposit64((storage), R_ ## reg ## _ ## field ## _SHIFT,          \
 --
-.25.1
+.34.1

-[PULL 01/26] mps3-an547: Add missing user ahb interfaces
+[PULL 03/36] hw/arm/v7m: Remove use of &first_cpu in machine_init()
-From: Jimmy Brisson <jimmy.brisson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-With these interfaces missing, TFM would delegate peripherals 0, 1,
+When instantiating the machine model, the machine_init()
-, 3 and 8, and qemu would ignore the delegation of interface 8, as
+implementations usually create the CPUs, so have access
-it thought interface 4 was eth & USB.
+to its first CPU. Use that rather than the &first_cpu
 global.
-This patch corrects this behavior and allows TFM to delegate the
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
-eth & USB peripheral to NS mode.
+Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
+Reviewed-by: Samuel Tardieu <sam@rfc1149.net>
-(The old QEMU behaviour was based on revision B of the AN547
+Message-id: 20250112225614.33723-4-philmd@linaro.org
 appnote; revision C corrects this error in the documentation,
 and this commit brings QEMU in to line with how the FPGA
 image really behaves.)
 Signed-off-by: Jimmy Brisson <jimmy.brisson@linaro.org>
 Message-id: 20220210210227.3203883-1-jimmy.brisson@linaro.org
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
 [PMM: added commit message note clarifying that the old behaviour
 was a docs issue, not because there were two different versions
 of the FPGA image]
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- hw/arm/mps2-tz.c | 4 ++++
+ hw/arm/b-l475e-iot01a.c    | 2 +-
-file changed, 4 insertions(+)
+ hw/arm/microbit.c          | 2 +-
  hw/arm/mps2-tz.c           | 2 +-
  hw/arm/mps2.c              | 2 +-
  hw/arm/msf2-som.c          | 2 +-
  hw/arm/musca.c             | 2 +-
  hw/arm/netduino2.c         | 2 +-
  hw/arm/netduinoplus2.c     | 2 +-
  hw/arm/olimex-stm32-h405.c | 2 +-
  hw/arm/stellaris.c         | 2 +-
  hw/arm/stm32vldiscovery.c  | 2 +-
 files changed, 11 insertions(+), 11 deletions(-)
+diff --git a/hw/arm/b-l475e-iot01a.c b/hw/arm/b-l475e-iot01a.c
+index XXXXXXX..XXXXXXX 100644
+--- a/hw/arm/b-l475e-iot01a.c
++++ b/hw/arm/b-l475e-iot01a.c
+@@ -XXX,XX +XXX,XX @@ static void bl475e_init(MachineState *machine)
+     sysbus_realize(SYS_BUS_DEVICE(&s->soc), &error_fatal);
+     sc = STM32L4X5_SOC_GET_CLASS(&s->soc);
+-    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename, 0,
++    armv7m_load_kernel(s->soc.armv7m.cpu, machine->kernel_filename, 0,
+                        sc->flash_size);
+     if (object_class_by_name(TYPE_DM163)) {
+diff --git a/hw/arm/microbit.c b/hw/arm/microbit.c
+index XXXXXXX..XXXXXXX 100644
+--- a/hw/arm/microbit.c
++++ b/hw/arm/microbit.c
+@@ -XXX,XX +XXX,XX @@ static void microbit_init(MachineState *machine)
+     memory_region_add_subregion_overlap(&s->nrf51.container, NRF51_TWI_BASE,
+                                         mr, -1);
+-    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
++    armv7m_load_kernel(s->nrf51.armv7m.cpu, machine->kernel_filename,
+, s->nrf51.flash_size);
+ }
 diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/mps2-tz.c
 +++ b/hw/arm/mps2-tz.c
 @@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine)
-                 { "gpio1", make_unimp_dev, &mms->gpio[1], 0x41101000, 0x1000 },
+                                     mms->remap_irq);
-                 { "gpio2", make_unimp_dev, &mms->gpio[2], 0x41102000, 0x1000 },
+     }
-                 { "gpio3", make_unimp_dev, &mms->gpio[3], 0x41103000, 0x1000 },
-+                { /* port 4 USER AHB interface 0 */ },
+-    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
-+                { /* port 5 USER AHB interface 1 */ },
++    armv7m_load_kernel(mms->iotkit.armv7m[0].cpu, machine->kernel_filename,
-+                { /* port 6 USER AHB interface 2 */ },
+, boot_ram_size(mms));
-+                { /* port 7 USER AHB interface 3 */ },
+ }
-                 { "eth-usb", make_eth_usb, NULL, 0x41400000, 0x200000, { 49 } },
-             },
+diff --git a/hw/arm/mps2.c b/hw/arm/mps2.c
-         },
+index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/mps2.c
 +++ b/hw/arm/mps2.c
@@ -XXX,XX +XXX,XX @@ static void mps2_common_init(MachineState *machine)
                   qdev_get_gpio_in(armv7m,
                                    mmc->fpga_type == FPGA_AN511 ? 47 : 13));
 -    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
 +    armv7m_load_kernel(mms->armv7m.cpu, machine->kernel_filename,
 , 0x400000);
  }
 diff --git a/hw/arm/msf2-som.c b/hw/arm/msf2-som.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/msf2-som.c
 +++ b/hw/arm/msf2-som.c
@@ -XXX,XX +XXX,XX @@ static void emcraft_sf2_s2s010_init(MachineState *machine)
      cs_line = qdev_get_gpio_in_named(spi_flash, SSI_GPIO_CS, 0);
      sysbus_connect_irq(SYS_BUS_DEVICE(&soc->spi[0]), 1, cs_line);
 -    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
 +    armv7m_load_kernel(soc->armv7m.cpu, machine->kernel_filename,
 , soc->envm_size);
  }
 diff --git a/hw/arm/musca.c b/hw/arm/musca.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/musca.c
 +++ b/hw/arm/musca.c
@@ -XXX,XX +XXX,XX @@ static void musca_init(MachineState *machine)
                                                       "cfg_sec_resp", 0));
      }
 -    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
 +    armv7m_load_kernel(mms->sse.armv7m[0].cpu, machine->kernel_filename,
 , 0x2000000);
  }
 diff --git a/hw/arm/netduino2.c b/hw/arm/netduino2.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/netduino2.c
 +++ b/hw/arm/netduino2.c
@@ -XXX,XX +XXX,XX @@ static void netduino2_init(MachineState *machine)
      qdev_connect_clock_in(dev, "sysclk", sysclk);
      sysbus_realize_and_unref(SYS_BUS_DEVICE(dev), &error_fatal);
 -    armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename,
 +    armv7m_load_kernel(STM32F205_SOC(dev)->armv7m.cpu, machine->kernel_filename,
 , FLASH_SIZE);
  }
 diff --git a/hw/arm/netduinoplus2.c b/hw/arm/netduinoplus2.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/netduinoplus2.c
 +++ b/hw/arm/netduinoplus2.c
@@ -XXX,XX +XXX,XX @@ static void netduinoplus2_init(MachineState *machine)
      qdev_connect_clock_in(dev, "sysclk", sysclk);
      sysbus_realize_and_unref(SYS_BUS_DEVICE(dev), &error_fatal);
 -    armv7m_load_kernel(ARM_CPU(first_cpu),
 +    armv7m_load_kernel(STM32F405_SOC(dev)->armv7m.cpu,
                         machine->kernel_filename,
 , FLASH_SIZE);
  }
 diff --git a/hw/arm/olimex-stm32-h405.c b/hw/arm/olimex-stm32-h405.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/olimex-stm32-h405.c
 +++ b/hw/arm/olimex-stm32-h405.c
@@ -XXX,XX +XXX,XX @@ static void olimex_stm32_h405_init(MachineState *machine)
      qdev_connect_clock_in(dev, "sysclk", sysclk);
      sysbus_realize_and_unref(SYS_BUS_DEVICE(dev), &error_fatal);
 -    armv7m_load_kernel(ARM_CPU(first_cpu),
 +    armv7m_load_kernel(STM32F405_SOC(dev)->armv7m.cpu,
                         machine->kernel_filename,
 , FLASH_SIZE);
  }
 diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/stellaris.c
 +++ b/hw/arm/stellaris.c
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
      create_unimplemented_device("hibernation", 0x400fc000, 0x1000);
      create_unimplemented_device("flash-control", 0x400fd000, 0x1000);
 -    armv7m_load_kernel(ARM_CPU(first_cpu), ms->kernel_filename, 0, flash_size);
 +    armv7m_load_kernel(ARMV7M(armv7m)->cpu, ms->kernel_filename, 0, flash_size);
  }
  /* FIXME: Figure out how to generate these from stellaris_boards.  */
 diff --git a/hw/arm/stm32vldiscovery.c b/hw/arm/stm32vldiscovery.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/stm32vldiscovery.c
 +++ b/hw/arm/stm32vldiscovery.c
@@ -XXX,XX +XXX,XX @@ static void stm32vldiscovery_init(MachineState *machine)
      qdev_connect_clock_in(dev, "sysclk", sysclk);
      sysbus_realize_and_unref(SYS_BUS_DEVICE(dev), &error_fatal);
 -    armv7m_load_kernel(ARM_CPU(first_cpu),
 +    armv7m_load_kernel(STM32F100_SOC(dev)->armv7m.cpu,
                         machine->kernel_filename,
 , FLASH_SIZE);
  }
 --
-2.25.1
+2.34.1

-[PULL 22/26] target/arm: Advertise all page sizes for -cpu max
+[PULL 04/36] hw/char/imx_serial: Fix reset value of UFCR register
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Bernhard Beschow <shentey@gmail.com>
-We support 16k pages, but do not advertize that in ID_AA64MMFR0.
+The value of the UFCR register is respected when echoing characters to the
 terminal, but its reset value is reserved. Fix the reset value to the one
 documented in the datasheet.
-The value 0 in the TGRAN*_2 fields indicates that stage2 lookups defer
+While at it move the related attribute out of the section of unimplemented
-to the same support as stage1 lookups.  This setting is deprecated, so
+registers since its value is actually respected.
 indicate support for all stage2 page sizes directly.
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
+Signed-off-by: Bernhard Beschow <shentey@gmail.com>
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Message-id: 20220301215958.157011-16-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/cpu64.c | 4 ++++
+ include/hw/char/imx_serial.h | 2 +-
- 1 file changed, 4 insertions(+)
+ hw/char/imx_serial.c         | 1 +
  2 files changed, 2 insertions(+), 1 deletion(-)
-diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
+diff --git a/include/hw/char/imx_serial.h b/include/hw/char/imx_serial.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/cpu64.c
+--- a/include/hw/char/imx_serial.h
-+++ b/target/arm/cpu64.c
++++ b/include/hw/char/imx_serial.h
-@@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj)
+@@ -XXX,XX +XXX,XX @@ struct IMXSerialState {
+     uint32_t ucr1;
-     t = cpu->isar.id_aa64mmfr0;
+     uint32_t ucr2;
-     t = FIELD_DP64(t, ID_AA64MMFR0, PARANGE, 6); /* FEAT_LPA: 52 bits */
+     uint32_t uts1;
-+    t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN16, 1);   /* 16k pages supported */
++    uint32_t ufcr;
-+    t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN16_2, 2); /* 16k stage2 supported */
-+    t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN64_2, 2); /* 64k stage2 supported */
+     /*
-+    t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN4_2, 2);  /*  4k stage2 supported */
+      * The registers below are implemented just so that the
-     cpu->isar.id_aa64mmfr0 = t;
+      * guest OS sees what it has written
+      */
-     t = cpu->isar.id_aa64mmfr1;
+     uint32_t onems;
 -    uint32_t ufcr;
      uint32_t ubmr;
      uint32_t ubrc;
      uint32_t ucr3;
 diff --git a/hw/char/imx_serial.c b/hw/char/imx_serial.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/char/imx_serial.c
 +++ b/hw/char/imx_serial.c
@@ -XXX,XX +XXX,XX @@ static void imx_serial_reset(IMXSerialState *s)
      s->ucr3 = 0x700;
      s->ubmr = 0;
      s->ubrc = 4;
 +    s->ufcr = BIT(11) | BIT(0);
      fifo32_reset(&s->rx_fifo);
      timer_del(&s->ageing_timer);
 --
-2.25.1
+2.34.1

-[PULL 18/26] target/arm: Extend arm_fi_to_lfsc to level -1
+[PULL 05/36] hw/char/imx_serial: Update all state before restarting ageing timer
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Bernhard Beschow <shentey@gmail.com>
-With FEAT_LPA2, rather than introducing translation level 4,
+Fixes characters to be "echoed" after each keystroke rather than after every
-we introduce level -1, below the current level 0.  Extend
+other since imx_serial_rx_fifo_ageing_timer_restart() would see ~UTS1_RXEMPTY
-arm_fi_to_lfsc to handle these faults.
+only after every other keystroke.
-Assert that this new translation level does not leak into
+Signed-off-by: Bernhard Beschow <shentey@gmail.com>
 fault types for which it is not defined, which allows some
 masking of fi->level to be removed.
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-12-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/internals.h | 35 +++++++++++++++++++++++++++++------
+ hw/char/imx_serial.c | 6 +++---
- 1 file changed, 29 insertions(+), 6 deletions(-)
+ 1 file changed, 3 insertions(+), 3 deletions(-)
-diff --git a/target/arm/internals.h b/target/arm/internals.h
+diff --git a/hw/char/imx_serial.c b/hw/char/imx_serial.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/internals.h
+--- a/hw/char/imx_serial.c
-+++ b/target/arm/internals.h
++++ b/hw/char/imx_serial.c
-@@ -XXX,XX +XXX,XX @@ static inline uint32_t arm_fi_to_lfsc(ARMMMUFaultInfo *fi)
+@@ -XXX,XX +XXX,XX @@ static void imx_put_data(void *opaque, uint32_t value)
-     case ARMFault_None:
+     if (fifo32_num_used(&s->rx_fifo) >= rxtl) {
-         return 0;
+         s->usr1 |= USR1_RRDY;
-     case ARMFault_AddressSize:
+     }
--        fsc = fi->level & 3;
+-
-+        assert(fi->level >= -1 && fi->level <= 3);
+-    imx_serial_rx_fifo_ageing_timer_restart(s);
-+        if (fi->level < 0) {
+-
-+            fsc = 0b101001;
+     s->usr2 |= USR2_RDR;
-+        } else {
+     s->uts1 &= ~UTS1_RXEMPTY;
-+            fsc = fi->level;
+     if (value & URXD_BRK) {
-+        }
+         s->usr2 |= USR2_BRCD;
-         break;
+     }
-     case ARMFault_AccessFlag:
++
--        fsc = (fi->level & 3) | (0x2 << 2);
++    imx_serial_rx_fifo_ageing_timer_restart(s);
-+        assert(fi->level >= 0 && fi->level <= 3);
++
-+        fsc = 0b001000 | fi->level;
+     imx_update(s);
-         break;
+ }
-     case ARMFault_Permission:
 -        fsc = (fi->level & 3) | (0x3 << 2);
 +        assert(fi->level >= 0 && fi->level <= 3);
 +        fsc = 0b001100 | fi->level;
          break;
      case ARMFault_Translation:
 -        fsc = (fi->level & 3) | (0x1 << 2);
 +        assert(fi->level >= -1 && fi->level <= 3);
 +        if (fi->level < 0) {
 +            fsc = 0b101011;
 +        } else {
 +            fsc = 0b000100 | fi->level;
 +        }
          break;
      case ARMFault_SyncExternal:
          fsc = 0x10 | (fi->ea << 12);
          break;
      case ARMFault_SyncExternalOnWalk:
 -        fsc = (fi->level & 3) | (0x5 << 2) | (fi->ea << 12);
 +        assert(fi->level >= -1 && fi->level <= 3);
 +        if (fi->level < 0) {
 +            fsc = 0b010011;
 +        } else {
 +            fsc = 0b010100 | fi->level;
 +        }
 +        fsc |= fi->ea << 12;
          break;
      case ARMFault_SyncParity:
          fsc = 0x18;
          break;
      case ARMFault_SyncParityOnWalk:
 -        fsc = (fi->level & 3) | (0x7 << 2);
 +        assert(fi->level >= -1 && fi->level <= 3);
 +        if (fi->level < 0) {
 +            fsc = 0b011011;
 +        } else {
 +            fsc = 0b011100 | fi->level;
 +        }
          break;
      case ARMFault_AsyncParity:
          fsc = 0x19;
 --
-2.25.1
+2.34.1

-[PULL 19/26] target/arm: Introduce tlbi_aa64_get_range
+[PULL 06/36] hw/pci-host/designware: Expose MSI IRQ
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Bernhard Beschow <shentey@gmail.com>
-Merge tlbi_aa64_range_get_length and tlbi_aa64_range_get_base,
+Fixes INTD and MSI interrupts poking the same IRQ line without keeping track of
-returning a structure containing both results.  Pass in the
+each other's IRQ level. Furthermore, SoCs such as the i.MX 8M Plus don't share
-ARMMMUIdx, rather than the digested two_ranges boolean.
+the MSI IRQ with the INTx lines, so expose it as a dedicated pin.
-This is in preparation for FEAT_LPA2, where the interpretation
+Signed-off-by: Bernhard Beschow <shentey@gmail.com>
 of 'value' depends on the effective value of DS for the regime.
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-13-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/helper.c | 58 +++++++++++++++++++--------------------------
+ include/hw/arm/fsl-imx6.h        |  4 +++-
- 1 file changed, 24 insertions(+), 34 deletions(-)
+ include/hw/arm/fsl-imx7.h        |  4 +++-
  include/hw/pci-host/designware.h |  1 +
  hw/arm/fsl-imx6.c                | 13 ++++++++++++-
  hw/arm/fsl-imx7.c                | 13 ++++++++++++-
  hw/pci-host/designware.c         |  7 +++----
  hw/arm/Kconfig                   |  2 ++
  7 files changed, 36 insertions(+), 8 deletions(-)
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+diff --git a/include/hw/arm/fsl-imx6.h b/include/hw/arm/fsl-imx6.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/include/hw/arm/fsl-imx6.h
-+++ b/target/arm/helper.c
++++ b/include/hw/arm/fsl-imx6.h
-@@ -XXX,XX +XXX,XX @@ static void tlbi_aa64_vae3is_write(CPUARMState *env, const ARMCPRegInfo *ri,
+@@ -XXX,XX +XXX,XX @@
  #include "hw/usb/chipidea.h"
  #include "hw/usb/imx-usb-phy.h"
  #include "hw/pci-host/designware.h"
 +#include "hw/or-irq.h"
  #include "exec/memory.h"
  #include "cpu.h"
  #include "qom/object.h"
@@ -XXX,XX +XXX,XX @@ struct FslIMX6State {
      ChipideaState      usb[FSL_IMX6_NUM_USBS];
      IMXFECState        eth;
      DesignwarePCIEHost pcie;
 +    OrIRQState         pcie4_msi_irq;
      MemoryRegion       rom;
      MemoryRegion       caam;
      MemoryRegion       ocram;
@@ -XXX,XX +XXX,XX @@ struct FslIMX6State {
  #define FSL_IMX6_PCIE1_IRQ 120
  #define FSL_IMX6_PCIE2_IRQ 121
  #define FSL_IMX6_PCIE3_IRQ 122
 -#define FSL_IMX6_PCIE4_IRQ 123
 +#define FSL_IMX6_PCIE4_MSI_IRQ 123
  #define FSL_IMX6_DCIC1_IRQ 124
  #define FSL_IMX6_DCIC2_IRQ 125
  #define FSL_IMX6_MLB150_HIGH_IRQ 126
 diff --git a/include/hw/arm/fsl-imx7.h b/include/hw/arm/fsl-imx7.h
 index XXXXXXX..XXXXXXX 100644
 --- a/include/hw/arm/fsl-imx7.h
 +++ b/include/hw/arm/fsl-imx7.h
@@ -XXX,XX +XXX,XX @@
  #include "hw/net/imx_fec.h"
  #include "hw/pci-host/designware.h"
  #include "hw/usb/chipidea.h"
 +#include "hw/or-irq.h"
  #include "cpu.h"
  #include "qom/object.h"
  #include "qemu/units.h"
@@ -XXX,XX +XXX,XX @@ struct FslIMX7State {
      IMX7GPRState       gpr;
      ChipideaState      usb[FSL_IMX7_NUM_USBS];
      DesignwarePCIEHost pcie;
 +    OrIRQState         pcie4_msi_irq;
      MemoryRegion       rom;
      MemoryRegion       caam;
      MemoryRegion       ocram;
@@ -XXX,XX +XXX,XX @@ enum FslIMX7IRQs {
      FSL_IMX7_PCI_INTA_IRQ = 125,
      FSL_IMX7_PCI_INTB_IRQ = 124,
      FSL_IMX7_PCI_INTC_IRQ = 123,
 -    FSL_IMX7_PCI_INTD_IRQ = 122,
 +    FSL_IMX7_PCI_INTD_MSI_IRQ = 122,
      FSL_IMX7_UART7_IRQ    = 126,
 diff --git a/include/hw/pci-host/designware.h b/include/hw/pci-host/designware.h
 index XXXXXXX..XXXXXXX 100644
 --- a/include/hw/pci-host/designware.h
 +++ b/include/hw/pci-host/designware.h
@@ -XXX,XX +XXX,XX @@ struct DesignwarePCIEHost {
          MemoryRegion io;
          qemu_irq     irqs[4];
 +        qemu_irq     msi;
      } pci;
      MemoryRegion mmio;
 diff --git a/hw/arm/fsl-imx6.c b/hw/arm/fsl-imx6.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/arm/fsl-imx6.c
 +++ b/hw/arm/fsl-imx6.c
@@ -XXX,XX +XXX,XX @@ static void fsl_imx6_init(Object *obj)
      object_initialize_child(obj, "eth", &s->eth, TYPE_IMX_ENET);
      object_initialize_child(obj, "pcie", &s->pcie, TYPE_DESIGNWARE_PCIE_HOST);
 +    object_initialize_child(obj, "pcie4-msi-irq", &s->pcie4_msi_irq,
 +                            TYPE_OR_IRQ);
  }
- #ifdef TARGET_AARCH64
+ static void fsl_imx6_realize(DeviceState *dev, Error **errp)
--static uint64_t tlbi_aa64_range_get_length(CPUARMState *env,
+@@ -XXX,XX +XXX,XX @@ static void fsl_imx6_realize(DeviceState *dev, Error **errp)
--                                           uint64_t value)
+     sysbus_realize(SYS_BUS_DEVICE(&s->pcie), &error_abort);
--{
+     sysbus_mmio_map(SYS_BUS_DEVICE(&s->pcie), 0, FSL_IMX6_PCIe_REG_ADDR);
--    unsigned int page_shift;
--    unsigned int page_size_granule;
++    object_property_set_int(OBJECT(&s->pcie4_msi_irq), "num-lines", 2,
--    uint64_t num;
++                            &error_abort);
--    uint64_t scale;
++    qdev_realize(DEVICE(&s->pcie4_msi_irq), NULL, &error_abort);
--    uint64_t exponent;
++
-+typedef struct {
++    irq = qdev_get_gpio_in(DEVICE(&s->a9mpcore), FSL_IMX6_PCIE4_MSI_IRQ);
-+    uint64_t base;
++    qdev_connect_gpio_out(DEVICE(&s->pcie4_msi_irq), 0, irq);
-     uint64_t length;
++
-+} TLBIRange;
+     irq = qdev_get_gpio_in(DEVICE(&s->a9mpcore), FSL_IMX6_PCIE1_IRQ);
-+
+     sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 0, irq);
-+static TLBIRange tlbi_aa64_get_range(CPUARMState *env, ARMMMUIdx mmuidx,
+     irq = qdev_get_gpio_in(DEVICE(&s->a9mpcore), FSL_IMX6_PCIE2_IRQ);
-+                                     uint64_t value)
+     sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 1, irq);
-+{
+     irq = qdev_get_gpio_in(DEVICE(&s->a9mpcore), FSL_IMX6_PCIE3_IRQ);
-+    unsigned int page_size_granule, page_shift, num, scale, exponent;
+     sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 2, irq);
-+    TLBIRange ret = { };
+-    irq = qdev_get_gpio_in(DEVICE(&s->a9mpcore), FSL_IMX6_PCIE4_IRQ);
++    irq = qdev_get_gpio_in(DEVICE(&s->pcie4_msi_irq), 0);
--    num = extract64(value, 39, 5);
+     sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 3, irq);
--    scale = extract64(value, 44, 2);
++    irq = qdev_get_gpio_in(DEVICE(&s->pcie4_msi_irq), 1);
-     page_size_granule = extract64(value, 46, 2);
++    sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 4, irq);
-     if (page_size_granule == 0) {
+     /*
-         qemu_log_mask(LOG_GUEST_ERROR, "Invalid page size granule %d\n",
+      * PCIe PHY
-                       page_size_granule);
+diff --git a/hw/arm/fsl-imx7.c b/hw/arm/fsl-imx7.c
--        return 0;
+index XXXXXXX..XXXXXXX 100644
-+        return ret;
+--- a/hw/arm/fsl-imx7.c
-     }
++++ b/hw/arm/fsl-imx7.c
+@@ -XXX,XX +XXX,XX @@ static void fsl_imx7_init(Object *obj)
-     page_shift = (page_size_granule - 1) * 2 + 12;
+      * PCIE
       */
      object_initialize_child(obj, "pcie", &s->pcie, TYPE_DESIGNWARE_PCIE_HOST);
 +    object_initialize_child(obj, "pcie4-msi-irq", &s->pcie4_msi_irq,
 +                            TYPE_OR_IRQ);
      /*
       * USBs
@@ -XXX,XX +XXX,XX @@ static void fsl_imx7_realize(DeviceState *dev, Error **errp)
      sysbus_realize(SYS_BUS_DEVICE(&s->pcie), &error_abort);
      sysbus_mmio_map(SYS_BUS_DEVICE(&s->pcie), 0, FSL_IMX7_PCIE_REG_ADDR);
 +    object_property_set_int(OBJECT(&s->pcie4_msi_irq), "num-lines", 2,
 +                            &error_abort);
 +    qdev_realize(DEVICE(&s->pcie4_msi_irq), NULL, &error_abort);
 +
 +    irq = qdev_get_gpio_in(DEVICE(&s->a7mpcore), FSL_IMX7_PCI_INTD_MSI_IRQ);
 +    qdev_connect_gpio_out(DEVICE(&s->pcie4_msi_irq), 0, irq);
 +
      irq = qdev_get_gpio_in(DEVICE(&s->a7mpcore), FSL_IMX7_PCI_INTA_IRQ);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 0, irq);
      irq = qdev_get_gpio_in(DEVICE(&s->a7mpcore), FSL_IMX7_PCI_INTB_IRQ);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 1, irq);
      irq = qdev_get_gpio_in(DEVICE(&s->a7mpcore), FSL_IMX7_PCI_INTC_IRQ);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 2, irq);
 -    irq = qdev_get_gpio_in(DEVICE(&s->a7mpcore), FSL_IMX7_PCI_INTD_IRQ);
 +    irq = qdev_get_gpio_in(DEVICE(&s->pcie4_msi_irq), 0);
      sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 3, irq);
 +    irq = qdev_get_gpio_in(DEVICE(&s->pcie4_msi_irq), 1);
 +    sysbus_connect_irq(SYS_BUS_DEVICE(&s->pcie), 4, irq);
      /*
       * USBs
 diff --git a/hw/pci-host/designware.c b/hw/pci-host/designware.c
 index XXXXXXX..XXXXXXX 100644
 --- a/hw/pci-host/designware.c
 +++ b/hw/pci-host/designware.c
@@ -XXX,XX +XXX,XX @@
  #define DESIGNWARE_PCIE_ATU_DEVFN(x)               (((x) >> 16) & 0xff)
  #define DESIGNWARE_PCIE_ATU_UPPER_TARGET           0x91C
 -#define DESIGNWARE_PCIE_IRQ_MSI                    3
 -
-+    num = extract64(value, 39, 5);
+ static DesignwarePCIEHost *
-+    scale = extract64(value, 44, 2);
+ designware_pcie_root_to_host(DesignwarePCIERoot *root)
      exponent = (5 * scale) + 1;
 -    length = (num + 1) << (exponent + page_shift);
 -    return length;
 -}
 +    ret.length = (num + 1) << (exponent + page_shift);
 -static uint64_t tlbi_aa64_range_get_base(CPUARMState *env, uint64_t value,
 -                                        bool two_ranges)
 -{
 -    /* TODO: ARMv8.7 FEAT_LPA2 */
 -    uint64_t pageaddr;
 -
 -    if (two_ranges) {
 -        pageaddr = sextract64(value, 0, 37) << TARGET_PAGE_BITS;
 +    if (regime_has_2_ranges(mmuidx)) {
 +        ret.base = sextract64(value, 0, 37) << TARGET_PAGE_BITS;
      } else {
 -        pageaddr = extract64(value, 0, 37) << TARGET_PAGE_BITS;
 +        ret.base = extract64(value, 0, 37) << TARGET_PAGE_BITS;
      }
 -    return pageaddr;
 +    return ret;
  }
  static void do_rvae_write(CPUARMState *env, uint64_t value,
                            int idxmap, bool synced)
  {
-     ARMMMUIdx one_idx = ARM_MMU_IDX_A | ctz32(idxmap);
+@@ -XXX,XX +XXX,XX @@ static void designware_pcie_root_msi_write(void *opaque, hwaddr addr,
--    bool two_ranges = regime_has_2_ranges(one_idx);
+     root->msi.intr[0].status |= BIT(val) & root->msi.intr[0].enable;
--    uint64_t baseaddr, length;
-+    TLBIRange range;
+     if (root->msi.intr[0].status & ~root->msi.intr[0].mask) {
-     int bits;
+-        qemu_set_irq(host->pci.irqs[DESIGNWARE_PCIE_IRQ_MSI], 1);
++        qemu_set_irq(host->pci.msi, 1);
 -    baseaddr = tlbi_aa64_range_get_base(env, value, two_ranges);
 -    length = tlbi_aa64_range_get_length(env, value);
 -    bits = tlbbits_for_regime(env, one_idx, baseaddr);
 +    range = tlbi_aa64_get_range(env, one_idx, value);
 +    bits = tlbbits_for_regime(env, one_idx, range.base);
      if (synced) {
          tlb_flush_range_by_mmuidx_all_cpus_synced(env_cpu(env),
 -                                                  baseaddr,
 -                                                  length,
 +                                                  range.base,
 +                                                  range.length,
                                                    idxmap,
                                                    bits);
      } else {
 -        tlb_flush_range_by_mmuidx(env_cpu(env), baseaddr,
 -                                  length, idxmap, bits);
 +        tlb_flush_range_by_mmuidx(env_cpu(env), range.base,
 +                                  range.length, idxmap, bits);
      }
  }
+@@ -XXX,XX +XXX,XX @@ static void designware_pcie_root_config_write(PCIDevice *d, uint32_t address,
+     case DESIGNWARE_PCIE_MSI_INTR0_STATUS:
+         root->msi.intr[0].status ^= val;
+         if (!root->msi.intr[0].status) {
+-            qemu_set_irq(host->pci.irqs[DESIGNWARE_PCIE_IRQ_MSI], 0);
++            qemu_set_irq(host->pci.msi, 0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static void designware_pcie_host_realize(DeviceState *dev, Error **errp)
+     for (i = 0; i < ARRAY_SIZE(s->pci.irqs); i++) {
+         sysbus_init_irq(sbd, &s->pci.irqs[i]);
+     }
++    sysbus_init_irq(sbd, &s->pci.msi);
+     memory_region_init_io(&s->mmio,
+                           OBJECT(s),
+diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig
+index XXXXXXX..XXXXXXX 100644
+--- a/hw/arm/Kconfig
++++ b/hw/arm/Kconfig
+@@ -XXX,XX +XXX,XX @@ config FSL_IMX6
+     select PL310  # cache controller
+     select PCI_EXPRESS_DESIGNWARE
+     select SDHCI
++    select OR_IRQ
+ config ASPEED_SOC
+     bool
+@@ -XXX,XX +XXX,XX @@ config FSL_IMX7
+     select WDT_IMX2
+     select PCI_EXPRESS_DESIGNWARE
+     select SDHCI
++    select OR_IRQ
+     select UNIMP
+ config ARM_SMMUV3
 --
-2.25.1
+2.34.1

-[PULL 17/26] target/arm: Implement FEAT_LPA
+[PULL 07/36] hw/arm/stellaris: Link each board schematic
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-This feature widens physical addresses (and intermediate physical
+Board schematic is useful to corroborate GPIOs/IRQs wiring.
 addresses for 2-stage translation) from 48 to 52 bits, when using
 64k pages.  The only thing left at this point is to handle the
 extra bits in the TTBR and in the table descriptors.
-Note that PAR_EL1 and HPFAR_EL2 are nominally extended, but we don't
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
 mask out the high bits when writing to those registers, so no changes
 are required there.
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250110160204.74997-2-philmd@linaro.org
-Message-id: 20220301215958.157011-11-richard.henderson@linaro.org
+[PMM: Use https:// URLs]
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- docs/system/arm/emulation.rst |  1 +
+ hw/arm/stellaris.c | 8 ++++++++
- target/arm/cpu-param.h        |  2 +-
+ 1 file changed, 8 insertions(+)
  target/arm/cpu64.c            |  2 +-
  target/arm/helper.c           | 19 ++++++++++++++++---
  4 files changed, 19 insertions(+), 5 deletions(-)
-diff --git a/docs/system/arm/emulation.rst b/docs/system/arm/emulation.rst
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/docs/system/arm/emulation.rst
+--- a/hw/arm/stellaris.c
-+++ b/docs/system/arm/emulation.rst
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@ the following architecture extensions:
+@@ -XXX,XX +XXX,XX @@ static void lm3s6965evb_init(MachineState *machine)
- - FEAT_I8MM (AArch64 Int8 matrix multiplication instructions)
+     stellaris_init(machine, &stellaris_boards[1]);
- - FEAT_JSCVT (JavaScript conversion instructions)
+ }
- - FEAT_LOR (Limited ordering regions)
-+- FEAT_LPA (Large Physical Address space)
++/*
- - FEAT_LRCPC (Load-acquire RCpc instructions)
++ * Stellaris LM3S811 Evaluation Board Schematics:
- - FEAT_LRCPC2 (Load-acquire RCpc instructions v2)
++ * https://www.ti.com/lit/ug/symlink/spmu030.pdf
- - FEAT_LSE (Large System Extensions)
++ */
-diff --git a/target/arm/cpu-param.h b/target/arm/cpu-param.h
+ static void lm3s811evb_class_init(ObjectClass *oc, void *data)
-index XXXXXXX..XXXXXXX 100644
+ {
---- a/target/arm/cpu-param.h
+     MachineClass *mc = MACHINE_CLASS(oc);
-+++ b/target/arm/cpu-param.h
+@@ -XXX,XX +XXX,XX @@ static const TypeInfo lm3s811evb_type = {
-@@ -XXX,XX +XXX,XX @@
+     .class_init = lm3s811evb_class_init,
  #ifdef TARGET_AARCH64
  # define TARGET_LONG_BITS             64
 -# define TARGET_PHYS_ADDR_SPACE_BITS  48
 +# define TARGET_PHYS_ADDR_SPACE_BITS  52
  # define TARGET_VIRT_ADDR_SPACE_BITS  52
  #else
  # define TARGET_LONG_BITS             32
 diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu64.c
 +++ b/target/arm/cpu64.c
@@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj)
      cpu->isar.id_aa64pfr1 = t;
      t = cpu->isar.id_aa64mmfr0;
 -    t = FIELD_DP64(t, ID_AA64MMFR0, PARANGE, 5); /* PARange: 48 bits */
 +    t = FIELD_DP64(t, ID_AA64MMFR0, PARANGE, 6); /* FEAT_LPA: 52 bits */
      cpu->isar.id_aa64mmfr0 = t;
      t = cpu->isar.id_aa64mmfr1;
 diff --git a/target/arm/helper.c b/target/arm/helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/helper.c
 +++ b/target/arm/helper.c
@@ -XXX,XX +XXX,XX @@ static const uint8_t pamax_map[] = {
      [3] = 42,
      [4] = 44,
      [5] = 48,
 +    [6] = 52,
  };
- /* The cpu-specific constant value of PAMax; also used by hw/arm/virt. */
++/*
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
++ * Stellaris: LM3S6965 Evaluation Board Schematics:
-     descaddr = extract64(ttbr, 0, 48);
++ * https://www.ti.com/lit/ug/symlink/spmu029.pdf
++ */
-     /*
+ static void lm3s6965evb_class_init(ObjectClass *oc, void *data)
--     * If the base address is out of range, raise AddressSizeFault.
+ {
-+     * For FEAT_LPA and PS=6, bits [51:48] of descaddr are in [5:2] of TTBR.
+     MachineClass *mc = MACHINE_CLASS(oc);
 +     *
 +     * Otherwise, if the base address is out of range, raise AddressSizeFault.
       * In the pseudocode, this is !IsZero(baseregister<47:outputsize>),
       * but we've just cleared the bits above 47, so simplify the test.
       */
 -    if (descaddr >> outputsize) {
 +    if (outputsize > 48) {
 +        descaddr |= extract64(ttbr, 2, 4) << 48;
 +    } else if (descaddr >> outputsize) {
          level = 0;
          fault_type = ARMFault_AddressSize;
          goto do_fault;
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
          }
          descaddr = descriptor & descaddrmask;
 -        if (descaddr >> outputsize) {
 +
 +        /*
 +         * For FEAT_LPA and PS=6, bits [51:48] of descaddr are in [15:12]
 +         * of descriptor.  Otherwise, if descaddr is out of range, raise
 +         * AddressSizeFault.
 +         */
 +        if (outputsize > 48) {
 +            descaddr |= extract64(descriptor, 12, 4) << 48;
 +        } else if (descaddr >> outputsize) {
              fault_type = ARMFault_AddressSize;
              goto do_fault;
          }
 --
-2.25.1
+2.34.1

-[PULL 04/26] hw/i2c: flatten pca954x mux device
+[PULL 08/36] hw/arm/stellaris: Constify read-only arrays
-From: Patrick Venture <venture@google.com>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-Previously this device created N subdevices which each owned an i2c bus.
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
-Now this device simply owns the N i2c busses directly.
+Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
+Message-id: 20250110160204.74997-3-philmd@linaro.org
 Tested: Verified devices behind mux are still accessible via qmp and i2c
 from within an arm32 SoC.
 Reviewed-by: Hao Wu <wuhaotsh@google.com>
 Signed-off-by: Patrick Venture <venture@google.com>
 Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
 Tested-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
 Message-id: 20220202164533.1283668-1-venture@google.com
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- hw/i2c/i2c_mux_pca954x.c | 77 +++++++---------------------------------
+ hw/arm/stellaris.c | 6 +++---
- 1 file changed, 13 insertions(+), 64 deletions(-)
+ 1 file changed, 3 insertions(+), 3 deletions(-)
-diff --git a/hw/i2c/i2c_mux_pca954x.c b/hw/i2c/i2c_mux_pca954x.c
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/hw/i2c/i2c_mux_pca954x.c
+--- a/hw/arm/stellaris.c
-+++ b/hw/i2c/i2c_mux_pca954x.c
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@
+@@ -XXX,XX +XXX,XX @@ static void ssys_update(ssys_state *s)
- #define PCA9548_CHANNEL_COUNT 8
+   qemu_set_irq(s->irq, (s->int_status & s->int_mask) != 0);
  #define PCA9546_CHANNEL_COUNT 4
 -/*
 - * struct Pca954xChannel - The i2c mux device will have N of these states
 - * that own the i2c channel bus.
 - * @bus: The owned channel bus.
 - * @enabled: Is this channel active?
 - */
 -typedef struct Pca954xChannel {
 -    SysBusDevice parent;
 -
 -    I2CBus       *bus;
 -
 -    bool         enabled;
 -} Pca954xChannel;
 -
 -#define TYPE_PCA954X_CHANNEL "pca954x-channel"
 -#define PCA954X_CHANNEL(obj) \
 -    OBJECT_CHECK(Pca954xChannel, (obj), TYPE_PCA954X_CHANNEL)
 -
  /*
   * struct Pca954xState - The pca954x state object.
   * @control: The value written to the mux control.
@@ -XXX,XX +XXX,XX @@ typedef struct Pca954xState {
      uint8_t control;
 -    /* The channel i2c buses. */
 -    Pca954xChannel channel[PCA9548_CHANNEL_COUNT];
 +    bool enabled[PCA9548_CHANNEL_COUNT];
 +    I2CBus *bus[PCA9548_CHANNEL_COUNT];
  } Pca954xState;
  /*
@@ -XXX,XX +XXX,XX @@ static bool pca954x_match(I2CSlave *candidate, uint8_t address,
      }
      for (i = 0; i < mc->nchans; i++) {
 -        if (!mux->channel[i].enabled) {
 +        if (!mux->enabled[i]) {
              continue;
          }
 -        if (i2c_scan_bus(mux->channel[i].bus, address, broadcast,
 +        if (i2c_scan_bus(mux->bus[i], address, broadcast,
                           current_devs)) {
              if (!broadcast) {
                  return true;
@@ -XXX,XX +XXX,XX @@ static void pca954x_enable_channel(Pca954xState *s, uint8_t enable_mask)
       */
      for (i = 0; i < mc->nchans; i++) {
          if (enable_mask & (1 << i)) {
 -            s->channel[i].enabled = true;
 +            s->enabled[i] = true;
          } else {
 -            s->channel[i].enabled = false;
 +            s->enabled[i] = false;
          }
      }
  }
-@@ -XXX,XX +XXX,XX @@ I2CBus *pca954x_i2c_get_bus(I2CSlave *mux, uint8_t channel)
-     Pca954xState *pca954x = PCA954X(mux);
+-static uint32_t pllcfg_sandstorm[16] = {
++static const uint32_t pllcfg_sandstorm[16] = {
-     g_assert(channel < pc->nchans);
+x31c0, /* 1 Mhz */
--    return I2C_BUS(qdev_get_child_bus(DEVICE(&pca954x->channel[channel]),
+x1ae0, /* 1.8432 Mhz */
--                                      "i2c-bus"));
+x18c0, /* 2 Mhz */
--}
+@@ -XXX,XX +XXX,XX @@ static uint32_t pllcfg_sandstorm[16] = {
--
+x585b /* 8.192 Mhz */
--static void pca954x_channel_init(Object *obj)
+ };
--{
--    Pca954xChannel *s = PCA954X_CHANNEL(obj);
+-static uint32_t pllcfg_fury[16] = {
--    s->bus = i2c_init_bus(DEVICE(s), "i2c-bus");
++static const uint32_t pllcfg_fury[16] = {
--
+x3200, /* 1 Mhz */
--    /* Start all channels as disabled. */
+x1b20, /* 1.8432 Mhz */
--    s->enabled = false;
+x1900, /* 2 Mhz */
--}
+@@ -XXX,XX +XXX,XX @@ static void stellaris_adc_init(Object *obj)
 -
 -static void pca954x_channel_class_init(ObjectClass *klass, void *data)
 -{
 -    DeviceClass *dc = DEVICE_CLASS(klass);
 -    dc->desc = "Pca954x Channel";
 +    return pca954x->bus[channel];
  }
- static void pca9546_class_init(ObjectClass *klass, void *data)
+ /* Board init.  */
-@@ -XXX,XX +XXX,XX @@ static void pca9548_class_init(ObjectClass *klass, void *data)
+-static stellaris_board_info stellaris_boards[] = {
-     s->nchans = PCA9548_CHANNEL_COUNT;
++static const stellaris_board_info stellaris_boards[] = {
- }
+   { "LM3S811EVB",
+,
--static void pca954x_realize(DeviceState *dev, Error **errp)
+x0032000e,
 -{
 -    Pca954xState *s = PCA954X(dev);
 -    Pca954xClass *c = PCA954X_GET_CLASS(s);
 -    int i;
 -
 -    /* SMBus modules. Cannot fail. */
 -    for (i = 0; i < c->nchans; i++) {
 -        sysbus_realize(SYS_BUS_DEVICE(&s->channel[i]), &error_abort);
 -    }
 -}
 -
  static void pca954x_init(Object *obj)
  {
      Pca954xState *s = PCA954X(obj);
      Pca954xClass *c = PCA954X_GET_CLASS(obj);
      int i;
 -    /* Only initialize the children we expect. */
 +    /* SMBus modules. Cannot fail. */
      for (i = 0; i < c->nchans; i++) {
 -        object_initialize_child(obj, "channel[*]", &s->channel[i],
 -                                TYPE_PCA954X_CHANNEL);
 +        g_autofree gchar *bus_name = g_strdup_printf("i2c.%d", i);
 +
 +        /* start all channels as disabled. */
 +        s->enabled[i] = false;
 +        s->bus[i] = i2c_init_bus(DEVICE(s), bus_name);
      }
  }
@@ -XXX,XX +XXX,XX @@ static void pca954x_class_init(ObjectClass *klass, void *data)
      rc->phases.enter = pca954x_enter_reset;
      dc->desc = "Pca954x i2c-mux";
 -    dc->realize = pca954x_realize;
      k->write_data = pca954x_write_data;
      k->receive_byte = pca954x_read_byte;
@@ -XXX,XX +XXX,XX @@ static const TypeInfo pca954x_info[] = {
          .parent        = TYPE_PCA954X,
          .class_init    = pca9548_class_init,
      },
 -    {
 -        .name = TYPE_PCA954X_CHANNEL,
 -        .parent = TYPE_SYS_BUS_DEVICE,
 -        .class_init = pca954x_channel_class_init,
 -        .instance_size = sizeof(Pca954xChannel),
 -        .instance_init = pca954x_channel_init,
 -    }
  };
  DEFINE_TYPES(pca954x_info)
 --
-.25.1
+.34.1

-[PULL 11/26] target/arm: Move arm_pamax out of line
+[PULL 09/36] hw/arm/stellaris: Remove incorrect unimplemented i2c-0 at 0x40002000
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-We will shortly share parts of this function with other portions
+There is nothing mapped at 0x40002000.
 of address translation.
+I2C#0 is already mapped at 0x40021000.
+Remove the invalid mapping added in commits aecfbbc97a2 & 394c8bbfb7a.
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
+Message-id: 20250110160204.74997-4-philmd@linaro.org
 Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
 Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20220301215958.157011-5-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/internals.h | 19 +------------------
+ hw/arm/stellaris.c | 2 --
- target/arm/helper.c    | 22 ++++++++++++++++++++++
+file changed, 2 deletions(-)
 files changed, 23 insertions(+), 18 deletions(-)
-diff --git a/target/arm/internals.h b/target/arm/internals.h
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/internals.h
+--- a/hw/arm/stellaris.c
-+++ b/target/arm/internals.h
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@ static inline void update_spsel(CPUARMState *env, uint32_t imm)
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-  * Returns the implementation defined bit-width of physical addresses.
+      * http://www.ti.com/lit/ds/symlink/lm3s6965.pdf
-  * The ARMv8 reference manuals refer to this as PAMax().
+      *
-  */
+      * 40000000 wdtimer
--static inline unsigned int arm_pamax(ARMCPU *cpu)
+-     * 40002000 i2c (unimplemented)
--{
+      * 40004000 GPIO
--    static const unsigned int pamax_map[] = {
+      * 40005000 GPIO
--        [0] = 32,
+      * 40006000 GPIO
--        [1] = 36,
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
--        [2] = 40,
+     /* Add dummy regions for the devices we don't implement yet,
--        [3] = 42,
+      * so guest accesses don't cause unlogged crashes.
--        [4] = 44,
+      */
--        [5] = 48,
+-    create_unimplemented_device("i2c-0", 0x40002000, 0x1000);
--    };
+     create_unimplemented_device("i2c-2", 0x40021000, 0x1000);
--    unsigned int parange =
+     create_unimplemented_device("PWM", 0x40028000, 0x1000);
--        FIELD_EX64(cpu->isar.id_aa64mmfr0, ID_AA64MMFR0, PARANGE);
+     create_unimplemented_device("QEI-0", 0x4002c000, 0x1000);
 -
 -    /* id_aa64mmfr0 is a read-only register so values outside of the
 -     * supported mappings can be considered an implementation error.  */
 -    assert(parange < ARRAY_SIZE(pamax_map));
 -    return pamax_map[parange];
 -}
 +unsigned int arm_pamax(ARMCPU *cpu);
  /* Return true if extended addresses are enabled.
   * This is always the case if our translation regime is 64 bit,
 diff --git a/target/arm/helper.c b/target/arm/helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/helper.c
 +++ b/target/arm/helper.c
@@ -XXX,XX +XXX,XX @@ static uint8_t convert_stage2_attrs(CPUARMState *env, uint8_t s2attrs)
  }
  #endif /* !CONFIG_USER_ONLY */
 +/* The cpu-specific constant value of PAMax; also used by hw/arm/virt. */
 +unsigned int arm_pamax(ARMCPU *cpu)
 +{
 +    static const unsigned int pamax_map[] = {
 +        [0] = 32,
 +        [1] = 36,
 +        [2] = 40,
 +        [3] = 42,
 +        [4] = 44,
 +        [5] = 48,
 +    };
 +    unsigned int parange =
 +        FIELD_EX64(cpu->isar.id_aa64mmfr0, ID_AA64MMFR0, PARANGE);
 +
 +    /*
 +     * id_aa64mmfr0 is a read-only register so values outside of the
 +     * supported mappings can be considered an implementation error.
 +     */
 +    assert(parange < ARRAY_SIZE(pamax_map));
 +    return pamax_map[parange];
 +}
 +
  static int aa64_va_parameter_tbi(uint64_t tcr, ARMMMUIdx mmu_idx)
  {
      if (regime_has_2_ranges(mmu_idx)) {
 --
-.25.1
+.34.1

-[PULL 06/26] target/arm: Fix early free of TCG temp in handle_simd_shift_fpint_conv()
+[PULL 10/36] hw/arm/stellaris: Replace magic numbers by definitions
-From: Wentao_Liang <Wentao_Liang_g@163.com>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-handle_simd_shift_fpint_conv() was accidentally freeing the TCG
+Add definitions for the number of controllers.
 temporary tcg_fpstatus too early, before the last use of it.  Move
 the free down to where it belongs.
-Signed-off-by: Wentao_Liang <Wentao_Liang_g@163.com>
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
-Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-[PMM: cleaned up commit message]
+Message-id: 20250110160204.74997-5-philmd@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/translate-a64.c | 2 +-
+ hw/arm/stellaris.c | 25 +++++++++++++++----------
-file changed, 1 insertion(+), 1 deletion(-)
+file changed, 15 insertions(+), 10 deletions(-)
-diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/translate-a64.c
+--- a/hw/arm/stellaris.c
-+++ b/target/arm/translate-a64.c
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
+@@ -XXX,XX +XXX,XX @@
  #define NUM_IRQ_LINES 64
  #define NUM_PRIO_BITS 3
 +#define NUM_GPIO    7
 +#define NUM_UART    4
 +#define NUM_GPTM    4
 +#define NUM_I2C     2
 +
  typedef const struct {
      const char *name;
      uint32_t did0;
@@ -XXX,XX +XXX,XX @@ static const stellaris_board_info stellaris_boards[] = {
  static void stellaris_init(MachineState *ms, stellaris_board_info *board)
  {
 -    static const int uart_irq[] = {5, 6, 33, 34};
 -    static const int timer_irq[] = {19, 21, 23, 35};
 -    static const uint32_t gpio_addr[7] =
 +    static const int uart_irq[NUM_UART] = {5, 6, 33, 34};
 +    static const int timer_irq[NUM_GPTM] = {19, 21, 23, 35};
 +    static const uint32_t gpio_addr[NUM_GPIO] =
        { 0x40004000, 0x40005000, 0x40006000, 0x40007000,
 x40024000, 0x40025000, 0x40026000};
 -    static const int gpio_irq[7] = {0, 1, 2, 3, 4, 30, 31};
 +    static const int gpio_irq[NUM_GPIO] = {0, 1, 2, 3, 4, 30, 31};
      /* Memory map of SoC devices, from
       * Stellaris LM3S6965 Microcontroller Data Sheet (rev I)
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
       */
      Object *soc_container;
 -    DeviceState *gpio_dev[7], *armv7m, *nvic;
 -    qemu_irq gpio_in[7][8];
 -    qemu_irq gpio_out[7][8];
 +    DeviceState *gpio_dev[NUM_GPIO], *armv7m, *nvic;
 +    qemu_irq gpio_in[NUM_GPIO][8];
 +    qemu_irq gpio_out[NUM_GPIO][8];
      qemu_irq adc;
      int sram_size;
      int flash_size;
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
      } else {
          adc = NULL;
      }
 -    for (i = 0; i < 4; i++) {
 +    for (i = 0; i < NUM_GPTM; i++) {
          if (board->dc2 & (0x10000 << i)) {
              SysBusDevice *sbd;
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
      }
 -    for (i = 0; i < 7; i++) {
 +    for (i = 0; i < NUM_GPIO; i++) {
          if (board->dc4 & (1 << i)) {
              gpio_dev[i] = sysbus_create_simple("pl061_luminary", gpio_addr[i],
                                                 qdev_get_gpio_in(nvic,
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
          }
      }
--    tcg_temp_free_ptr(tcg_fpstatus);
+-    for (i = 0; i < 4; i++) {
-     tcg_temp_free_i32(tcg_shift);
++    for (i = 0; i < NUM_UART; i++) {
-     gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
+         if (board->dc2 & (1 << i)) {
-+    tcg_temp_free_ptr(tcg_fpstatus);
+             SysBusDevice *sbd;
      tcg_temp_free_i32(tcg_rmode);
  }
 --
-.25.1
+.34.1

-[PULL 14/26] target/arm: Honor TCR_ELx.{I}PS
+[PULL 11/36] hw/arm/stellaris: Use DEVCAP macro to access DeviceCapability registers
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
-This field controls the output (intermediate) physical address size
+Add definitions (DCx_periph) for the DeviceCapability bits,
-of the translation process.  V8 requires to raise an AddressSize
+replace direct bitmask checks with the DEV_CAP() macro,
-fault if the page tables are programmed incorrectly, such that any
+which uses the extract/deposit API.
 intermediate descriptor address, or the final translated address,
 is out of range.
-Add a PS field to ARMVAParameters, and properly compute outputsize
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
 in get_phys_addr_lpae.  Test the descaddr as extracted from TTBR
 and from page table entries.
 Restrict descaddrmask so that we won't raise the fault for v7.
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
+Message-id: 20250110160204.74997-6-philmd@linaro.org
 Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20220301215958.157011-8-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/internals.h |  1 +
+ hw/arm/stellaris.c | 37 +++++++++++++++++++++++++++++--------
- target/arm/helper.c    | 72 ++++++++++++++++++++++++++++++++----------
+file changed, 29 insertions(+), 8 deletions(-)
 files changed, 57 insertions(+), 16 deletions(-)
-diff --git a/target/arm/internals.h b/target/arm/internals.h
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/internals.h
+--- a/hw/arm/stellaris.c
-+++ b/target/arm/internals.h
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@ static inline uint32_t aarch64_pstate_valid_mask(const ARMISARegisters *id)
+@@ -XXX,XX +XXX,XX @@
   */
- typedef struct ARMVAParameters {
-     unsigned tsz    : 8;
+ #include "qemu/osdep.h"
-+    unsigned ps     : 3;
++#include "qemu/bitops.h"
-     unsigned select : 1;
+ #include "qapi/error.h"
-     bool tbi        : 1;
+ #include "hw/core/split-irq.h"
-     bool epd        : 1;
+ #include "hw/sysbus.h"
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+@@ -XXX,XX +XXX,XX @@
-index XXXXXXX..XXXXXXX 100644
+ #define NUM_GPTM    4
---- a/target/arm/helper.c
+ #define NUM_I2C     2
-+++ b/target/arm/helper.c
-@@ -XXX,XX +XXX,XX @@ static uint8_t convert_stage2_attrs(CPUARMState *env, uint8_t s2attrs)
++/*
- }
++ * See Stellaris Data Sheet chapter 5.2.5 "System Control",
- #endif /* !CONFIG_USER_ONLY */
++ * Register 13 .. 17: Device Capabilities 0 .. 4 (DC0 .. DC4).
++ */
-+/* This mapping is common between ID_AA64MMFR0.PARANGE and TCR_ELx.{I}PS. */
++#define DC1_WDT          3
-+static const uint8_t pamax_map[] = {
++#define DC1_HIB          6
-+    [0] = 32,
++#define DC1_MPU          7
-+    [1] = 36,
++#define DC1_ADC          16
-+    [2] = 40,
++#define DC1_PWM          20
-+    [3] = 42,
++#define DC2_UART(n)     (n)
-+    [4] = 44,
++#define DC2_SSI          4
-+    [5] = 48,
++#define DC2_QEI(n)      (8 + n)
-+};
++#define DC2_I2C(n)      (12 + 2 * n)
 +#define DC2_GPTM(n)     (16 + n)
 +#define DC2_COMP(n)     (24 + n)
 +#define DC4_GPIO(n)     (n)
 +#define DC4_EMAC         28
 +
- /* The cpu-specific constant value of PAMax; also used by hw/arm/virt. */
++#define DEV_CAP(_dc, _cap) extract32(board->dc##_dc, DC##_dc##_##_cap, 1)
- unsigned int arm_pamax(ARMCPU *cpu)
++
- {
+ typedef const struct {
--    static const unsigned int pamax_map[] = {
+     const char *name;
--        [0] = 32,
+     uint32_t did0;
--        [1] = 36,
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
--        [2] = 40,
+     sysbus_mmio_map(SYS_BUS_DEVICE(ssys_dev), 0, 0x400fe000);
--        [3] = 42,
+     sysbus_connect_irq(SYS_BUS_DEVICE(ssys_dev), 0, qdev_get_gpio_in(nvic, 28));
--        [4] = 44,
--        [5] = 48,
+-    if (board->dc1 & (1 << 16)) {
--    };
++    if (DEV_CAP(1, ADC)) {
-     unsigned int parange =
+         dev = sysbus_create_varargs(TYPE_STELLARIS_ADC, 0x40038000,
-         FIELD_EX64(cpu->isar.id_aa64mmfr0, ID_AA64MMFR0, PARANGE);
+                                     qdev_get_gpio_in(nvic, 14),
+                                     qdev_get_gpio_in(nvic, 15),
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
- {
+         adc = NULL;
-     uint64_t tcr = regime_tcr(env, mmu_idx)->raw_tcr;
+     }
-     bool epd, hpd, using16k, using64k, tsz_oob;
+     for (i = 0; i < NUM_GPTM; i++) {
--    int select, tsz, tbi, max_tsz, min_tsz;
+-        if (board->dc2 & (0x10000 << i)) {
-+    int select, tsz, tbi, max_tsz, min_tsz, ps;
++        if (DEV_CAP(2, GPTM(i))) {
+             SysBusDevice *sbd;
-     if (!regime_has_2_ranges(mmu_idx)) {
-         select = 0;
+             dev = qdev_new(TYPE_STELLARIS_GPTM);
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
              hpd = extract32(tcr, 24, 1);
          }
-         epd = false;
+     }
-+        ps = extract32(tcr, 16, 3);
-     } else {
+-    if (board->dc1 & (1 << 3)) { /* watchdog present */
-         /*
++    if (DEV_CAP(1, WDT)) {
-          * Bit 55 is always between the two regions, and is canonical for
+         dev = qdev_new(TYPE_LUMINARY_WATCHDOG);
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+         object_property_add_child(soc_container, "wdg", OBJECT(dev));
-             epd = extract32(tcr, 23, 1);
+         qdev_connect_clock_in(dev, "WDOGCLK",
-             hpd = extract64(tcr, 42, 1);
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
      for (i = 0; i < NUM_GPIO; i++) {
 -        if (board->dc4 & (1 << i)) {
 +        if (DEV_CAP(4, GPIO(i))) {
              gpio_dev[i] = sysbus_create_simple("pl061_luminary", gpio_addr[i],
                                                 qdev_get_gpio_in(nvic,
                                                                  gpio_irq[i]));
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
          }
-+        ps = extract64(tcr, 32, 3);
      }
-     if (cpu_isar_feature(aa64_st, env_archcpu(env))) {
+-    if (board->dc2 & (1 << 12)) {
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
++    if (DEV_CAP(2, I2C(0))) {
+         dev = sysbus_create_simple(TYPE_STELLARIS_I2C, 0x40020000,
-     return (ARMVAParameters) {
+                                    qdev_get_gpio_in(nvic, 8));
-         .tsz = tsz,
+         i2c = (I2CBus *)qdev_get_child_bus(dev, "i2c");
-+        .ps = ps,
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-         .select = select,
+     }
-         .tbi = tbi,
-         .epd = epd,
+     for (i = 0; i < NUM_UART; i++) {
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
+-        if (board->dc2 & (1 << i)) {
++        if (DEV_CAP(2, UART(i))) {
-     /* TODO: This code does not support shareability levels. */
+             SysBusDevice *sbd;
-     if (aarch64) {
-+        int ps;
+             dev = qdev_new("pl011_luminary");
-+
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-         param = aa64_va_parameters(env, address, mmu_idx,
+             sysbus_connect_irq(sbd, 0, qdev_get_gpio_in(nvic, uart_irq[i]));
                                     access_type != MMU_INST_FETCH);
          level = 0;
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
          addrsize = 64 - 8 * param.tbi;
          inputsize = 64 - param.tsz;
 -        outputsize = arm_pamax(cpu);
 +
 +        /*
 +         * Bound PS by PARANGE to find the effective output address size.
 +         * ID_AA64MMFR0 is a read-only register so values outside of the
 +         * supported mappings can be considered an implementation error.
 +         */
 +        ps = FIELD_EX64(cpu->isar.id_aa64mmfr0, ID_AA64MMFR0, PARANGE);
 +        ps = MIN(ps, param.ps);
 +        assert(ps < ARRAY_SIZE(pamax_map));
 +        outputsize = pamax_map[ps];
      } else {
          param = aa32_va_parameters(env, address, mmu_idx);
          level = 1;
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
      /* Now we can extract the actual base address from the TTBR */
      descaddr = extract64(ttbr, 0, 48);
 +
 +    /*
 +     * If the base address is out of range, raise AddressSizeFault.
 +     * In the pseudocode, this is !IsZero(baseregister<47:outputsize>),
 +     * but we've just cleared the bits above 47, so simplify the test.
 +     */
 +    if (descaddr >> outputsize) {
 +        level = 0;
 +        fault_type = ARMFault_AddressSize;
 +        goto do_fault;
 +    }
 +
      /*
       * We rely on this masking to clear the RES0 bits at the bottom of the TTBR
       * and also to mask out CnP (bit 0) which could validly be non-zero.
       */
      descaddr &= ~indexmask;
 -    /* The address field in the descriptor goes up to bit 39 for ARMv7
 -     * but up to bit 47 for ARMv8, but we use the descaddrmask
 -     * up to bit 39 for AArch32, because we don't need other bits in that case
 -     * to construct next descriptor address (anyway they should be all zeroes).
 +    /*
 +     * For AArch32, the address field in the descriptor goes up to bit 39
 +     * for both v7 and v8.  However, for v8 the SBZ bits [47:40] must be 0
 +     * or an AddressSize fault is raised.  So for v8 we extract those SBZ
 +     * bits as part of the address, which will be checked via outputsize.
 +     * For AArch64, the address field always goes up to bit 47 (with extra
 +     * bits for FEAT_LPA placed elsewhere).  AArch64 implies v8.
       */
 -    descaddrmask = ((1ull << (aarch64 ? 48 : 40)) - 1) &
 -                   ~indexmask_grainsize;
 +    if (arm_feature(env, ARM_FEATURE_V8)) {
 +        descaddrmask = MAKE_64BIT_MASK(0, 48);
 +    } else {
 +        descaddrmask = MAKE_64BIT_MASK(0, 40);
 +    }
 +    descaddrmask &= ~indexmask_grainsize;
      /* Secure accesses start with the page table in secure memory and
       * can be downgraded to non-secure at any step. Non-secure accesses
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
              /* Invalid, or the Reserved level 3 encoding */
              goto do_fault;
          }
-+
+     }
-         descaddr = descriptor & descaddrmask;
+-    if (board->dc2 & (1 << 4)) {
-+        if (descaddr >> outputsize) {
++    if (DEV_CAP(2, SSI)) {
-+            fault_type = ARMFault_AddressSize;
+         dev = sysbus_create_simple("pl022", 0x40008000,
-+            goto do_fault;
+                                    qdev_get_gpio_in(nvic, 7));
-+        }
+         if (board->peripherals & BP_OLED_SSI) {
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-         if ((descriptor & 2) && (level < 3)) {
+             qemu_irq_raise(gpio_out[GPIO_D][0]);
-             /* Table entry. The top five bits are attributes which may
+         }
      }
 -    if (board->dc4 & (1 << 28)) {
 +    if (DEV_CAP(4, EMAC)) {
          DeviceState *enet;
          enet = qdev_new("stellaris_enet");
 --
-.25.1
+.34.1

-[PULL 03/26] hw/input/tsc210x: Don't abort on bad SPI word widths
+[PULL 12/36] hw/arm/stellaris: Map both I2C controllers
-The tsc210x doesn't support anything other than 16-bit reads on the
+From: Philippe Mathieu-Daudé <philmd@linaro.org>
 SPI bus, but the guest can program the SPI controller to attempt
 them anyway. If this happens, don't abort QEMU, just log this as
 a guest error.
-This fixes our machine_arm_n8x0.py:N8x0Machine.test_n800
+There are 2 I2C controllers, map them both, removing
-acceptance test, which hits this assertion.
+the unimplemented one. Keep the OLED controller on the
 first I2C bus.
-The reason we hit the assertion is because the guest kernel thinks
+Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org>
-there is a TSC2005 on this SPI bus address, not a TSC210x.  (The n810
+Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-*does* have a TSC2005 at this address.) The TSC2005 supports the
+Message-id: 20250110160204.74997-7-philmd@linaro.org
--bit accesses which the guest driver makes, and the TSC210x does
+[PMM: tweak to appease maybe-uninitialized warning]
-not (that is, our TSC210x emulation is not missing support for a word
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-width the hardware can handle).  It's not clear whether the problem
+---
-here is that the guest kernel incorrectly thinks the n800 has the
+ hw/arm/stellaris.c | 21 +++++++++++++--------
-same device at this SPI bus address as the n810, or that QEMU's n810
+file changed, 13 insertions(+), 8 deletions(-)
 board model doesn't get the SPI devices right.  At this late date
 there no longer appears to be any reliable information on the web
 about the hardware behaviour, but I am inclined to think this is a
 guest kernel bug.  In any case, we prefer not to abort QEMU for
 guest-triggerable conditions, so logging the error is the right thing
 to do.
-Resolves: https://gitlab.com/qemu-project/qemu/-/issues/736
+diff --git a/hw/arm/stellaris.c b/hw/arm/stellaris.c
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
 Message-id: 20220221140750.514557-1-peter.maydell@linaro.org
 ---
  hw/input/tsc210x.c | 8 ++++++--
 file changed, 6 insertions(+), 2 deletions(-)
 diff --git a/hw/input/tsc210x.c b/hw/input/tsc210x.c
 index XXXXXXX..XXXXXXX 100644
---- a/hw/input/tsc210x.c
+--- a/hw/arm/stellaris.c
-+++ b/hw/input/tsc210x.c
++++ b/hw/arm/stellaris.c
-@@ -XXX,XX +XXX,XX @@
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
- #include "hw/hw.h"
+       { 0x40004000, 0x40005000, 0x40006000, 0x40007000,
- #include "audio/audio.h"
+x40024000, 0x40025000, 0x40026000};
- #include "qemu/timer.h"
+     static const int gpio_irq[NUM_GPIO] = {0, 1, 2, 3, 4, 30, 31};
-+#include "qemu/log.h"
++    static const uint32_t i2c_addr[NUM_I2C] = {0x40020000, 0x40021000};
- #include "sysemu/reset.h"
++    static const int i2c_irq[NUM_I2C] = {8, 37};
- #include "ui/console.h"
- #include "hw/arm/omap.h"            /* For I2SCodec */
+     /* Memory map of SoC devices, from
-@@ -XXX,XX +XXX,XX @@ uint32_t tsc210x_txrx(void *opaque, uint32_t value, int len)
+      * Stellaris LM3S6965 Microcontroller Data Sheet (rev I)
-     TSC210xState *s = opaque;
+@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
-     uint32_t ret = 0;
+     qemu_irq adc;
+     int sram_size;
--    if (len != 16)
+     int flash_size;
--        hw_error("%s: FIXME: bad SPI word width %i\n", __func__, len);
+-    I2CBus *i2c;
-+    if (len != 16) {
++    DeviceState *i2c_dev[NUM_I2C] = { };
-+        qemu_log_mask(LOG_GUEST_ERROR,
+     DeviceState *dev;
-+                      "%s: bad SPI word width %i\n", __func__, len);
+     DeviceState *ssys_dev;
-+        return 0;
+     int i;
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
          }
      }
 -    if (DEV_CAP(2, I2C(0))) {
 -        dev = sysbus_create_simple(TYPE_STELLARIS_I2C, 0x40020000,
 -                                   qdev_get_gpio_in(nvic, 8));
 -        i2c = (I2CBus *)qdev_get_child_bus(dev, "i2c");
 -        if (board->peripherals & BP_OLED_I2C) {
 -            i2c_slave_create_simple(i2c, "ssd0303", 0x3d);
 +    for (i = 0; i < NUM_I2C; i++) {
 +        if (DEV_CAP(2, I2C(i))) {
 +            i2c_dev[i] = sysbus_create_simple(TYPE_STELLARIS_I2C, i2c_addr[i],
 +                                              qdev_get_gpio_in(nvic,
 +                                                               i2c_irq[i]));
          }
      }
 +    if (board->peripherals & BP_OLED_I2C) {
 +        I2CBus *bus = (I2CBus *)qdev_get_child_bus(i2c_dev[0], "i2c");
 +
 +        i2c_slave_create_simple(bus, "ssd0303", 0x3d);
 +    }
-     /* TODO: sequential reads etc - how do we make sure the host doesn't
+     for (i = 0; i < NUM_UART; i++) {
-      * unintentionally read out a conversion result from a register while
+         if (DEV_CAP(2, UART(i))) {
@@ -XXX,XX +XXX,XX @@ static void stellaris_init(MachineState *ms, stellaris_board_info *board)
      /* Add dummy regions for the devices we don't implement yet,
       * so guest accesses don't cause unlogged crashes.
       */
 -    create_unimplemented_device("i2c-2", 0x40021000, 0x1000);
      create_unimplemented_device("PWM", 0x40028000, 0x1000);
      create_unimplemented_device("QEI-0", 0x4002c000, 0x1000);
      create_unimplemented_device("QEI-1", 0x4002d000, 0x1000);
 --
-.25.1
+.34.1

-[PULL 07/26] tests/qtest: add qtests for npcm7xx sdhci
+[PULL 13/36] tests/functional: Add a test for the arm microbit machine
-From: Shengtan Mao <stmao@google.com>
+From: Thomas Huth <thuth@redhat.com>
-Reviewed-by: Hao Wu <wuhaotsh@google.com>
+We don't have any functional tests for this machine yet, thus let's
-Reviewed-by: Chris Rauer <crauer@google.com>
+add a test with a MicroPython binary that is available online
-Signed-off-by: Shengtan Mao <stmao@google.com>
+(thanks to Joel Stanley for providing it, see:
-Signed-off-by: Patrick Venture <venture@google.com>
+ https://www.mail-archive.com/qemu-devel@nongnu.org/msg606064.html ).
-Message-id: 20220225174451.192304-1-wuhaotsh@google.com
 Signed-off-by: Thomas Huth <thuth@redhat.com>
 Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
 Message-id: 20250124101709.1591761-1-thuth@redhat.com
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- tests/qtest/npcm7xx_sdhci-test.c | 215 +++++++++++++++++++++++++++++++
+ MAINTAINERS                           |  1 +
- tests/qtest/meson.build          |   1 +
+ tests/functional/meson.build          |  1 +
-files changed, 216 insertions(+)
+ tests/functional/test_arm_microbit.py | 31 +++++++++++++++++++++++++++
- create mode 100644 tests/qtest/npcm7xx_sdhci-test.c
+files changed, 33 insertions(+)
  create mode 100755 tests/functional/test_arm_microbit.py
-diff --git a/tests/qtest/npcm7xx_sdhci-test.c b/tests/qtest/npcm7xx_sdhci-test.c
+diff --git a/MAINTAINERS b/MAINTAINERS
-new file mode 100644
+index XXXXXXX..XXXXXXX 100644
 --- a/MAINTAINERS
 +++ b/MAINTAINERS
@@ -XXX,XX +XXX,XX @@ F: hw/*/microbit*.c
  F: include/hw/*/nrf51*.h
  F: include/hw/*/microbit*.h
  F: tests/qtest/microbit-test.c
 +F: tests/functional/test_arm_microbit.py
  F: docs/system/arm/nrf.rst
  ARM PL011 Rust device
 diff --git a/tests/functional/meson.build b/tests/functional/meson.build
 index XXXXXXX..XXXXXXX 100644
 --- a/tests/functional/meson.build
 +++ b/tests/functional/meson.build
@@ -XXX,XX +XXX,XX @@ tests_arm_system_thorough = [
    'arm_cubieboard',
    'arm_emcraft_sf2',
    'arm_integratorcp',
 +  'arm_microbit',
    'arm_orangepi',
    'arm_quanta_gsj',
    'arm_raspi2',
 diff --git a/tests/functional/test_arm_microbit.py b/tests/functional/test_arm_microbit.py
 new file mode 100755
 index XXXXXXX..XXXXXXX
 --- /dev/null
-+++ b/tests/qtest/npcm7xx_sdhci-test.c
++++ b/tests/functional/test_arm_microbit.py
 @@ -XXX,XX +XXX,XX @@
-+/*
++#!/usr/bin/env python3
-+ * QTests for NPCM7xx SD-3.0 / MMC-4.51 Host Controller
++#
-+ *
++# SPDX-License-Identifier: GPL-2.0-or-later
-+ * Copyright (c) 2022 Google LLC
++#
-+ *
++# Copyright 2025, The QEMU Project Developers.
-+ * This program is free software; you can redistribute it and/or modify it
++#
-+ * under the terms of the GNU General Public License as published by the
++# A functional test that runs MicroPython on the arm microbit machine.
 + * Free Software Foundation; either version 2 of the License, or
 + * (at your option) any later version.
 + *
 + * This program is distributed in the hope that it will be useful, but WITHOUT
 + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 + * for more details.
 + */
 +
-+#include "qemu/osdep.h"
++from qemu_test import QemuSystemTest, Asset, exec_command_and_wait_for_pattern
-+#include "hw/sd/npcm7xx_sdhci.h"
++from qemu_test import wait_for_console_pattern
 +
-+#include "libqos/libqtest.h"
-+#include "libqtest-single.h"
-+#include "libqos/sdhci-cmd.h"
 +
-+#define NPCM7XX_REG_SIZE 0x100
++class MicrobitMachine(QemuSystemTest):
 +#define NPCM7XX_MMC_BA 0xF0842000
 +#define NPCM7XX_BLK_SIZE 512
 +#define NPCM7XX_TEST_IMAGE_SIZE (1 << 30)
 +
-+char *sd_path;
++    ASSET_MICRO = Asset('https://ozlabs.org/~joel/microbit-micropython.hex',
 +        '021641f93dfb11767d4978dbb3ca7f475d1b13c69e7f4aec3382f212636bffd6')
 +
-+static QTestState *setup_sd_card(void)
++    def test_arm_microbit(self):
-+{
++        self.set_machine('microbit')
 +    QTestState *qts = qtest_initf(
 +        "-machine kudo-bmc "
 +        "-device sd-card,drive=drive0 "
 +        "-drive id=drive0,if=none,file=%s,format=raw,auto-read-only=off",
 +        sd_path);
 +
-+    qtest_writew(qts, NPCM7XX_MMC_BA + SDHC_SWRST, SDHC_RESET_ALL);
++        micropython = self.ASSET_MICRO.fetch()
-+    qtest_writew(qts, NPCM7XX_MMC_BA + SDHC_CLKCON,
++        self.vm.set_console()
-+                 SDHC_CLOCK_SDCLK_EN | SDHC_CLOCK_INT_STABLE |
++        self.vm.add_args('-device', f'loader,file={micropython}')
-+                     SDHC_CLOCK_INT_EN);
++        self.vm.launch()
-+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_APP_CMD);
++        wait_for_console_pattern(self, 'Type "help()" for more information.')
-+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0x41200000, 0, (41 << 8));
++        exec_command_and_wait_for_pattern(self, 'import machine as mch', '>>>')
-+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_ALL_SEND_CID);
++        exec_command_and_wait_for_pattern(self, 'mch.reset()', 'MicroPython')
-+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_SEND_RELATIVE_ADDR);
++        wait_for_console_pattern(self, '>>>')
 +    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0x45670000, 0,
 +                   SDHC_SELECT_DESELECT_CARD);
 +
-+    return qts;
++if __name__ == '__main__':
-+}
++    QemuSystemTest.main()
 +
 +static void write_sdread(QTestState *qts, const char *msg)
 +{
 +    int fd, ret;
 +    size_t len = strlen(msg);
 +    char *rmsg = g_malloc(len);
 +
 +    /* write message to sd */
 +    fd = open(sd_path, O_WRONLY);
 +    g_assert(fd >= 0);
 +    ret = write(fd, msg, len);
 +    close(fd);
 +    g_assert(ret == len);
 +
 +    /* read message using sdhci */
 +    ret = sdhci_read_cmd(qts, NPCM7XX_MMC_BA, rmsg, len);
 +    g_assert(ret == len);
 +    g_assert(!memcmp(rmsg, msg, len));
 +
 +    g_free(rmsg);
 +}
 +
 +/* Check MMC can read values from sd */
 +static void test_read_sd(void)
 +{
 +    QTestState *qts = setup_sd_card();
 +
 +    write_sdread(qts, "hello world");
 +    write_sdread(qts, "goodbye");
 +
 +    qtest_quit(qts);
 +}
 +
 +static void sdwrite_read(QTestState *qts, const char *msg)
 +{
 +    int fd, ret;
 +    size_t len = strlen(msg);
 +    char *rmsg = g_malloc(len);
 +
 +    /* write message using sdhci */
 +    sdhci_write_cmd(qts, NPCM7XX_MMC_BA, msg, len, NPCM7XX_BLK_SIZE);
 +
 +    /* read message from sd */
 +    fd = open(sd_path, O_RDONLY);
 +    g_assert(fd >= 0);
 +    ret = read(fd, rmsg, len);
 +    close(fd);
 +    g_assert(ret == len);
 +
 +    g_assert(!memcmp(rmsg, msg, len));
 +
 +    g_free(rmsg);
 +}
 +
 +/* Check MMC can write values to sd */
 +static void test_write_sd(void)
 +{
 +    QTestState *qts = setup_sd_card();
 +
 +    sdwrite_read(qts, "hello world");
 +    sdwrite_read(qts, "goodbye");
 +
 +    qtest_quit(qts);
 +}
 +
 +/* Check SDHCI has correct default values. */
 +static void test_reset(void)
 +{
 +    QTestState *qts = qtest_init("-machine kudo-bmc");
 +    uint64_t addr = NPCM7XX_MMC_BA;
 +    uint64_t end_addr = addr + NPCM7XX_REG_SIZE;
 +    uint16_t prstvals_resets[] = {NPCM7XX_PRSTVALS_0_RESET,
 +                                  NPCM7XX_PRSTVALS_1_RESET,
 +                                  0,
 +                                  NPCM7XX_PRSTVALS_3_RESET,
 +                                  0,
 +                                  0};
 +    int i;
 +    uint32_t mask;
 +
 +    while (addr < end_addr) {
 +        switch (addr - NPCM7XX_MMC_BA) {
 +        case SDHC_PRNSTS:
 +            /*
 +             * ignores bits 20 to 24: they are changed when reading registers
 +             */
 +            mask = 0x1f00000;
 +            g_assert_cmphex(qtest_readl(qts, addr) | mask, ==,
 +                            NPCM7XX_PRSNTS_RESET | mask);
 +            addr += 4;
 +            break;
 +        case SDHC_BLKGAP:
 +            g_assert_cmphex(qtest_readb(qts, addr), ==, NPCM7XX_BLKGAP_RESET);
 +            addr += 1;
 +            break;
 +        case SDHC_CAPAB:
 +            g_assert_cmphex(qtest_readq(qts, addr), ==, NPCM7XX_CAPAB_RESET);
 +            addr += 8;
 +            break;
 +        case SDHC_MAXCURR:
 +            g_assert_cmphex(qtest_readq(qts, addr), ==, NPCM7XX_MAXCURR_RESET);
 +            addr += 8;
 +            break;
 +        case SDHC_HCVER:
 +            g_assert_cmphex(qtest_readw(qts, addr), ==, NPCM7XX_HCVER_RESET);
 +            addr += 2;
 +            break;
 +        case NPCM7XX_PRSTVALS:
 +            for (i = 0; i < NPCM7XX_PRSTVALS_SIZE; ++i) {
 +                g_assert_cmphex(qtest_readw(qts, addr + 2 * i), ==,
 +                                prstvals_resets[i]);
 +            }
 +            addr += NPCM7XX_PRSTVALS_SIZE * 2;
 +            break;
 +        default:
 +            g_assert_cmphex(qtest_readb(qts, addr), ==, 0);
 +            addr += 1;
 +        }
 +    }
 +
 +    qtest_quit(qts);
 +}
 +
 +static void drive_destroy(void)
 +{
 +    unlink(sd_path);
 +    g_free(sd_path);
 +}
 +
 +static void drive_create(void)
 +{
 +    int fd, ret;
 +    GError *error = NULL;
 +
 +    /* Create a temporary raw image */
 +    fd = g_file_open_tmp("sdhci_XXXXXX", &sd_path, &error);
 +    if (fd == -1) {
 +        fprintf(stderr, "unable to create sdhci file: %s\n", error->message);
 +        g_error_free(error);
 +    }
 +    g_assert(sd_path != NULL);
 +
 +    ret = ftruncate(fd, NPCM7XX_TEST_IMAGE_SIZE);
 +    g_assert_cmpint(ret, ==, 0);
 +    g_message("%s", sd_path);
 +    close(fd);
 +}
 +
 +int main(int argc, char **argv)
 +{
 +    int ret;
 +
 +    drive_create();
 +
 +    g_test_init(&argc, &argv, NULL);
 +
 +    qtest_add_func("npcm7xx_sdhci/reset", test_reset);
 +    qtest_add_func("npcm7xx_sdhci/write_sd", test_write_sd);
 +    qtest_add_func("npcm7xx_sdhci/read_sd", test_read_sd);
 +
 +    ret = g_test_run();
 +    drive_destroy();
 +    return ret;
 +}
 diff --git a/tests/qtest/meson.build b/tests/qtest/meson.build
 index XXXXXXX..XXXXXXX 100644
 --- a/tests/qtest/meson.build
 +++ b/tests/qtest/meson.build
@@ -XXX,XX +XXX,XX @@ qtests_npcm7xx = \
     'npcm7xx_gpio-test',
     'npcm7xx_pwm-test',
     'npcm7xx_rng-test',
 +   'npcm7xx_sdhci-test',
     'npcm7xx_smbus-test',
     'npcm7xx_timer-test',
     'npcm7xx_watchdog_timer-test'] + \
 --
-.25.1
+.34.1

-[PULL 21/26] target/arm: Validate tlbi TG matches translation granule in use
+[PULL 14/36] target/arm: arm_reset_sve_state() should set FPSR, not FPCR
-From: Richard Henderson <richard.henderson@linaro.org>
+The pseudocode ResetSVEState() does:
     FPSR = ZeroExtend(0x0800009f<31:0>, 64);
 but QEMU's arm_reset_sve_state() called vfp_set_fpcr() by accident.
-For FEAT_LPA2, we will need other ARMVAParameters, which themselves
+Before the advent of FEAT_AFP, this was only setting a collection of
-depend on the translation granule in use.  We might as well validate
+RES0 bits, which vfp_set_fpsr() would then ignore, so the only effect
-that the given TG matches; the architecture "does not require that
+was that we didn't actually set the FPSR the way we are supposed to
-the instruction invalidates any entries" if this is not true.
+do.  Once FEAT_AFP is implemented, setting the bottom bits of FPSR
 will change the floating point behaviour.
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
+Call vfp_set_fpsr(), as we ought to.
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-15-richard.henderson@linaro.org
+(Note for stable backports: commit 7f2a01e7368f9 moved this function
 from sme_helper.c to helper.c, but it had the same bug before the
 move too.)
 Cc: qemu-stable@nongnu.org
 Fixes: f84734b87461 ("target/arm: Implement SMSTART, SMSTOP")
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-4-peter.maydell@linaro.org
 ---
- target/arm/helper.c | 10 +++++++---
+ target/arm/helper.c | 2 +-
-1 file changed, 7 insertions(+), 3 deletions(-)
+1 file changed, 1 insertion(+), 1 deletion(-)
 diff --git a/target/arm/helper.c b/target/arm/helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/helper.c
 +++ b/target/arm/helper.c
-@@ -XXX,XX +XXX,XX @@ static TLBIRange tlbi_aa64_get_range(CPUARMState *env, ARMMMUIdx mmuidx,
+@@ -XXX,XX +XXX,XX @@ static void arm_reset_sve_state(CPUARMState *env)
-                                      uint64_t value)
+     memset(env->vfp.zregs, 0, sizeof(env->vfp.zregs));
- {
+     /* Recall that FFR is stored as pregs[16]. */
-     unsigned int page_size_granule, page_shift, num, scale, exponent;
+     memset(env->vfp.pregs, 0, sizeof(env->vfp.pregs));
-+    /* Extract one bit to represent the va selector in use. */
+-    vfp_set_fpcr(env, 0x0800009f);
-+    uint64_t select = sextract64(value, 36, 1);
++    vfp_set_fpsr(env, 0x0800009f);
-+    ARMVAParameters param = aa64_va_parameters(env, select, mmuidx, true);
+ }
-     TLBIRange ret = { };
+ void aarch64_set_svcr(CPUARMState *env, uint64_t new, uint64_t mask)
      page_size_granule = extract64(value, 46, 2);
 -    if (page_size_granule == 0) {
 -        qemu_log_mask(LOG_GUEST_ERROR, "Invalid page size granule %d\n",
 +    /* The granule encoded in value must match the granule in use. */
 +    if (page_size_granule != (param.using64k ? 3 : param.using16k ? 2 : 1)) {
 +        qemu_log_mask(LOG_GUEST_ERROR, "Invalid tlbi page size granule %d\n",
                        page_size_granule);
          return ret;
      }
@@ -XXX,XX +XXX,XX @@ static TLBIRange tlbi_aa64_get_range(CPUARMState *env, ARMMMUIdx mmuidx,
      ret.length = (num + 1) << (exponent + page_shift);
 -    if (regime_has_2_ranges(mmuidx)) {
 +    if (param.select) {
          ret.base = sextract64(value, 0, 37);
      } else {
          ret.base = extract64(value, 0, 37);
 --
-.25.1
+.34.1

-[PULL 20/26] target/arm: Fix TLBIRange.base for 16k and 64k pages
+[PULL 15/36] target/arm: Use FPSR_ constants in vfp_exceptbits_from_host()
-From: Richard Henderson <richard.henderson@linaro.org>
+Use the FPSR_ named constants in vfp_exceptbits_from_host(),
 rather than hardcoded magic numbers.
-The shift of the BaseADDR field depends on the translation
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-granule in use.
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20250124162836.2332150-5-peter.maydell@linaro.org
 ---
  target/arm/vfp_helper.c | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)
-Fixes: 84940ed8255 ("target/arm: Add support for FEAT_TLBIRANGE")
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 Reported-by: Peter Maydell <peter.maydell@linaro.org>
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
 Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20220301215958.157011-14-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
  target/arm/helper.c | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)
 diff --git a/target/arm/helper.c b/target/arm/helper.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/target/arm/vfp_helper.c
-+++ b/target/arm/helper.c
++++ b/target/arm/vfp_helper.c
-@@ -XXX,XX +XXX,XX @@ static TLBIRange tlbi_aa64_get_range(CPUARMState *env, ARMMMUIdx mmuidx,
+@@ -XXX,XX +XXX,XX @@ static inline int vfp_exceptbits_from_host(int host_bits)
-     ret.length = (num + 1) << (exponent + page_shift);
+     int target_bits = 0;
-     if (regime_has_2_ranges(mmuidx)) {
+     if (host_bits & float_flag_invalid) {
--        ret.base = sextract64(value, 0, 37) << TARGET_PAGE_BITS;
+-        target_bits |= 1;
-+        ret.base = sextract64(value, 0, 37);
++        target_bits |= FPSR_IOC;
      } else {
 -        ret.base = extract64(value, 0, 37) << TARGET_PAGE_BITS;
 +        ret.base = extract64(value, 0, 37);
      }
-+    ret.base <<= page_shift;
+     if (host_bits & float_flag_divbyzero) {
+-        target_bits |= 2;
-     return ret;
++        target_bits |= FPSR_DZC;
      }
      if (host_bits & float_flag_overflow) {
 -        target_bits |= 4;
 +        target_bits |= FPSR_OFC;
      }
      if (host_bits & (float_flag_underflow | float_flag_output_denormal)) {
 -        target_bits |= 8;
 +        target_bits |= FPSR_UFC;
      }
      if (host_bits & float_flag_inexact) {
 -        target_bits |= 0x10;
 +        target_bits |= FPSR_IXC;
      }
      if (host_bits & float_flag_input_denormal) {
 -        target_bits |= 0x80;
 +        target_bits |= FPSR_IDC;
      }
      return target_bits;
  }
 --
-.25.1
+.34.1

-New patch
+[PULL 16/36] target/arm: Use uint32_t in vfp_exceptbits_from_host()
+In vfp_exceptbits_from_host(), we accumulate the FPSR flags in
+an "int", and our return type is also "int". However, the only
+callsite returns the same information as a uint32_t, and
+more generally we handle FPSR values in the code as uint32_t,
+not int. Bring this function into line with that convention.
+There is no behaviour change because none of the FPSR bits
+we set in this function are bit 31. The input argument to
+the function remains 'int' because that is the return type
+of the softfloat get_float_exception_flags().
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-6-peter.maydell@linaro.org
+---
+ target/arm/vfp_helper.c | 4 ++--
+1 file changed, 2 insertions(+), 2 deletions(-)
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/vfp_helper.c
++++ b/target/arm/vfp_helper.c
+@@ -XXX,XX +XXX,XX @@
+ #ifdef CONFIG_TCG
+ /* Convert host exception flags to vfp form.  */
+-static inline int vfp_exceptbits_from_host(int host_bits)
++static inline uint32_t vfp_exceptbits_from_host(int host_bits)
+ {
+-    int target_bits = 0;
++    uint32_t target_bits = 0;
+     if (host_bits & float_flag_invalid) {
+         target_bits |= FPSR_IOC;
+--
+.34.1

-[PULL 23/26] target/arm: Implement FEAT_LPA2
+[PULL 17/36] target/arm: Define new fp_status_a32 and fp_status_a64
-From: Richard Henderson <richard.henderson@linaro.org>
+We want to split the existing fp_status in the Arm CPUState into
 separate float_status fields for AArch32 and AArch64.  (This is
 because new control bits defined by FEAT_AFP only have an effect for
 AArch64, not AArch32.) To make this split we will:
  * define new fp_status_a32 and fp_status_a64 which have
    identical behaviour to the existing fp_status
  * move existing uses of fp_status to fp_status_a32 or
    fp_status_a64 as appropriate
  * delete the old fp_status when it has no uses left
-This feature widens physical addresses (and intermediate physical
+In this patch we add the new float_status fields.
 addresses for 2-stage translation) from 48 to 52 bits, when using
 4k or 16k pages.
-This introduces the DS bit to TCR_ELx, which is RES0 unless the
+We will also need to split fp_status_f16, but we will do that
-page size is enabled and supports LPA2, resulting in the effective
+as a separate series of patches.
 value of DS for a given table walk.  The DS bit changes the format
 of the page table descriptor slightly, moving the PS field out to
 TCR so that all pages have the same sharability and repurposing
 those bits of the page table descriptor for the highest bits of
 the output address.
-Do not yet enable FEAT_LPA2; we need extra plumbing to avoid
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-tickling an old kernel bug.
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20250124162836.2332150-7-peter.maydell@linaro.org
 ---
  target/arm/cpu.h           |  4 ++++
  target/arm/tcg/translate.h | 12 ++++++++++++
  target/arm/cpu.c           |  2 ++
  target/arm/vfp_helper.c    | 12 ++++++++++++
 4 files changed, 30 insertions(+)
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-17-richard.henderson@linaro.org
-Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
----
- docs/system/arm/emulation.rst |   1 +
- target/arm/cpu.h              |  22 ++++++++
- target/arm/internals.h        |   2 +
- target/arm/helper.c           | 102 +++++++++++++++++++++++++++++-----
-4 files changed, 112 insertions(+), 15 deletions(-)
-diff --git a/docs/system/arm/emulation.rst b/docs/system/arm/emulation.rst
-index XXXXXXX..XXXXXXX 100644
---- a/docs/system/arm/emulation.rst
-+++ b/docs/system/arm/emulation.rst
-@@ -XXX,XX +XXX,XX @@ the following architecture extensions:
- - FEAT_JSCVT (JavaScript conversion instructions)
- - FEAT_LOR (Limited ordering regions)
- - FEAT_LPA (Large Physical Address space)
-+- FEAT_LPA2 (Large Physical and virtual Address space v2)
- - FEAT_LRCPC (Load-acquire RCpc instructions)
- - FEAT_LRCPC2 (Load-acquire RCpc instructions v2)
- - FEAT_LSE (Large System Extensions)
 diff --git a/target/arm/cpu.h b/target/arm/cpu.h
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.h
 +++ b/target/arm/cpu.h
-@@ -XXX,XX +XXX,XX @@ static inline bool isar_feature_aa64_i8mm(const ARMISARegisters *id)
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
-     return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, I8MM) != 0;
+         /* There are a number of distinct float control structures:
           *
           *  fp_status: is the "normal" fp status.
 +         *  fp_status_a32: is the "normal" fp status for AArch32 insns
 +         *  fp_status_a64: is the "normal" fp status for AArch64 insns
           *  fp_status_fp16: used for half-precision calculations
           *  standard_fp_status : the ARM "Standard FPSCR Value"
           *  standard_fp_status_fp16 : used for half-precision
@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
           * an explicit FPSCR read.
           */
          float_status fp_status;
 +        float_status fp_status_a32;
 +        float_status fp_status_a64;
          float_status fp_status_f16;
          float_status standard_fp_status;
          float_status standard_fp_status_f16;
 diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/tcg/translate.h
 +++ b/target/arm/tcg/translate.h
@@ -XXX,XX +XXX,XX @@ static inline CPUARMTBFlags arm_tbflags_from_tb(const TranslationBlock *tb)
   */
  typedef enum ARMFPStatusFlavour {
      FPST_FPCR,
 +    FPST_A32,
 +    FPST_A64,
      FPST_FPCR_F16,
      FPST_STD,
      FPST_STD_F16,
@@ -XXX,XX +XXX,XX @@ typedef enum ARMFPStatusFlavour {
   *
   * FPST_FPCR
   *   for non-FP16 operations controlled by the FPCR
 + * FPST_A32
 + *   for AArch32 non-FP16 operations controlled by the FPCR
 + * FPST_A64
 + *   for AArch64 non-FP16 operations controlled by the FPCR
   * FPST_FPCR_F16
   *   for operations controlled by the FPCR where FPCR.FZ16 is to be used
   * FPST_STD
@@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour)
      case FPST_FPCR:
          offset = offsetof(CPUARMState, vfp.fp_status);
          break;
 +    case FPST_A32:
 +        offset = offsetof(CPUARMState, vfp.fp_status_a32);
 +        break;
 +    case FPST_A64:
 +        offset = offsetof(CPUARMState, vfp.fp_status_a64);
 +        break;
      case FPST_FPCR_F16:
          offset = offsetof(CPUARMState, vfp.fp_status_f16);
          break;
 diff --git a/target/arm/cpu.c b/target/arm/cpu.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.c
 +++ b/target/arm/cpu.c
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset_hold(Object *obj, ResetType type)
      set_default_nan_mode(1, &env->vfp.standard_fp_status);
      set_default_nan_mode(1, &env->vfp.standard_fp_status_f16);
      arm_set_default_fp_behaviours(&env->vfp.fp_status);
 +    arm_set_default_fp_behaviours(&env->vfp.fp_status_a32);
 +    arm_set_default_fp_behaviours(&env->vfp.fp_status_a64);
      arm_set_default_fp_behaviours(&env->vfp.standard_fp_status);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_f16);
      arm_set_default_fp_behaviours(&env->vfp.standard_fp_status_f16);
 diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static uint32_t vfp_get_fpsr_from_host(CPUARMState *env)
      uint32_t i;
      i = get_float_exception_flags(&env->vfp.fp_status);
 +    i |= get_float_exception_flags(&env->vfp.fp_status_a32);
 +    i |= get_float_exception_flags(&env->vfp.fp_status_a64);
      i |= get_float_exception_flags(&env->vfp.standard_fp_status);
      /* FZ16 does not generate an input denormal exception.  */
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16)
@@ -XXX,XX +XXX,XX @@ static void vfp_clear_float_status_exc_flags(CPUARMState *env)
       * be the architecturally up-to-date exception flag information first.
       */
      set_float_exception_flags(0, &env->vfp.fp_status);
 +    set_float_exception_flags(0, &env->vfp.fp_status_a32);
 +    set_float_exception_flags(0, &env->vfp.fp_status_a64);
      set_float_exception_flags(0, &env->vfp.fp_status_f16);
      set_float_exception_flags(0, &env->vfp.standard_fp_status);
      set_float_exception_flags(0, &env->vfp.standard_fp_status_f16);
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
              break;
          }
          set_float_rounding_mode(i, &env->vfp.fp_status);
 +        set_float_rounding_mode(i, &env->vfp.fp_status_a32);
 +        set_float_rounding_mode(i, &env->vfp.fp_status_a64);
          set_float_rounding_mode(i, &env->vfp.fp_status_f16);
      }
      if (changed & FPCR_FZ16) {
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
          bool ftz_enabled = val & FPCR_FZ;
          set_flush_to_zero(ftz_enabled, &env->vfp.fp_status);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status);
 +        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_a32);
 +        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_a32);
 +        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_a64);
 +        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_a64);
      }
      if (changed & FPCR_DN) {
          bool dnan_enabled = val & FPCR_DN;
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status);
 +        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a32);
 +        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a64);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16);
      }
  }
-+static inline bool isar_feature_aa64_tgran4_lpa2(const ARMISARegisters *id)
-+{
-+    return FIELD_SEX64(id->id_aa64mmfr0, ID_AA64MMFR0, TGRAN4) >= 1;
-+}
-+
-+static inline bool isar_feature_aa64_tgran4_2_lpa2(const ARMISARegisters *id)
-+{
-+    unsigned t = FIELD_EX64(id->id_aa64mmfr0, ID_AA64MMFR0, TGRAN4_2);
-+    return t >= 3 || (t == 0 && isar_feature_aa64_tgran4_lpa2(id));
-+}
-+
-+static inline bool isar_feature_aa64_tgran16_lpa2(const ARMISARegisters *id)
-+{
-+    return FIELD_EX64(id->id_aa64mmfr0, ID_AA64MMFR0, TGRAN16) >= 2;
-+}
-+
-+static inline bool isar_feature_aa64_tgran16_2_lpa2(const ARMISARegisters *id)
-+{
-+    unsigned t = FIELD_EX64(id->id_aa64mmfr0, ID_AA64MMFR0, TGRAN16_2);
-+    return t >= 3 || (t == 0 && isar_feature_aa64_tgran16_lpa2(id));
-+}
-+
- static inline bool isar_feature_aa64_ccidx(const ARMISARegisters *id)
- {
-     return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, CCIDX) != 0;
-diff --git a/target/arm/internals.h b/target/arm/internals.h
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/internals.h
-+++ b/target/arm/internals.h
-@@ -XXX,XX +XXX,XX @@ static inline uint32_t aarch64_pstate_valid_mask(const ARMISARegisters *id)
- typedef struct ARMVAParameters {
-     unsigned tsz    : 8;
-     unsigned ps     : 3;
-+    unsigned sh     : 2;
-     unsigned select : 1;
-     bool tbi        : 1;
-     bool epd        : 1;
-@@ -XXX,XX +XXX,XX @@ typedef struct ARMVAParameters {
-     bool using16k   : 1;
-     bool using64k   : 1;
-     bool tsz_oob    : 1;  /* tsz has been clamped to legal range */
-+    bool ds         : 1;
- } ARMVAParameters;
- ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-diff --git a/target/arm/helper.c b/target/arm/helper.c
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
-+++ b/target/arm/helper.c
-@@ -XXX,XX +XXX,XX @@ static TLBIRange tlbi_aa64_get_range(CPUARMState *env, ARMMMUIdx mmuidx,
-     } else {
-         ret.base = extract64(value, 0, 37);
-     }
-+    if (param.ds) {
-+        /*
-+         * With DS=1, BaseADDR is always shifted 16 so that it is able
-+         * to address all 52 va bits.  The input address is perforce
-+         * aligned on a 64k boundary regardless of translation granule.
-+         */
-+        page_shift = 16;
-+    }
-     ret.base <<= page_shift;
-     return ret;
-@@ -XXX,XX +XXX,XX @@ static bool check_s2_mmu_setup(ARMCPU *cpu, bool is_aa64, int level,
-     const int grainsize = stride + 3;
-     int startsizecheck;
--    /* Negative levels are never allowed.  */
--    if (level < 0) {
-+    /*
-+     * Negative levels are usually not allowed...
-+     * Except for FEAT_LPA2, 4k page table, 52-bit address space, which
-+     * begins with level -1.  Note that previous feature tests will have
-+     * eliminated this combination if it is not enabled.
-+     */
-+    if (level < (inputsize == 52 && stride == 9 ? -1 : 0)) {
-         return false;
-     }
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-                                    ARMMMUIdx mmu_idx, bool data)
- {
-     uint64_t tcr = regime_tcr(env, mmu_idx)->raw_tcr;
--    bool epd, hpd, using16k, using64k, tsz_oob;
--    int select, tsz, tbi, max_tsz, min_tsz, ps;
-+    bool epd, hpd, using16k, using64k, tsz_oob, ds;
-+    int select, tsz, tbi, max_tsz, min_tsz, ps, sh;
-+    ARMCPU *cpu = env_archcpu(env);
-     if (!regime_has_2_ranges(mmu_idx)) {
-         select = 0;
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-             hpd = extract32(tcr, 24, 1);
-         }
-         epd = false;
-+        sh = extract32(tcr, 12, 2);
-         ps = extract32(tcr, 16, 3);
-+        ds = extract64(tcr, 32, 1);
-     } else {
-         /*
-          * Bit 55 is always between the two regions, and is canonical for
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-         if (!select) {
-             tsz = extract32(tcr, 0, 6);
-             epd = extract32(tcr, 7, 1);
-+            sh = extract32(tcr, 12, 2);
-             using64k = extract32(tcr, 14, 1);
-             using16k = extract32(tcr, 15, 1);
-             hpd = extract64(tcr, 41, 1);
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-             using64k = tg == 3;
-             tsz = extract32(tcr, 16, 6);
-             epd = extract32(tcr, 23, 1);
-+            sh = extract32(tcr, 28, 2);
-             hpd = extract64(tcr, 42, 1);
-         }
-         ps = extract64(tcr, 32, 3);
-+        ds = extract64(tcr, 59, 1);
-     }
--    if (cpu_isar_feature(aa64_st, env_archcpu(env))) {
-+    if (cpu_isar_feature(aa64_st, cpu)) {
-         max_tsz = 48 - using64k;
-     } else {
-         max_tsz = 39;
-     }
-+    /*
-+     * DS is RES0 unless FEAT_LPA2 is supported for the given page size;
-+     * adjust the effective value of DS, as documented.
-+     */
-     min_tsz = 16;
-     if (using64k) {
--        if (cpu_isar_feature(aa64_lva, env_archcpu(env))) {
-+        if (cpu_isar_feature(aa64_lva, cpu)) {
-+            min_tsz = 12;
-+        }
-+        ds = false;
-+    } else if (ds) {
-+        switch (mmu_idx) {
-+        case ARMMMUIdx_Stage2:
-+        case ARMMMUIdx_Stage2_S:
-+            if (using16k) {
-+                ds = cpu_isar_feature(aa64_tgran16_2_lpa2, cpu);
-+            } else {
-+                ds = cpu_isar_feature(aa64_tgran4_2_lpa2, cpu);
-+            }
-+            break;
-+        default:
-+            if (using16k) {
-+                ds = cpu_isar_feature(aa64_tgran16_lpa2, cpu);
-+            } else {
-+                ds = cpu_isar_feature(aa64_tgran4_lpa2, cpu);
-+            }
-+            break;
-+        }
-+        if (ds) {
-             min_tsz = 12;
-         }
-     }
--    /* TODO: FEAT_LPA2 */
-     if (tsz > max_tsz) {
-         tsz = max_tsz;
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-     return (ARMVAParameters) {
-         .tsz = tsz,
-         .ps = ps,
-+        .sh = sh,
-         .select = select,
-         .tbi = tbi,
-         .epd = epd,
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
-         .using16k = using16k,
-         .using64k = using64k,
-         .tsz_oob = tsz_oob,
-+        .ds = ds,
-     };
- }
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
-          * VTCR_EL2.SL0 field (whose interpretation depends on the page size)
-          */
-         uint32_t sl0 = extract32(tcr->raw_tcr, 6, 2);
-+        uint32_t sl2 = extract64(tcr->raw_tcr, 33, 1);
-         uint32_t startlevel;
-         bool ok;
--        if (!aarch64 || stride == 9) {
-+        /* SL2 is RES0 unless DS=1 & 4kb granule. */
-+        if (param.ds && stride == 9 && sl2) {
-+            if (sl0 != 0) {
-+                level = 0;
-+                fault_type = ARMFault_Translation;
-+                goto do_fault;
-+            }
-+            startlevel = -1;
-+        } else if (!aarch64 || stride == 9) {
-             /* AArch32 or 4KB pages */
-             startlevel = 2 - sl0;
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
-      * for both v7 and v8.  However, for v8 the SBZ bits [47:40] must be 0
-      * or an AddressSize fault is raised.  So for v8 we extract those SBZ
-      * bits as part of the address, which will be checked via outputsize.
--     * For AArch64, the address field always goes up to bit 47 (with extra
--     * bits for FEAT_LPA placed elsewhere).  AArch64 implies v8.
-+     * For AArch64, the address field goes up to bit 47, or 49 with FEAT_LPA2;
-+     * the highest bits of a 52-bit output are placed elsewhere.
-      */
--    if (arm_feature(env, ARM_FEATURE_V8)) {
-+    if (param.ds) {
-+        descaddrmask = MAKE_64BIT_MASK(0, 50);
-+    } else if (arm_feature(env, ARM_FEATURE_V8)) {
-         descaddrmask = MAKE_64BIT_MASK(0, 48);
-     } else {
-         descaddrmask = MAKE_64BIT_MASK(0, 40);
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
-         /*
-          * For FEAT_LPA and PS=6, bits [51:48] of descaddr are in [15:12]
--         * of descriptor.  Otherwise, if descaddr is out of range, raise
--         * AddressSizeFault.
-+         * of descriptor.  For FEAT_LPA2 and effective DS, bits [51:50] of
-+         * descaddr are in [9:8].  Otherwise, if descaddr is out of range,
-+         * raise AddressSizeFault.
-          */
-         if (outputsize > 48) {
--            descaddr |= extract64(descriptor, 12, 4) << 48;
-+            if (param.ds) {
-+                descaddr |= extract64(descriptor, 8, 2) << 50;
-+            } else {
-+                descaddr |= extract64(descriptor, 12, 4) << 48;
-+            }
-         } else if (descaddr >> outputsize) {
-             fault_type = ARMFault_AddressSize;
-             goto do_fault;
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
-         assert(attrindx <= 7);
-         cacheattrs->attrs = extract64(mair, attrindx * 8, 8);
-     }
--    cacheattrs->shareability = extract32(attrs, 6, 2);
-+
-+    /*
-+     * For FEAT_LPA2 and effective DS, the SH field in the attributes
-+     * was re-purposed for output address bits.  The SH attribute in
-+     * that case comes from TCR_ELx, which we extracted earlier.
-+     */
-+    if (param.ds) {
-+        cacheattrs->shareability = param.sh;
-+    } else {
-+        cacheattrs->shareability = extract32(attrs, 6, 2);
-+    }
-     *phys_ptr = descaddr;
-     *page_size_ptr = page_size;
 --
-.25.1
+.34.1

-New patch
+[PULL 18/36] target/arm: Use vfp.fp_status_a64 in A64-only helper functions
+Switch from vfp.fp_status to vfp.fp_status_a64 for helpers which:
+ * directly reference an fp_status field
+ * are called only from the A64 decoder
+ * are not called inside a set_rmode/restore_rmode sequence
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Message-id: 20250124162836.2332150-8-peter.maydell@linaro.org
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+---
+ target/arm/tcg/sme_helper.c | 2 +-
+ target/arm/tcg/vec_helper.c | 8 ++++----
+files changed, 5 insertions(+), 5 deletions(-)
+diff --git a/target/arm/tcg/sme_helper.c b/target/arm/tcg/sme_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/sme_helper.c
++++ b/target/arm/tcg/sme_helper.c
+@@ -XXX,XX +XXX,XX @@ void HELPER(sme_fmopa_h)(void *vza, void *vzn, void *vzm, void *vpn,
+      * round-to-odd -- see above.
+      */
+     fpst_f16 = env->vfp.fp_status_f16;
+-    fpst_std = env->vfp.fp_status;
++    fpst_std = env->vfp.fp_status_a64;
+     set_default_nan_mode(true, &fpst_std);
+     set_default_nan_mode(true, &fpst_f16);
+     fpst_odd = fpst_std;
+diff --git a/target/arm/tcg/vec_helper.c b/target/arm/tcg/vec_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/vec_helper.c
++++ b/target/arm/tcg/vec_helper.c
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_a32)(void *vd, void *vn, void *vm,
+ void HELPER(gvec_fmlal_a64)(void *vd, void *vn, void *vm,
+                             CPUARMState *env, uint32_t desc)
+ {
+-    do_fmlal(vd, vn, vm, &env->vfp.fp_status, desc,
++    do_fmlal(vd, vn, vm, &env->vfp.fp_status_a64, desc,
+              get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
+ }
+@@ -XXX,XX +XXX,XX @@ void HELPER(sve2_fmlal_zzzw_s)(void *vd, void *vn, void *vm, void *va,
+     intptr_t i, oprsz = simd_oprsz(desc);
+     uint16_t negn = extract32(desc, SIMD_DATA_SHIFT, 1) << 15;
+     intptr_t sel = extract32(desc, SIMD_DATA_SHIFT + 1, 1) * sizeof(float16);
+-    float_status *status = &env->vfp.fp_status;
++    float_status *status = &env->vfp.fp_status_a64;
+     bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16);
+     for (i = 0; i < oprsz; i += sizeof(float32)) {
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_idx_a32)(void *vd, void *vn, void *vm,
+ void HELPER(gvec_fmlal_idx_a64)(void *vd, void *vn, void *vm,
+                                 CPUARMState *env, uint32_t desc)
+ {
+-    do_fmlal_idx(vd, vn, vm, &env->vfp.fp_status, desc,
++    do_fmlal_idx(vd, vn, vm, &env->vfp.fp_status_a64, desc,
+                  get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
+ }
+@@ -XXX,XX +XXX,XX @@ void HELPER(sve2_fmlal_zzxw_s)(void *vd, void *vn, void *vm, void *va,
+     uint16_t negn = extract32(desc, SIMD_DATA_SHIFT, 1) << 15;
+     intptr_t sel = extract32(desc, SIMD_DATA_SHIFT + 1, 1) * sizeof(float16);
+     intptr_t idx = extract32(desc, SIMD_DATA_SHIFT + 2, 3) * sizeof(float16);
+-    float_status *status = &env->vfp.fp_status;
++    float_status *status = &env->vfp.fp_status_a64;
+     bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16);
+     for (i = 0; i < oprsz; i += 16) {
+--
+.34.1

-New patch
+[PULL 19/36] target/arm: Use fp_status_a64 or fp_status_a32 in is_ebf()
+In is_ebf(), we might be called for A64 or A32, but we have
+the CPUARMState* so we can select fp_status_a64 or
+fp_status_a32 accordingly.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+---
+ target/arm/tcg/vec_helper.c | 2 +-
+file changed, 1 insertion(+), 1 deletion(-)
+diff --git a/target/arm/tcg/vec_helper.c b/target/arm/tcg/vec_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/vec_helper.c
++++ b/target/arm/tcg/vec_helper.c
+@@ -XXX,XX +XXX,XX @@ bool is_ebf(CPUARMState *env, float_status *statusp, float_status *oddstatusp)
+      */
+     bool ebf = is_a64(env) && env->vfp.fpcr & FPCR_EBF;
+-    *statusp = env->vfp.fp_status;
++    *statusp = is_a64(env) ? env->vfp.fp_status_a64 : env->vfp.fp_status_a32;
+     set_default_nan_mode(true, statusp);
+     if (ebf) {
+--
+.34.1

-New patch
+[PULL 20/36] target/arm: Use fp_status_a32 in vjcvt helper
+Use fp_status_a32 in the vjcvt helper function; this is called only
+from the A32/T32 decoder and is not used inside a
+set_rmode/restore_rmode sequence.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-9-peter.maydell@linaro.org
+---
+ target/arm/vfp_helper.c | 2 +-
+file changed, 1 insertion(+), 1 deletion(-)
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/vfp_helper.c
++++ b/target/arm/vfp_helper.c
+@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(fjcvtzs)(float64 value, float_status *status)
+ uint32_t HELPER(vjcvt)(float64 value, CPUARMState *env)
+ {
+-    uint64_t pair = HELPER(fjcvtzs)(value, &env->vfp.fp_status);
++    uint64_t pair = HELPER(fjcvtzs)(value, &env->vfp.fp_status_a32);
+     uint32_t result = pair;
+     uint32_t z = (pair >> 32) == 0;
+--
+.34.1

-New patch
+[PULL 21/36] target/arm: Use fp_status_a32 in vfp_cmp helpers
+The helpers vfp_cmps, vfp_cmpes, vfp_cmpd, vfp_cmped are used only from
+the A32 decoder; the A64 decoder uses separate vfp_cmps_a64 etc helpers
+(because for A64 we update the main NZCV flags and for A32 we update
+the FPSCR NZCV flags). So we can make these helpers use the fp_status_a32
+field instead of fp_status.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-10-peter.maydell@linaro.org
+---
+ target/arm/vfp_helper.c | 4 ++--
+file changed, 2 insertions(+), 2 deletions(-)
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/vfp_helper.c
++++ b/target/arm/vfp_helper.c
+@@ -XXX,XX +XXX,XX @@ void VFP_HELPER(cmpe, P)(ARGTYPE a, ARGTYPE b, CPUARMState *env) \
+         FLOATTYPE ## _compare(a, b, &env->vfp.FPST)); \
+ }
+ DO_VFP_cmp(h, float16, dh_ctype_f16, fp_status_f16)
+-DO_VFP_cmp(s, float32, float32, fp_status)
+-DO_VFP_cmp(d, float64, float64, fp_status)
++DO_VFP_cmp(s, float32, float32, fp_status_a32)
++DO_VFP_cmp(d, float64, float64, fp_status_a32)
+ #undef DO_VFP_cmp
+ /* Integer to float and float to integer conversions */
+--
+.34.1

-New patch
+[PULL 22/36] target/arm: Use FPST_A32 in A32 decoder
+In the A32 decoder, use FPST_A32 rather than FPST_FPCR.  By
+doing an automated conversion of the whole file we avoid possibly
+using more than one fpst value in a set_rmode/op/restore_rmode
+sequence.
+Patch created with
+  perl -p -i -e 's/FPST_FPCR(?!_)/FPST_A32/g' target/arm/tcg/translate-vfp.c
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-11-peter.maydell@linaro.org
+---
+ target/arm/tcg/translate-vfp.c | 54 +++++++++++++++++-----------------
+file changed, 27 insertions(+), 27 deletions(-)
+diff --git a/target/arm/tcg/translate-vfp.c b/target/arm/tcg/translate-vfp.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/translate-vfp.c
++++ b/target/arm/tcg/translate-vfp.c
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a)
+     if (sz == 1) {
+         fpst = fpstatus_ptr(FPST_FPCR_F16);
+     } else {
+-        fpst = fpstatus_ptr(FPST_FPCR);
++        fpst = fpstatus_ptr(FPST_A32);
+     }
+     tcg_rmode = gen_set_rmode(rounding, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT(DisasContext *s, arg_VCVT *a)
+     if (sz == 1) {
+         fpst = fpstatus_ptr(FPST_FPCR_F16);
+     } else {
+-        fpst = fpstatus_ptr(FPST_FPCR);
++        fpst = fpstatus_ptr(FPST_A32);
+     }
+     tcg_shift = tcg_constant_i32(0);
+@@ -XXX,XX +XXX,XX @@ static bool do_vfp_3op_sp(DisasContext *s, VFPGen3OpSPFn *fn,
+     f0 = tcg_temp_new_i32();
+     f1 = tcg_temp_new_i32();
+     fd = tcg_temp_new_i32();
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     vfp_load_reg32(f0, vn);
+     vfp_load_reg32(f1, vm);
+@@ -XXX,XX +XXX,XX @@ static bool do_vfp_3op_dp(DisasContext *s, VFPGen3OpDPFn *fn,
+     f0 = tcg_temp_new_i64();
+     f1 = tcg_temp_new_i64();
+     fd = tcg_temp_new_i64();
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     vfp_load_reg64(f0, vn);
+     vfp_load_reg64(f1, vm);
+@@ -XXX,XX +XXX,XX @@ static bool do_vfm_sp(DisasContext *s, arg_VFMA_sp *a, bool neg_n, bool neg_d)
+         /* VFNMA, VFNMS */
+         gen_vfp_negs(vd, vd);
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_vfp_muladds(vd, vn, vm, vd, fpst);
+     vfp_store_reg32(vd, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool do_vfm_dp(DisasContext *s, arg_VFMA_dp *a, bool neg_n, bool neg_d)
+         /* VFNMA, VFNMS */
+         gen_vfp_negd(vd, vd);
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_vfp_muladdd(vd, vn, vm, vd, fpst);
+     vfp_store_reg64(vd, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static void gen_VSQRT_hp(TCGv_i32 vd, TCGv_i32 vm)
+ static void gen_VSQRT_sp(TCGv_i32 vd, TCGv_i32 vm)
+ {
+-    gen_helper_vfp_sqrts(vd, vm, fpstatus_ptr(FPST_FPCR));
++    gen_helper_vfp_sqrts(vd, vm, fpstatus_ptr(FPST_A32));
+ }
+ static void gen_VSQRT_dp(TCGv_i64 vd, TCGv_i64 vm)
+ {
+-    gen_helper_vfp_sqrtd(vd, vm, fpstatus_ptr(FPST_FPCR));
++    gen_helper_vfp_sqrtd(vd, vm, fpstatus_ptr(FPST_A32));
+ }
+ DO_VFP_2OP(VSQRT, hp, gen_VSQRT_hp, aa32_fp16_arith)
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_f32_f16(DisasContext *s, arg_VCVT_f32_f16 *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     ahp_mode = get_ahp_flag();
+     tmp = tcg_temp_new_i32();
+     /* The T bit tells us if we want the low or high 16 bits of Vm */
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_f64_f16(DisasContext *s, arg_VCVT_f64_f16 *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     ahp_mode = get_ahp_flag();
+     tmp = tcg_temp_new_i32();
+     /* The T bit tells us if we want the low or high 16 bits of Vm */
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_b16_f32(DisasContext *s, arg_VCVT_b16_f32 *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg32(tmp, a->vm);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_f16_f32(DisasContext *s, arg_VCVT_f16_f32 *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     ahp_mode = get_ahp_flag();
+     tmp = tcg_temp_new_i32();
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_f16_f64(DisasContext *s, arg_VCVT_f16_f64 *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     ahp_mode = get_ahp_flag();
+     tmp = tcg_temp_new_i32();
+     vm = tcg_temp_new_i64();
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTR_sp(DisasContext *s, arg_VRINTR_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg32(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_rints(tmp, tmp, fpst);
+     vfp_store_reg32(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTR_dp(DisasContext *s, arg_VRINTR_dp *a)
+     tmp = tcg_temp_new_i64();
+     vfp_load_reg64(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_rintd(tmp, tmp, fpst);
+     vfp_store_reg64(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTZ_sp(DisasContext *s, arg_VRINTZ_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg32(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     tcg_rmode = gen_set_rmode(FPROUNDING_ZERO, fpst);
+     gen_helper_rints(tmp, tmp, fpst);
+     gen_restore_rmode(tcg_rmode, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTZ_dp(DisasContext *s, arg_VRINTZ_dp *a)
+     tmp = tcg_temp_new_i64();
+     vfp_load_reg64(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     tcg_rmode = gen_set_rmode(FPROUNDING_ZERO, fpst);
+     gen_helper_rintd(tmp, tmp, fpst);
+     gen_restore_rmode(tcg_rmode, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTX_sp(DisasContext *s, arg_VRINTX_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg32(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_rints_exact(tmp, tmp, fpst);
+     vfp_store_reg32(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTX_dp(DisasContext *s, arg_VRINTX_dp *a)
+     tmp = tcg_temp_new_i64();
+     vfp_load_reg64(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     gen_helper_rintd_exact(tmp, tmp, fpst);
+     vfp_store_reg64(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_sp(DisasContext *s, arg_VCVT_sp *a)
+     vm = tcg_temp_new_i32();
+     vd = tcg_temp_new_i64();
+     vfp_load_reg32(vm, a->vm);
+-    gen_helper_vfp_fcvtds(vd, vm, fpstatus_ptr(FPST_FPCR));
++    gen_helper_vfp_fcvtds(vd, vm, fpstatus_ptr(FPST_A32));
+     vfp_store_reg64(vd, a->vd);
+     return true;
+ }
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_dp(DisasContext *s, arg_VCVT_dp *a)
+     vd = tcg_temp_new_i32();
+     vm = tcg_temp_new_i64();
+     vfp_load_reg64(vm, a->vm);
+-    gen_helper_vfp_fcvtsd(vd, vm, fpstatus_ptr(FPST_FPCR));
++    gen_helper_vfp_fcvtsd(vd, vm, fpstatus_ptr(FPST_A32));
+     vfp_store_reg32(vd, a->vd);
+     return true;
+ }
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_int_sp(DisasContext *s, arg_VCVT_int_sp *a)
+     vm = tcg_temp_new_i32();
+     vfp_load_reg32(vm, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     if (a->s) {
+         /* i32 -> f32 */
+         gen_helper_vfp_sitos(vm, vm, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_int_dp(DisasContext *s, arg_VCVT_int_dp *a)
+     vm = tcg_temp_new_i32();
+     vd = tcg_temp_new_i64();
+     vfp_load_reg32(vm, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     if (a->s) {
+         /* i32 -> f64 */
+         gen_helper_vfp_sitod(vd, vm, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_fix_sp(DisasContext *s, arg_VCVT_fix_sp *a)
+     vd = tcg_temp_new_i32();
+     vfp_load_reg32(vd, a->vd);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     shift = tcg_constant_i32(frac_bits);
+     /* Switch on op:U:sx bits */
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_fix_dp(DisasContext *s, arg_VCVT_fix_dp *a)
+     vd = tcg_temp_new_i64();
+     vfp_load_reg64(vd, a->vd);
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     shift = tcg_constant_i32(frac_bits);
+     /* Switch on op:U:sx bits */
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_sp_int(DisasContext *s, arg_VCVT_sp_int *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     vm = tcg_temp_new_i32();
+     vfp_load_reg32(vm, a->vm);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_dp_int(DisasContext *s, arg_VCVT_dp_int *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A32);
+     vm = tcg_temp_new_i64();
+     vd = tcg_temp_new_i32();
+     vfp_load_reg64(vm, a->vm);
+--
+.34.1

-New patch
+[PULL 23/36] target/arm: Use FPST_A64 in A64 decoder
+In the A64 decoder, use FPST_A64 rather than FPST_FPCR.  By
+doing an automated conversion of the whole file we avoid possibly
+using more than one fpst value in a set_rmode/op/restore_rmode
+sequence.
+Patch created with
+  perl -p -i -e 's/FPST_FPCR(?!_)/FPST_A64/g' target/arm/tcg/translate-{a64,sve,sme}.c
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-12-peter.maydell@linaro.org
+---
+ target/arm/tcg/translate-a64.c |  70 +++++++++++-----------
+ target/arm/tcg/translate-sme.c |   4 +-
+ target/arm/tcg/translate-sve.c | 106 ++++++++++++++++-----------------
+files changed, 90 insertions(+), 90 deletions(-)
+diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/translate-a64.c
++++ b/target/arm/tcg/translate-a64.c
+@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3_fpst(DisasContext *s, bool is_q, int rd, int rn,
+                               int rm, bool is_fp16, int data,
+                               gen_helper_gvec_3_ptr *fn)
+ {
+-    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
+     tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd),
+                        vec_full_reg_offset(s, rn),
+                        vec_full_reg_offset(s, rm), fpst,
+@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op4_fpst(DisasContext *s, bool is_q, int rd, int rn,
+                               int rm, int ra, bool is_fp16, int data,
+                               gen_helper_gvec_4_ptr *fn)
+ {
+-    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
+     tcg_gen_gvec_4_ptr(vec_full_reg_offset(s, rd),
+                        vec_full_reg_offset(s, rn),
+                        vec_full_reg_offset(s, rm),
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar(DisasContext *s, arg_rrr_e *a, const FPScalar *f)
+         if (fp_access_check(s)) {
+             TCGv_i64 t0 = read_fp_dreg(s, a->rn);
+             TCGv_i64 t1 = read_fp_dreg(s, a->rm);
+-            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_dreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar(DisasContext *s, arg_rrr_e *a, const FPScalar *f)
+         if (fp_access_check(s)) {
+             TCGv_i32 t0 = read_fp_sreg(s, a->rn);
+             TCGv_i32 t1 = read_fp_sreg(s, a->rm);
+-            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_sreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fcmp0_s(DisasContext *s, arg_rr_e *a,
+             TCGv_i64 t0 = read_fp_dreg(s, a->rn);
+             TCGv_i64 t1 = tcg_constant_i64(0);
+             if (swap) {
+-                f->gen_d(t0, t1, t0, fpstatus_ptr(FPST_FPCR));
++                f->gen_d(t0, t1, t0, fpstatus_ptr(FPST_A64));
+             } else {
+-                f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++                f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             }
+             write_fp_dreg(s, a->rd, t0);
+         }
+@@ -XXX,XX +XXX,XX @@ static bool do_fcmp0_s(DisasContext *s, arg_rr_e *a,
+             TCGv_i32 t0 = read_fp_sreg(s, a->rn);
+             TCGv_i32 t1 = tcg_constant_i32(0);
+             if (swap) {
+-                f->gen_s(t0, t1, t0, fpstatus_ptr(FPST_FPCR));
++                f->gen_s(t0, t1, t0, fpstatus_ptr(FPST_A64));
+             } else {
+-                f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++                f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             }
+             write_fp_sreg(s, a->rd, t0);
+         }
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_idx(DisasContext *s, arg_rrx_e *a, const FPScalar *f)
+             TCGv_i64 t1 = tcg_temp_new_i64();
+             read_vec_element(s, t1, a->rm, a->idx, MO_64);
+-            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_dreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_idx(DisasContext *s, arg_rrx_e *a, const FPScalar *f)
+             TCGv_i32 t1 = tcg_temp_new_i32();
+             read_vec_element_i32(s, t1, a->rm, a->idx, MO_32);
+-            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_sreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fmla_scalar_idx(DisasContext *s, arg_rrx_e *a, bool neg)
+             if (neg) {
+                 gen_vfp_negd(t1, t1);
+             }
+-            gen_helper_vfp_muladdd(t0, t1, t2, t0, fpstatus_ptr(FPST_FPCR));
++            gen_helper_vfp_muladdd(t0, t1, t2, t0, fpstatus_ptr(FPST_A64));
+             write_fp_dreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fmla_scalar_idx(DisasContext *s, arg_rrx_e *a, bool neg)
+             if (neg) {
+                 gen_vfp_negs(t1, t1);
+             }
+-            gen_helper_vfp_muladds(t0, t1, t2, t0, fpstatus_ptr(FPST_FPCR));
++            gen_helper_vfp_muladds(t0, t1, t2, t0, fpstatus_ptr(FPST_A64));
+             write_fp_sreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_pair(DisasContext *s, arg_rr_e *a, const FPScalar *f)
+             read_vec_element(s, t0, a->rn, 0, MO_64);
+             read_vec_element(s, t1, a->rn, 1, MO_64);
+-            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_d(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_dreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_pair(DisasContext *s, arg_rr_e *a, const FPScalar *f)
+             read_vec_element_i32(s, t0, a->rn, 0, MO_32);
+             read_vec_element_i32(s, t1, a->rn, 1, MO_32);
+-            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_FPCR));
++            f->gen_s(t0, t0, t1, fpstatus_ptr(FPST_A64));
+             write_fp_sreg(s, a->rd, t0);
+         }
+         break;
+@@ -XXX,XX +XXX,XX @@ static bool do_fmadd(DisasContext *s, arg_rrrr_e *a, bool neg_a, bool neg_n)
+             if (neg_n) {
+                 gen_vfp_negd(tn, tn);
+             }
+-            fpst = fpstatus_ptr(FPST_FPCR);
++            fpst = fpstatus_ptr(FPST_A64);
+             gen_helper_vfp_muladdd(ta, tn, tm, ta, fpst);
+             write_fp_dreg(s, a->rd, ta);
+         }
+@@ -XXX,XX +XXX,XX @@ static bool do_fmadd(DisasContext *s, arg_rrrr_e *a, bool neg_a, bool neg_n)
+             if (neg_n) {
+                 gen_vfp_negs(tn, tn);
+             }
+-            fpst = fpstatus_ptr(FPST_FPCR);
++            fpst = fpstatus_ptr(FPST_A64);
+             gen_helper_vfp_muladds(ta, tn, tm, ta, fpst);
+             write_fp_sreg(s, a->rd, ta);
+         }
+@@ -XXX,XX +XXX,XX @@ static bool do_fp_reduction(DisasContext *s, arg_qrr_e *a,
+     if (fp_access_check(s)) {
+         MemOp esz = a->esz;
+         int elts = (a->q ? 16 : 8) >> esz;
+-        TCGv_ptr fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++        TCGv_ptr fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+         TCGv_i32 res = do_reduction_op(s, a->rn, esz, 0, elts, fpst, fn);
+         write_fp_sreg(s, a->rd, res);
+     }
+@@ -XXX,XX +XXX,XX @@ static void handle_fp_compare(DisasContext *s, int size,
+                               bool cmp_with_zero, bool signal_all_nans)
+ {
+     TCGv_i64 tcg_flags = tcg_temp_new_i64();
+-    TCGv_ptr fpst = fpstatus_ptr(size == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(size == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     if (size == MO_64) {
+         TCGv_i64 tcg_vn, tcg_vm;
+@@ -XXX,XX +XXX,XX @@ static bool do_fp1_scalar(DisasContext *s, arg_rr_e *a,
+         return check == 0;
+     }
+-    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     if (rmode >= 0) {
+         tcg_rmode = gen_set_rmode(rmode, fpst);
+     }
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_ds(DisasContext *s, arg_rr *a)
+     if (fp_access_check(s)) {
+         TCGv_i32 tcg_rn = read_fp_sreg(s, a->rn);
+         TCGv_i64 tcg_rd = tcg_temp_new_i64();
+-        TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+         gen_helper_vfp_fcvtds(tcg_rd, tcg_rn, fpst);
+         write_fp_dreg(s, a->rd, tcg_rd);
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_hs(DisasContext *s, arg_rr *a)
+     if (fp_access_check(s)) {
+         TCGv_i32 tmp = read_fp_sreg(s, a->rn);
+         TCGv_i32 ahp = get_ahp_flag();
+-        TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+         gen_helper_vfp_fcvt_f32_to_f16(tmp, tmp, fpst, ahp);
+         /* write_fp_sreg is OK here because top half of result is zero */
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_sd(DisasContext *s, arg_rr *a)
+     if (fp_access_check(s)) {
+         TCGv_i64 tcg_rn = read_fp_dreg(s, a->rn);
+         TCGv_i32 tcg_rd = tcg_temp_new_i32();
+-        TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+         gen_helper_vfp_fcvtsd(tcg_rd, tcg_rn, fpst);
+         write_fp_sreg(s, a->rd, tcg_rd);
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_hd(DisasContext *s, arg_rr *a)
+         TCGv_i64 tcg_rn = read_fp_dreg(s, a->rn);
+         TCGv_i32 tcg_rd = tcg_temp_new_i32();
+         TCGv_i32 ahp = get_ahp_flag();
+-        TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+         gen_helper_vfp_fcvt_f64_to_f16(tcg_rd, tcg_rn, fpst, ahp);
+         /* write_fp_sreg is OK here because top half of tcg_rd is zero */
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_sh(DisasContext *s, arg_rr *a)
+     if (fp_access_check(s)) {
+         TCGv_i32 tcg_rn = read_fp_hreg(s, a->rn);
+         TCGv_i32 tcg_rd = tcg_temp_new_i32();
+-        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64);
+         TCGv_i32 tcg_ahp = get_ahp_flag();
+         gen_helper_vfp_fcvt_f16_to_f32(tcg_rd, tcg_rn, tcg_fpst, tcg_ahp);
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_dh(DisasContext *s, arg_rr *a)
+     if (fp_access_check(s)) {
+         TCGv_i32 tcg_rn = read_fp_hreg(s, a->rn);
+         TCGv_i64 tcg_rd = tcg_temp_new_i64();
+-        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64);
+         TCGv_i32 tcg_ahp = get_ahp_flag();
+         gen_helper_vfp_fcvt_f16_to_f64(tcg_rd, tcg_rn, tcg_fpst, tcg_ahp);
+@@ -XXX,XX +XXX,XX @@ static bool do_cvtf_scalar(DisasContext *s, MemOp esz, int rd, int shift,
+     TCGv_i32 tcg_shift, tcg_single;
+     TCGv_i64 tcg_double;
+-    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     tcg_shift = tcg_constant_i32(shift);
+     switch (esz) {
+@@ -XXX,XX +XXX,XX @@ static void do_fcvt_scalar(DisasContext *s, MemOp out, MemOp esz,
+     TCGv_ptr tcg_fpstatus;
+     TCGv_i32 tcg_shift, tcg_rmode, tcg_single;
+-    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     tcg_shift = tcg_constant_i32(shift);
+     tcg_rmode = gen_set_rmode(rmode, tcg_fpstatus);
+@@ -XXX,XX +XXX,XX @@ static bool trans_FJCVTZS(DisasContext *s, arg_FJCVTZS *a)
+     }
+     if (fp_access_check(s)) {
+         TCGv_i64 t = read_fp_dreg(s, a->rn);
+-        TCGv_ptr fpstatus = fpstatus_ptr(FPST_FPCR);
++        TCGv_ptr fpstatus = fpstatus_ptr(FPST_A64);
+         gen_helper_fjcvtzs(t, t, fpstatus);
+@@ -XXX,XX +XXX,XX @@ static void gen_fcvtxn_sd(TCGv_i64 d, TCGv_i64 n)
+      * with von Neumann rounding (round to odd)
+      */
+     TCGv_i32 tmp = tcg_temp_new_i32();
+-    gen_helper_fcvtx_f64_to_f32(tmp, n, fpstatus_ptr(FPST_FPCR));
++    gen_helper_fcvtx_f64_to_f32(tmp, n, fpstatus_ptr(FPST_A64));
+     tcg_gen_extu_i32_i64(d, tmp);
+ }
+@@ -XXX,XX +XXX,XX @@ static void gen_fcvtn_hs(TCGv_i64 d, TCGv_i64 n)
+ {
+     TCGv_i32 tcg_lo = tcg_temp_new_i32();
+     TCGv_i32 tcg_hi = tcg_temp_new_i32();
+-    TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+     TCGv_i32 ahp = get_ahp_flag();
+     tcg_gen_extr_i64_i32(tcg_lo, tcg_hi, n);
+@@ -XXX,XX +XXX,XX @@ static void gen_fcvtn_hs(TCGv_i64 d, TCGv_i64 n)
+ static void gen_fcvtn_sd(TCGv_i64 d, TCGv_i64 n)
+ {
+     TCGv_i32 tmp = tcg_temp_new_i32();
+-    TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+     gen_helper_vfp_fcvtsd(tmp, n, fpst);
+     tcg_gen_extu_i32_i64(d, tmp);
+@@ -XXX,XX +XXX,XX @@ TRANS(FCVTXN_v, do_2misc_narrow_vector, a, f_scalar_fcvtxn)
+ static void gen_bfcvtn_hs(TCGv_i64 d, TCGv_i64 n)
+ {
+-    TCGv_ptr fpst = fpstatus_ptr(FPST_FPCR);
++    TCGv_ptr fpst = fpstatus_ptr(FPST_A64);
+     TCGv_i32 tmp = tcg_temp_new_i32();
+     gen_helper_bfcvt_pair(tmp, n, fpst);
+     tcg_gen_extu_i32_i64(d, tmp);
+@@ -XXX,XX +XXX,XX @@ static bool do_fp1_vector(DisasContext *s, arg_qrr_e *a,
+         return check == 0;
+     }
+-    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     if (rmode >= 0) {
+         tcg_rmode = gen_set_rmode(rmode, fpst);
+     }
+@@ -XXX,XX +XXX,XX @@ static bool do_gvec_op2_fpst(DisasContext *s, MemOp esz, bool is_q,
+         return check == 0;
+     }
+-    fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     tcg_gen_gvec_2_ptr(vec_full_reg_offset(s, rd),
+                        vec_full_reg_offset(s, rn), fpst,
+                        is_q ? 16 : 8, vec_full_reg_size(s),
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVTL_v(DisasContext *s, arg_qrr_e *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR);
++    fpst = fpstatus_ptr(FPST_A64);
+     if (a->esz == MO_64) {
+         /* 32 -> 64 bit fp conversion */
+         TCGv_i64 tcg_res[2];
+diff --git a/target/arm/tcg/translate-sme.c b/target/arm/tcg/translate-sme.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/translate-sme.c
++++ b/target/arm/tcg/translate-sme.c
+@@ -XXX,XX +XXX,XX @@ static bool do_outprod_env(DisasContext *s, arg_op *a, MemOp esz,
+ TRANS_FEAT(FMOPA_h, aa64_sme, do_outprod_env, a,
+            MO_32, gen_helper_sme_fmopa_h)
+ TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a,
+-           MO_32, FPST_FPCR, gen_helper_sme_fmopa_s)
++           MO_32, FPST_A64, gen_helper_sme_fmopa_s)
+ TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a,
+-           MO_64, FPST_FPCR, gen_helper_sme_fmopa_d)
++           MO_64, FPST_A64, gen_helper_sme_fmopa_d)
+ TRANS_FEAT(BFMOPA, aa64_sme, do_outprod_env, a, MO_32, gen_helper_sme_bfmopa)
+diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/translate-sve.c
++++ b/target/arm/tcg/translate-sve.c
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zz(DisasContext *s, gen_helper_gvec_2_ptr *fn,
+                                  arg_rr_esz *a, int data)
+ {
+     return gen_gvec_fpst_zz(s, fn, a->rd, a->rn, data,
+-                            a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++                            a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+ }
+ /* Invoke an out-of-line helper on 3 Zregs. */
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zzz(DisasContext *s, gen_helper_gvec_3_ptr *fn,
+                                   arg_rrr_esz *a, int data)
+ {
+     return gen_gvec_fpst_zzz(s, fn, a->rd, a->rn, a->rm, data,
+-                             a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++                             a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+ }
+ /* Invoke an out-of-line helper on 4 Zregs. */
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zpzz(DisasContext *s, gen_helper_gvec_4_ptr *fn,
+                                    arg_rprr_esz *a)
+ {
+     return gen_gvec_fpst_zzzp(s, fn, a->rd, a->rn, a->rm, a->pg, 0,
+-                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+ }
+ /* Invoke a vector expander on two Zregs and an immediate.  */
+@@ -XXX,XX +XXX,XX @@ static bool do_FMLA_zzxz(DisasContext *s, arg_rrxr_esz *a, bool sub)
+     };
+     return gen_gvec_fpst_zzzz(s, fns[a->esz], a->rd, a->rn, a->rm, a->ra,
+                               (a->index << 1) | sub,
+-                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+ }
+ TRANS_FEAT(FMLA_zzxz, aa64_sve, do_FMLA_zzxz, a, false)
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const fmul_idx_fns[4] = {
+ };
+ TRANS_FEAT(FMUL_zzx, aa64_sve, gen_gvec_fpst_zzz,
+            fmul_idx_fns[a->esz], a->rd, a->rn, a->rm, a->index,
+-           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ /*
+  *** SVE Floating Point Fast Reduction Group
+@@ -XXX,XX +XXX,XX @@ static bool do_reduce(DisasContext *s, arg_rpr_esz *a,
+     tcg_gen_addi_ptr(t_zn, tcg_env, vec_full_reg_offset(s, a->rn));
+     tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, a->pg));
+-    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     fn(temp, t_zn, t_pg, status, t_desc);
+@@ -XXX,XX +XXX,XX @@ static bool do_ppz_fp(DisasContext *s, arg_rpr_esz *a,
+     if (sve_access_check(s)) {
+         unsigned vsz = vec_full_reg_size(s);
+         TCGv_ptr status =
+-            fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++            fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+         tcg_gen_gvec_3_ptr(pred_full_reg_offset(s, a->rd),
+                            vec_full_reg_offset(s, a->rn),
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const ftmad_fns[4] = {
+ };
+ TRANS_FEAT_NONSTREAMING(FTMAD, aa64_sve, gen_gvec_fpst_zzz,
+                         ftmad_fns[a->esz], a->rd, a->rn, a->rm, a->imm,
+-                        a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++                        a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ /*
+  *** SVE Floating Point Accumulating Reduction Group
+@@ -XXX,XX +XXX,XX @@ static bool trans_FADDA(DisasContext *s, arg_rprr_esz *a)
+     t_pg = tcg_temp_new_ptr();
+     tcg_gen_addi_ptr(t_rm, tcg_env, vec_full_reg_offset(s, a->rm));
+     tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, a->pg));
+-    t_fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    t_fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     t_desc = tcg_constant_i32(simd_desc(vsz, vsz, 0));
+     fns[a->esz - 1](t_val, t_val, t_rm, t_pg, t_fpst, t_desc);
+@@ -XXX,XX +XXX,XX @@ static void do_fp_scalar(DisasContext *s, int zd, int zn, int pg, bool is_fp16,
+     tcg_gen_addi_ptr(t_zn, tcg_env, vec_full_reg_offset(s, zn));
+     tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, pg));
+-    status = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_FPCR);
++    status = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
+     desc = tcg_constant_i32(simd_desc(vsz, vsz, 0));
+     fn(t_zd, t_zn, t_pg, scalar, status, desc);
+ }
+@@ -XXX,XX +XXX,XX @@ static bool do_fp_cmp(DisasContext *s, arg_rprr_esz *a,
+     }
+     if (sve_access_check(s)) {
+         unsigned vsz = vec_full_reg_size(s);
+-        TCGv_ptr status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++        TCGv_ptr status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+         tcg_gen_gvec_4_ptr(pred_full_reg_offset(s, a->rd),
+                            vec_full_reg_offset(s, a->rn),
+                            vec_full_reg_offset(s, a->rm),
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_4_ptr * const fcadd_fns[] = {
+ };
+ TRANS_FEAT(FCADD, aa64_sve, gen_gvec_fpst_zzzp, fcadd_fns[a->esz],
+            a->rd, a->rn, a->rm, a->pg, a->rot,
+-           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ #define DO_FMLA(NAME, name) \
+     static gen_helper_gvec_5_ptr * const name##_fns[4] = {              \
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FCADD, aa64_sve, gen_gvec_fpst_zzzp, fcadd_fns[a->esz],
+     };                                                                  \
+     TRANS_FEAT(NAME, aa64_sve, gen_gvec_fpst_zzzzp, name##_fns[a->esz], \
+                a->rd, a->rn, a->rm, a->ra, a->pg, 0,                    \
+-               a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++               a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ DO_FMLA(FMLA_zpzzz, fmla_zpzzz)
+ DO_FMLA(FMLS_zpzzz, fmls_zpzzz)
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_5_ptr * const fcmla_fns[4] = {
+ };
+ TRANS_FEAT(FCMLA_zpzzz, aa64_sve, gen_gvec_fpst_zzzzp, fcmla_fns[a->esz],
+            a->rd, a->rn, a->rm, a->ra, a->pg, a->rot,
+-           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ static gen_helper_gvec_4_ptr * const fcmla_idx_fns[4] = {
+     NULL, gen_helper_gvec_fcmlah_idx, gen_helper_gvec_fcmlas_idx, NULL
+ };
+ TRANS_FEAT(FCMLA_zzxz, aa64_sve, gen_gvec_fpst_zzzz, fcmla_idx_fns[a->esz],
+            a->rd, a->rn, a->rm, a->ra, a->index * 4 + a->rot,
+-           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ /*
+  *** SVE Floating Point Unary Operations Predicated Group
+  */
+ TRANS_FEAT(FCVT_sh, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_sh, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_sh, a, 0, FPST_A64)
+ TRANS_FEAT(FCVT_hs, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_hs, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_hs, a, 0, FPST_A64)
+ TRANS_FEAT(BFCVT, aa64_sve_bf16, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_bfcvt, a, 0, FPST_FPCR)
++           gen_helper_sve_bfcvt, a, 0, FPST_A64)
+ TRANS_FEAT(FCVT_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_dh, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_dh, a, 0, FPST_A64)
+ TRANS_FEAT(FCVT_hd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_hd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_hd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVT_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_ds, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_ds, a, 0, FPST_A64)
+ TRANS_FEAT(FCVT_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvt_sd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvt_sd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZS_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_fcvtzs_hh, a, 0, FPST_FPCR_F16)
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FCVTZU_hd, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_fcvtzu_hd, a, 0, FPST_FPCR_F16)
+ TRANS_FEAT(FCVTZS_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzs_ss, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzs_ss, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZU_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzu_ss, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzu_ss, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZS_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzs_sd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzs_sd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZU_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzu_sd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzu_sd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZS_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzs_ds, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzs_ds, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZU_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzu_ds, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzu_ds, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZS_dd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzs_dd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzs_dd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTZU_dd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_fcvtzu_dd, a, 0, FPST_FPCR)
++           gen_helper_sve_fcvtzu_dd, a, 0, FPST_A64)
+ static gen_helper_gvec_3_ptr * const frint_fns[] = {
+     NULL,
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frint_fns[] = {
+     gen_helper_sve_frint_d
+ };
+ TRANS_FEAT(FRINTI, aa64_sve, gen_gvec_fpst_arg_zpz, frint_fns[a->esz],
+-           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ static gen_helper_gvec_3_ptr * const frintx_fns[] = {
+     NULL,
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frintx_fns[] = {
+     gen_helper_sve_frintx_d
+ };
+ TRANS_FEAT(FRINTX, aa64_sve, gen_gvec_fpst_arg_zpz, frintx_fns[a->esz],
+-           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+ static bool do_frint_mode(DisasContext *s, arg_rpr_esz *a,
+                           ARMFPRounding mode, gen_helper_gvec_3_ptr *fn)
+@@ -XXX,XX +XXX,XX @@ static bool do_frint_mode(DisasContext *s, arg_rpr_esz *a,
+     }
+     vsz = vec_full_reg_size(s);
+-    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR);
++    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
+     tmode = gen_set_rmode(mode, status);
+     tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, a->rd),
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frecpx_fns[] = {
+     gen_helper_sve_frecpx_s, gen_helper_sve_frecpx_d,
+ };
+ TRANS_FEAT(FRECPX, aa64_sve, gen_gvec_fpst_arg_zpz, frecpx_fns[a->esz],
+-           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ static gen_helper_gvec_3_ptr * const fsqrt_fns[] = {
+     NULL,                   gen_helper_sve_fsqrt_h,
+     gen_helper_sve_fsqrt_s, gen_helper_sve_fsqrt_d,
+ };
+ TRANS_FEAT(FSQRT, aa64_sve, gen_gvec_fpst_arg_zpz, fsqrt_fns[a->esz],
+-           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ TRANS_FEAT(SCVTF_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_scvt_hh, a, 0, FPST_FPCR_F16)
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(SCVTF_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_scvt_dh, a, 0, FPST_FPCR_F16)
+ TRANS_FEAT(SCVTF_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_scvt_ss, a, 0, FPST_FPCR)
++           gen_helper_sve_scvt_ss, a, 0, FPST_A64)
+ TRANS_FEAT(SCVTF_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_scvt_ds, a, 0, FPST_FPCR)
++           gen_helper_sve_scvt_ds, a, 0, FPST_A64)
+ TRANS_FEAT(SCVTF_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_scvt_sd, a, 0, FPST_FPCR)
++           gen_helper_sve_scvt_sd, a, 0, FPST_A64)
+ TRANS_FEAT(SCVTF_dd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_scvt_dd, a, 0, FPST_FPCR)
++           gen_helper_sve_scvt_dd, a, 0, FPST_A64)
+ TRANS_FEAT(UCVTF_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_ucvt_hh, a, 0, FPST_FPCR_F16)
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(UCVTF_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
+            gen_helper_sve_ucvt_dh, a, 0, FPST_FPCR_F16)
+ TRANS_FEAT(UCVTF_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_ucvt_ss, a, 0, FPST_FPCR)
++           gen_helper_sve_ucvt_ss, a, 0, FPST_A64)
+ TRANS_FEAT(UCVTF_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_ucvt_ds, a, 0, FPST_FPCR)
++           gen_helper_sve_ucvt_ds, a, 0, FPST_A64)
+ TRANS_FEAT(UCVTF_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_ucvt_sd, a, 0, FPST_FPCR)
++           gen_helper_sve_ucvt_sd, a, 0, FPST_A64)
+ TRANS_FEAT(UCVTF_dd, aa64_sve, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_ucvt_dd, a, 0, FPST_FPCR)
++           gen_helper_sve_ucvt_dd, a, 0, FPST_A64)
+ /*
+  *** SVE Memory - 32-bit Gather and Unsized Contiguous Group
+@@ -XXX,XX +XXX,XX @@ DO_ZPZZ_FP(FMINP, aa64_sve2, sve2_fminp_zpzz)
+ TRANS_FEAT_NONSTREAMING(FMMLA_s, aa64_sve_f32mm, gen_gvec_fpst_zzzz,
+                         gen_helper_fmmla_s, a->rd, a->rn, a->rm, a->ra,
+-                        0, FPST_FPCR)
++                        0, FPST_A64)
+ TRANS_FEAT_NONSTREAMING(FMMLA_d, aa64_sve_f64mm, gen_gvec_fpst_zzzz,
+                         gen_helper_fmmla_d, a->rd, a->rn, a->rm, a->ra,
+-                        0, FPST_FPCR)
++                        0, FPST_A64)
+ static gen_helper_gvec_4 * const sqdmlal_zzzw_fns[] = {
+     NULL,                           gen_helper_sve2_sqdmlal_zzzw_h,
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT_NONSTREAMING(RAX1, aa64_sve2_sha3, gen_gvec_fn_arg_zzz,
+                         gen_gvec_rax1, a)
+ TRANS_FEAT(FCVTNT_sh, aa64_sve2, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve2_fcvtnt_sh, a, 0, FPST_FPCR)
++           gen_helper_sve2_fcvtnt_sh, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTNT_ds, aa64_sve2, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve2_fcvtnt_ds, a, 0, FPST_FPCR)
++           gen_helper_sve2_fcvtnt_ds, a, 0, FPST_A64)
+ TRANS_FEAT(BFCVTNT, aa64_sve_bf16, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve_bfcvtnt, a, 0, FPST_FPCR)
++           gen_helper_sve_bfcvtnt, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTLT_hs, aa64_sve2, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve2_fcvtlt_hs, a, 0, FPST_FPCR)
++           gen_helper_sve2_fcvtlt_hs, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTLT_sd, aa64_sve2, gen_gvec_fpst_arg_zpz,
+-           gen_helper_sve2_fcvtlt_sd, a, 0, FPST_FPCR)
++           gen_helper_sve2_fcvtlt_sd, a, 0, FPST_A64)
+ TRANS_FEAT(FCVTX_ds, aa64_sve2, do_frint_mode, a,
+            FPROUNDING_ODD, gen_helper_sve_fcvt_ds)
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const flogb_fns[] = {
+     gen_helper_flogb_s, gen_helper_flogb_d
+ };
+ TRANS_FEAT(FLOGB, aa64_sve2, gen_gvec_fpst_arg_zpz, flogb_fns[a->esz],
+-           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR)
++           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
+ static bool do_FMLAL_zzzw(DisasContext *s, arg_rrrr_esz *a, bool sub, bool sel)
+ {
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT_NONSTREAMING(BFMMLA, aa64_sve_bf16, gen_gvec_env_arg_zzzz,
+ static bool do_BFMLAL_zzzw(DisasContext *s, arg_rrrr_esz *a, bool sel)
+ {
+     return gen_gvec_fpst_zzzz(s, gen_helper_gvec_bfmlal,
+-                              a->rd, a->rn, a->rm, a->ra, sel, FPST_FPCR);
++                              a->rd, a->rn, a->rm, a->ra, sel, FPST_A64);
+ }
+ TRANS_FEAT(BFMLALB_zzzw, aa64_sve_bf16, do_BFMLAL_zzzw, a, false)
+@@ -XXX,XX +XXX,XX @@ static bool do_BFMLAL_zzxw(DisasContext *s, arg_rrxr_esz *a, bool sel)
+ {
+     return gen_gvec_fpst_zzzz(s, gen_helper_gvec_bfmlal_idx,
+                               a->rd, a->rn, a->rm, a->ra,
+-                              (a->index << 1) | sel, FPST_FPCR);
++                              (a->index << 1) | sel, FPST_A64);
+ }
+ TRANS_FEAT(BFMLALB_zzxw, aa64_sve_bf16, do_BFMLAL_zzxw, a, false)
+--
+.34.1

-[PULL 16/26] target/arm: Implement FEAT_LVA
+[PULL 24/36] target/arm: Remove now-unused vfp.fp_status and FPST_FPCR
-From: Richard Henderson <richard.henderson@linaro.org>
+Now we have moved all the uses of vfp.fp_status and FPST_FPCR
 to either the A32 or A64 fields, we can remove these.
-This feature is relatively small, as it applies only to
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-k pages and thus requires no additional changes to the
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-table descriptor walking algorithm, only a change to the
+Message-id: 20250124162836.2332150-13-peter.maydell@linaro.org
-minimum TSZ (which is the inverse of the maximum virtual
+---
-address space size).
+ target/arm/cpu.h           | 2 --
  target/arm/tcg/translate.h | 6 ------
  target/arm/cpu.c           | 1 -
  target/arm/vfp_helper.c    | 8 +-------
 files changed, 1 insertion(+), 16 deletions(-)
-Note that this feature widens VBAR_ELx, but we already
-treat the register as being 64 bits wide.
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-10-richard.henderson@linaro.org
-Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
----
- docs/system/arm/emulation.rst | 1 +
- target/arm/cpu-param.h        | 2 +-
- target/arm/cpu.h              | 5 +++++
- target/arm/cpu64.c            | 1 +
- target/arm/helper.c           | 9 ++++++++-
-files changed, 16 insertions(+), 2 deletions(-)
-diff --git a/docs/system/arm/emulation.rst b/docs/system/arm/emulation.rst
-index XXXXXXX..XXXXXXX 100644
---- a/docs/system/arm/emulation.rst
-+++ b/docs/system/arm/emulation.rst
-@@ -XXX,XX +XXX,XX @@ the following architecture extensions:
- - FEAT_LRCPC (Load-acquire RCpc instructions)
- - FEAT_LRCPC2 (Load-acquire RCpc instructions v2)
- - FEAT_LSE (Large System Extensions)
-+- FEAT_LVA (Large Virtual Address space)
- - FEAT_MTE (Memory Tagging Extension)
- - FEAT_MTE2 (Memory Tagging Extension)
- - FEAT_MTE3 (MTE Asymmetric Fault Handling)
-diff --git a/target/arm/cpu-param.h b/target/arm/cpu-param.h
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/cpu-param.h
-+++ b/target/arm/cpu-param.h
-@@ -XXX,XX +XXX,XX @@
- #ifdef TARGET_AARCH64
- # define TARGET_LONG_BITS             64
- # define TARGET_PHYS_ADDR_SPACE_BITS  48
--# define TARGET_VIRT_ADDR_SPACE_BITS  48
-+# define TARGET_VIRT_ADDR_SPACE_BITS  52
- #else
- # define TARGET_LONG_BITS             32
- # define TARGET_PHYS_ADDR_SPACE_BITS  40
 diff --git a/target/arm/cpu.h b/target/arm/cpu.h
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.h
 +++ b/target/arm/cpu.h
-@@ -XXX,XX +XXX,XX @@ static inline bool isar_feature_aa64_ccidx(const ARMISARegisters *id)
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
-     return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, CCIDX) != 0;
- }
+         /* There are a number of distinct float control structures:
+          *
-+static inline bool isar_feature_aa64_lva(const ARMISARegisters *id)
+-         *  fp_status: is the "normal" fp status.
-+{
+          *  fp_status_a32: is the "normal" fp status for AArch32 insns
-+    return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, VARANGE) != 0;
+          *  fp_status_a64: is the "normal" fp status for AArch64 insns
-+}
+          *  fp_status_fp16: used for half-precision calculations
-+
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
- static inline bool isar_feature_aa64_tts2uxn(const ARMISARegisters *id)
+          * only thing which needs to read the exception flags being
           * an explicit FPSCR read.
           */
 -        float_status fp_status;
          float_status fp_status_a32;
          float_status fp_status_a64;
          float_status fp_status_f16;
 diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/tcg/translate.h
 +++ b/target/arm/tcg/translate.h
@@ -XXX,XX +XXX,XX @@ static inline CPUARMTBFlags arm_tbflags_from_tb(const TranslationBlock *tb)
   * Enum for argument to fpstatus_ptr().
   */
  typedef enum ARMFPStatusFlavour {
 -    FPST_FPCR,
      FPST_A32,
      FPST_A64,
      FPST_FPCR_F16,
@@ -XXX,XX +XXX,XX @@ typedef enum ARMFPStatusFlavour {
   * been set up to point to the requested field in the CPU state struct.
   * The options are:
   *
 - * FPST_FPCR
 - *   for non-FP16 operations controlled by the FPCR
   * FPST_A32
   *   for AArch32 non-FP16 operations controlled by the FPCR
   * FPST_A64
@@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour)
      int offset;
      switch (flavour) {
 -    case FPST_FPCR:
 -        offset = offsetof(CPUARMState, vfp.fp_status);
 -        break;
      case FPST_A32:
          offset = offsetof(CPUARMState, vfp.fp_status_a32);
          break;
 diff --git a/target/arm/cpu.c b/target/arm/cpu.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.c
 +++ b/target/arm/cpu.c
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset_hold(Object *obj, ResetType type)
      set_flush_inputs_to_zero(1, &env->vfp.standard_fp_status);
      set_default_nan_mode(1, &env->vfp.standard_fp_status);
      set_default_nan_mode(1, &env->vfp.standard_fp_status_f16);
 -    arm_set_default_fp_behaviours(&env->vfp.fp_status);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_a32);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_a64);
      arm_set_default_fp_behaviours(&env->vfp.standard_fp_status);
 diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static inline uint32_t vfp_exceptbits_from_host(int host_bits)
  static uint32_t vfp_get_fpsr_from_host(CPUARMState *env)
  {
-     return FIELD_EX64(id->id_aa64mmfr1, ID_AA64MMFR1, XNX) != 0;
+-    uint32_t i;
-diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
++    uint32_t i = 0;
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/cpu64.c
+-    i = get_float_exception_flags(&env->vfp.fp_status);
-+++ b/target/arm/cpu64.c
+     i |= get_float_exception_flags(&env->vfp.fp_status_a32);
-@@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj)
+     i |= get_float_exception_flags(&env->vfp.fp_status_a64);
-     t = FIELD_DP64(t, ID_AA64MMFR2, UAO, 1);
+     i |= get_float_exception_flags(&env->vfp.standard_fp_status);
-     t = FIELD_DP64(t, ID_AA64MMFR2, CNP, 1); /* TTCNP */
+@@ -XXX,XX +XXX,XX @@ static void vfp_clear_float_status_exc_flags(CPUARMState *env)
-     t = FIELD_DP64(t, ID_AA64MMFR2, ST, 1); /* TTST */
+      * values. The caller should have arranged for env->vfp.fpsr to
-+    t = FIELD_DP64(t, ID_AA64MMFR2, VARANGE, 1); /* FEAT_LVA */
+      * be the architecturally up-to-date exception flag information first.
-     cpu->isar.id_aa64mmfr2 = t;
+      */
+-    set_float_exception_flags(0, &env->vfp.fp_status);
-     t = cpu->isar.id_aa64zfr0;
+     set_float_exception_flags(0, &env->vfp.fp_status_a32);
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+     set_float_exception_flags(0, &env->vfp.fp_status_a64);
-index XXXXXXX..XXXXXXX 100644
+     set_float_exception_flags(0, &env->vfp.fp_status_f16);
---- a/target/arm/helper.c
+@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
-+++ b/target/arm/helper.c
+             i = float_round_to_zero;
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+             break;
-     } else {
+         }
-         max_tsz = 39;
+-        set_float_rounding_mode(i, &env->vfp.fp_status);
          set_float_rounding_mode(i, &env->vfp.fp_status_a32);
          set_float_rounding_mode(i, &env->vfp.fp_status_a64);
          set_float_rounding_mode(i, &env->vfp.fp_status_f16);
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
      }
--    min_tsz = 16;  /* TODO: ARMv8.2-LVA  */
+     if (changed & FPCR_FZ) {
-+
+         bool ftz_enabled = val & FPCR_FZ;
-+    min_tsz = 16;
+-        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status);
-+    if (using64k) {
+-        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status);
-+        if (cpu_isar_feature(aa64_lva, env_archcpu(env))) {
+         set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_a32);
-+            min_tsz = 12;
+         set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_a32);
-+        }
+         set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_a64);
-+    }
+@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
-+    /* TODO: FEAT_LPA2 */
+     }
+     if (changed & FPCR_DN) {
-     if (tsz > max_tsz) {
+         bool dnan_enabled = val & FPCR_DN;
-         tsz = max_tsz;
+-        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a32);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a64);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16);
 --
-.25.1
+.34.1

-[PULL 05/26] target/arm: Support PSCI 1.1 and SMCCC 1.0
+[PULL 25/36] target/arm: Define new fp_status_f16_a32 and fp_status_f16_a64
-From: Akihiko Odaki <akihiko.odaki@gmail.com>
+As the first part of splitting the existing fp_status_f16
 into separate float_status fields for AArch32 and AArch64
 (so that we can make FEAT_AFP control bits apply only
 for AArch64), define the two new fp_status_f16_a32 and
 fp_status_f16_a64 fields, but don't use them yet.
-Support the latest PSCI on TCG and HVF. A 64-bit function called from
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-AArch32 now returns NOT_SUPPORTED, which is necessary to adhere to SMC
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-Calling Convention 1.0. It is still not compliant with SMCCC 1.3 since
+Message-id: 20250124162836.2332150-14-peter.maydell@linaro.org
-they do not implement mandatory functions.
+---
  target/arm/cpu.h           |  4 ++++
  target/arm/tcg/translate.h | 12 ++++++++++++
  target/arm/cpu.c           |  2 ++
  target/arm/vfp_helper.c    | 14 ++++++++++++++
 files changed, 32 insertions(+)
-Signed-off-by: Akihiko Odaki <akihiko.odaki@gmail.com>
+diff --git a/target/arm/cpu.h b/target/arm/cpu.h
 Message-id: 20220213035753.34577-1-akihiko.odaki@gmail.com
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
 [PMM: update MISMATCH_CHECK checks on PSCI_VERSION macros to match]
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
  target/arm/kvm-consts.h | 13 +++++++++----
  hw/arm/boot.c           | 12 +++++++++---
  target/arm/cpu.c        |  5 +++--
  target/arm/hvf/hvf.c    | 27 ++++++++++++++++++++++++++-
  target/arm/kvm64.c      |  2 +-
  target/arm/psci.c       | 35 ++++++++++++++++++++++++++++++++---
 files changed, 80 insertions(+), 14 deletions(-)
 diff --git a/target/arm/kvm-consts.h b/target/arm/kvm-consts.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/kvm-consts.h
+--- a/target/arm/cpu.h
-+++ b/target/arm/kvm-consts.h
++++ b/target/arm/cpu.h
-@@ -XXX,XX +XXX,XX @@ MISMATCH_CHECK(QEMU_PSCI_0_1_FN_MIGRATE, KVM_PSCI_FN_MIGRATE);
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
- #define QEMU_PSCI_0_2_FN64_AFFINITY_INFO QEMU_PSCI_0_2_FN64(4)
+          *  fp_status_a32: is the "normal" fp status for AArch32 insns
- #define QEMU_PSCI_0_2_FN64_MIGRATE QEMU_PSCI_0_2_FN64(5)
+          *  fp_status_a64: is the "normal" fp status for AArch64 insns
+          *  fp_status_fp16: used for half-precision calculations
-+#define QEMU_PSCI_1_0_FN_PSCI_FEATURES QEMU_PSCI_0_2_FN(10)
++         *  fp_status_f16_a32: used for AArch32 half-precision calculations
-+
++         *  fp_status_f16_a64: used for AArch64 half-precision calculations
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_SUSPEND, PSCI_0_2_FN_CPU_SUSPEND);
+          *  standard_fp_status : the ARM "Standard FPSCR Value"
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_OFF, PSCI_0_2_FN_CPU_OFF);
+          *  standard_fp_status_fp16 : used for half-precision
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_ON, PSCI_0_2_FN_CPU_ON);
+          *       calculations with the ARM "Standard FPSCR Value"
-@@ -XXX,XX +XXX,XX @@ MISMATCH_CHECK(QEMU_PSCI_0_2_FN_MIGRATE, PSCI_0_2_FN_MIGRATE);
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_CPU_SUSPEND, PSCI_0_2_FN64_CPU_SUSPEND);
+         float_status fp_status_a32;
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_CPU_ON, PSCI_0_2_FN64_CPU_ON);
+         float_status fp_status_a64;
- MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_MIGRATE, PSCI_0_2_FN64_MIGRATE);
+         float_status fp_status_f16;
-+MISMATCH_CHECK(QEMU_PSCI_1_0_FN_PSCI_FEATURES, PSCI_1_0_FN_PSCI_FEATURES);
++        float_status fp_status_f16_a32;
++        float_status fp_status_f16_a64;
- /* PSCI v0.2 return values used by TCG emulation of PSCI */
+         float_status standard_fp_status;
+         float_status standard_fp_status_f16;
- /* No Trusted OS migration to worry about when offlining CPUs */
- #define QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED        2
+diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h
 -/* We implement version 0.2 only */
 -#define QEMU_PSCI_0_2_RET_VERSION_0_2                       2
 +#define QEMU_PSCI_VERSION_0_1                     0x00001
 +#define QEMU_PSCI_VERSION_0_2                     0x00002
 +#define QEMU_PSCI_VERSION_1_1                     0x10001
  MISMATCH_CHECK(QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED, PSCI_0_2_TOS_MP);
 -MISMATCH_CHECK(QEMU_PSCI_0_2_RET_VERSION_0_2,
 -               (PSCI_VERSION_MAJOR(0) | PSCI_VERSION_MINOR(2)));
 +/* We don't bother to check every possible version value */
 +MISMATCH_CHECK(QEMU_PSCI_VERSION_0_2, PSCI_VERSION(0, 2));
 +MISMATCH_CHECK(QEMU_PSCI_VERSION_1_1, PSCI_VERSION(1, 1));
  /* PSCI return values (inclusive of all PSCI versions) */
  #define QEMU_PSCI_RET_SUCCESS                     0
 diff --git a/hw/arm/boot.c b/hw/arm/boot.c
 index XXXXXXX..XXXXXXX 100644
---- a/hw/arm/boot.c
+--- a/target/arm/tcg/translate.h
-+++ b/hw/arm/boot.c
++++ b/target/arm/tcg/translate.h
-@@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt)
+@@ -XXX,XX +XXX,XX @@ typedef enum ARMFPStatusFlavour {
-     }
+     FPST_A32,
+     FPST_A64,
-     qemu_fdt_add_subnode(fdt, "/psci");
+     FPST_FPCR_F16,
--    if (armcpu->psci_version == 2) {
++    FPST_A32_F16,
--        const char comp[] = "arm,psci-0.2\0arm,psci";
++    FPST_A64_F16,
--        qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
+     FPST_STD,
-+    if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2 ||
+     FPST_STD_F16,
-+        armcpu->psci_version == QEMU_PSCI_VERSION_1_1) {
+ } ARMFPStatusFlavour;
-+        if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2) {
+@@ -XXX,XX +XXX,XX @@ typedef enum ARMFPStatusFlavour {
-+            const char comp[] = "arm,psci-0.2\0arm,psci";
+  *   for AArch64 non-FP16 operations controlled by the FPCR
-+            qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
+  * FPST_FPCR_F16
-+        } else {
+  *   for operations controlled by the FPCR where FPCR.FZ16 is to be used
-+            const char comp[] = "arm,psci-1.0\0arm,psci-0.2\0arm,psci";
++ * FPST_A32_F16
-+            qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
++ *   for AArch32 operations controlled by the FPCR where FPCR.FZ16 is to be used
-+        }
++ * FPST_A64_F16
++ *   for AArch64 operations controlled by the FPCR where FPCR.FZ16 is to be used
-         cpu_off_fn = QEMU_PSCI_0_2_FN_CPU_OFF;
+  * FPST_STD
-         if (arm_feature(&armcpu->env, ARM_FEATURE_AARCH64)) {
+  *   for A32/T32 Neon operations using the "standard FPSCR value"
   * FPST_STD_F16
@@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour)
      case FPST_FPCR_F16:
          offset = offsetof(CPUARMState, vfp.fp_status_f16);
          break;
 +    case FPST_A32_F16:
 +        offset = offsetof(CPUARMState, vfp.fp_status_f16_a32);
 +        break;
 +    case FPST_A64_F16:
 +        offset = offsetof(CPUARMState, vfp.fp_status_f16_a64);
 +        break;
      case FPST_STD:
          offset = offsetof(CPUARMState, vfp.standard_fp_status);
          break;
 diff --git a/target/arm/cpu.c b/target/arm/cpu.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.c
 +++ b/target/arm/cpu.c
-@@ -XXX,XX +XXX,XX @@ static void arm_cpu_initfn(Object *obj)
+@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset_hold(Object *obj, ResetType type)
-      * picky DTB consumer will also provide a helpful error message.
+     arm_set_default_fp_behaviours(&env->vfp.fp_status_a64);
-      */
+     arm_set_default_fp_behaviours(&env->vfp.standard_fp_status);
-     cpu->dtb_compatible = "qemu,unknown";
+     arm_set_default_fp_behaviours(&env->vfp.fp_status_f16);
--    cpu->psci_version = 1; /* By default assume PSCI v0.1 */
++    arm_set_default_fp_behaviours(&env->vfp.fp_status_f16_a32);
-+    cpu->psci_version = QEMU_PSCI_VERSION_0_1; /* By default assume PSCI v0.1 */
++    arm_set_default_fp_behaviours(&env->vfp.fp_status_f16_a64);
-     cpu->kvm_target = QEMU_KVM_ARM_TARGET_NONE;
+     arm_set_default_fp_behaviours(&env->vfp.standard_fp_status_f16);
-     if (tcg_enabled() || hvf_enabled()) {
+ #ifndef CONFIG_USER_ONLY
--        cpu->psci_version = 2; /* TCG and HVF implement PSCI 0.2 */
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
-+        /* TCG and HVF implement PSCI 1.1 */
+index XXXXXXX..XXXXXXX 100644
-+        cpu->psci_version = QEMU_PSCI_VERSION_1_1;
+--- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static uint32_t vfp_get_fpsr_from_host(CPUARMState *env)
      /* FZ16 does not generate an input denormal exception.  */
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16)
            & ~float_flag_input_denormal);
 +    i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a32)
 +          & ~float_flag_input_denormal);
 +    i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a64)
 +          & ~float_flag_input_denormal);
      i |= (get_float_exception_flags(&env->vfp.standard_fp_status_f16)
            & ~float_flag_input_denormal);
      return vfp_exceptbits_from_host(i);
@@ -XXX,XX +XXX,XX @@ static void vfp_clear_float_status_exc_flags(CPUARMState *env)
      set_float_exception_flags(0, &env->vfp.fp_status_a32);
      set_float_exception_flags(0, &env->vfp.fp_status_a64);
      set_float_exception_flags(0, &env->vfp.fp_status_f16);
 +    set_float_exception_flags(0, &env->vfp.fp_status_f16_a32);
 +    set_float_exception_flags(0, &env->vfp.fp_status_f16_a64);
      set_float_exception_flags(0, &env->vfp.standard_fp_status);
      set_float_exception_flags(0, &env->vfp.standard_fp_status_f16);
  }
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
          set_float_rounding_mode(i, &env->vfp.fp_status_a32);
          set_float_rounding_mode(i, &env->vfp.fp_status_a64);
          set_float_rounding_mode(i, &env->vfp.fp_status_f16);
 +        set_float_rounding_mode(i, &env->vfp.fp_status_f16_a32);
 +        set_float_rounding_mode(i, &env->vfp.fp_status_f16_a64);
      }
      if (changed & FPCR_FZ16) {
          bool ftz_enabled = val & FPCR_FZ16;
          set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
 +        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a32);
 +        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a64);
          set_flush_to_zero(ftz_enabled, &env->vfp.standard_fp_status_f16);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
 +        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a32);
 +        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a64);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.standard_fp_status_f16);
      }
      if (changed & FPCR_FZ) {
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a32);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a64);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16);
 +        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16_a32);
 +        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16_a64);
      }
  }
-diff --git a/target/arm/hvf/hvf.c b/target/arm/hvf/hvf.c
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/hvf/hvf.c
-+++ b/target/arm/hvf/hvf.c
-@@ -XXX,XX +XXX,XX @@ static bool hvf_handle_psci_call(CPUState *cpu)
-     switch (param[0]) {
-     case QEMU_PSCI_0_2_FN_PSCI_VERSION:
--        ret = QEMU_PSCI_0_2_RET_VERSION_0_2;
-+        ret = QEMU_PSCI_VERSION_1_1;
-         break;
-     case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
-         ret = QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED; /* No trusted OS */
-@@ -XXX,XX +XXX,XX @@ static bool hvf_handle_psci_call(CPUState *cpu)
-     case QEMU_PSCI_0_2_FN_MIGRATE:
-         ret = QEMU_PSCI_RET_NOT_SUPPORTED;
-         break;
-+    case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
-+        switch (param[1]) {
-+        case QEMU_PSCI_0_2_FN_PSCI_VERSION:
-+        case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
-+        case QEMU_PSCI_0_2_FN_AFFINITY_INFO:
-+        case QEMU_PSCI_0_2_FN64_AFFINITY_INFO:
-+        case QEMU_PSCI_0_2_FN_SYSTEM_RESET:
-+        case QEMU_PSCI_0_2_FN_SYSTEM_OFF:
-+        case QEMU_PSCI_0_1_FN_CPU_ON:
-+        case QEMU_PSCI_0_2_FN_CPU_ON:
-+        case QEMU_PSCI_0_2_FN64_CPU_ON:
-+        case QEMU_PSCI_0_1_FN_CPU_OFF:
-+        case QEMU_PSCI_0_2_FN_CPU_OFF:
-+        case QEMU_PSCI_0_1_FN_CPU_SUSPEND:
-+        case QEMU_PSCI_0_2_FN_CPU_SUSPEND:
-+        case QEMU_PSCI_0_2_FN64_CPU_SUSPEND:
-+        case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
-+            ret = 0;
-+            break;
-+        case QEMU_PSCI_0_1_FN_MIGRATE:
-+        case QEMU_PSCI_0_2_FN_MIGRATE:
-+        default:
-+            ret = QEMU_PSCI_RET_NOT_SUPPORTED;
-+        }
-+        break;
-     default:
-         return false;
-     }
-diff --git a/target/arm/kvm64.c b/target/arm/kvm64.c
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/kvm64.c
-+++ b/target/arm/kvm64.c
-@@ -XXX,XX +XXX,XX @@ int kvm_arch_init_vcpu(CPUState *cs)
-         cpu->kvm_init_features[0] |= 1 << KVM_ARM_VCPU_POWER_OFF;
-     }
-     if (kvm_check_extension(cs->kvm_state, KVM_CAP_ARM_PSCI_0_2)) {
--        cpu->psci_version = 2;
-+        cpu->psci_version = QEMU_PSCI_VERSION_0_2;
-         cpu->kvm_init_features[0] |= 1 << KVM_ARM_VCPU_PSCI_0_2;
-     }
-     if (!arm_feature(&cpu->env, ARM_FEATURE_AARCH64)) {
-diff --git a/target/arm/psci.c b/target/arm/psci.c
-index XXXXXXX..XXXXXXX 100644
---- a/target/arm/psci.c
-+++ b/target/arm/psci.c
-@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
- {
-     /*
-      * This function partially implements the logic for dispatching Power State
--     * Coordination Interface (PSCI) calls (as described in ARM DEN 0022B.b),
-+     * Coordination Interface (PSCI) calls (as described in ARM DEN 0022D.b),
-      * to the extent required for bringing up and taking down secondary cores,
-      * and for handling reset and poweroff requests.
-      * Additional information about the calling convention used is available in
-@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
-     }
-     if ((param[0] & QEMU_PSCI_0_2_64BIT) && !is_a64(env)) {
--        ret = QEMU_PSCI_RET_INVALID_PARAMS;
-+        ret = QEMU_PSCI_RET_NOT_SUPPORTED;
-         goto err;
-     }
-@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
-         ARMCPU *target_cpu;
-     case QEMU_PSCI_0_2_FN_PSCI_VERSION:
--        ret = QEMU_PSCI_0_2_RET_VERSION_0_2;
-+        ret = QEMU_PSCI_VERSION_1_1;
-         break;
-     case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
-         ret = QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED; /* No trusted OS */
-@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
-         }
-         helper_wfi(env, 4);
-         break;
-+    case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
-+        switch (param[1]) {
-+        case QEMU_PSCI_0_2_FN_PSCI_VERSION:
-+        case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
-+        case QEMU_PSCI_0_2_FN_AFFINITY_INFO:
-+        case QEMU_PSCI_0_2_FN64_AFFINITY_INFO:
-+        case QEMU_PSCI_0_2_FN_SYSTEM_RESET:
-+        case QEMU_PSCI_0_2_FN_SYSTEM_OFF:
-+        case QEMU_PSCI_0_1_FN_CPU_ON:
-+        case QEMU_PSCI_0_2_FN_CPU_ON:
-+        case QEMU_PSCI_0_2_FN64_CPU_ON:
-+        case QEMU_PSCI_0_1_FN_CPU_OFF:
-+        case QEMU_PSCI_0_2_FN_CPU_OFF:
-+        case QEMU_PSCI_0_1_FN_CPU_SUSPEND:
-+        case QEMU_PSCI_0_2_FN_CPU_SUSPEND:
-+        case QEMU_PSCI_0_2_FN64_CPU_SUSPEND:
-+        case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
-+            if (!(param[1] & QEMU_PSCI_0_2_64BIT) || is_a64(env)) {
-+                ret = 0;
-+                break;
-+            }
-+            /* fallthrough */
-+        case QEMU_PSCI_0_1_FN_MIGRATE:
-+        case QEMU_PSCI_0_2_FN_MIGRATE:
-+        default:
-+            ret = QEMU_PSCI_RET_NOT_SUPPORTED;
-+            break;
-+        }
-+        break;
-     case QEMU_PSCI_0_1_FN_MIGRATE:
-     case QEMU_PSCI_0_2_FN_MIGRATE:
-     default:
 --
-.25.1
+.34.1

-New patch
+[PULL 26/36] target/arm: Use fp_status_f16_a32 in AArch32-only helpers
+We directly use fp_status_f16 in a handful of helpers that
+are AArch32-specific; switch to fp_status_f16_a32 for these.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-15-peter.maydell@linaro.org
+---
+ target/arm/tcg/vec_helper.c | 4 ++--
+ target/arm/vfp_helper.c     | 2 +-
+files changed, 3 insertions(+), 3 deletions(-)
+diff --git a/target/arm/tcg/vec_helper.c b/target/arm/tcg/vec_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/vec_helper.c
++++ b/target/arm/tcg/vec_helper.c
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_a32)(void *vd, void *vn, void *vm,
+                             CPUARMState *env, uint32_t desc)
+ {
+     do_fmlal(vd, vn, vm, &env->vfp.standard_fp_status, desc,
+-             get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
++             get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a32));
+ }
+ void HELPER(gvec_fmlal_a64)(void *vd, void *vn, void *vm,
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_idx_a32)(void *vd, void *vn, void *vm,
+                                 CPUARMState *env, uint32_t desc)
+ {
+     do_fmlal_idx(vd, vn, vm, &env->vfp.standard_fp_status, desc,
+-                 get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
++                 get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a32));
+ }
+ void HELPER(gvec_fmlal_idx_a64)(void *vd, void *vn, void *vm,
+diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/vfp_helper.c
++++ b/target/arm/vfp_helper.c
+@@ -XXX,XX +XXX,XX @@ void VFP_HELPER(cmpe, P)(ARGTYPE a, ARGTYPE b, CPUARMState *env) \
+     softfloat_to_vfp_compare(env, \
+         FLOATTYPE ## _compare(a, b, &env->vfp.FPST)); \
+ }
+-DO_VFP_cmp(h, float16, dh_ctype_f16, fp_status_f16)
++DO_VFP_cmp(h, float16, dh_ctype_f16, fp_status_f16_a32)
+ DO_VFP_cmp(s, float32, float32, fp_status_a32)
+ DO_VFP_cmp(d, float64, float64, fp_status_a32)
+ #undef DO_VFP_cmp
+--
+.34.1

-New patch
+[PULL 27/36] target/arm: Use fp_status_f16_a64 in AArch64-only helpers
+We directly use fp_status_f16 in a handful of helpers that are
+AArch64-specific; switch to fp_status_f16_a64 for these.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-16-peter.maydell@linaro.org
+---
+ target/arm/tcg/sme_helper.c | 4 ++--
+ target/arm/tcg/vec_helper.c | 8 ++++----
+files changed, 6 insertions(+), 6 deletions(-)
+diff --git a/target/arm/tcg/sme_helper.c b/target/arm/tcg/sme_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/sme_helper.c
++++ b/target/arm/tcg/sme_helper.c
+@@ -XXX,XX +XXX,XX @@ void HELPER(sme_fmopa_h)(void *vza, void *vzn, void *vzm, void *vpn,
+     float_status fpst_odd, fpst_std, fpst_f16;
+     /*
+-     * Make copies of fp_status and fp_status_f16, because this operation
++     * Make copies of the fp status fields we use, because this operation
+      * does not update the cumulative fp exception status.  It also
+      * produces default NaNs. We also need a second copy of fp_status with
+      * round-to-odd -- see above.
+      */
+-    fpst_f16 = env->vfp.fp_status_f16;
++    fpst_f16 = env->vfp.fp_status_f16_a64;
+     fpst_std = env->vfp.fp_status_a64;
+     set_default_nan_mode(true, &fpst_std);
+     set_default_nan_mode(true, &fpst_f16);
+diff --git a/target/arm/tcg/vec_helper.c b/target/arm/tcg/vec_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/vec_helper.c
++++ b/target/arm/tcg/vec_helper.c
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_a64)(void *vd, void *vn, void *vm,
+                             CPUARMState *env, uint32_t desc)
+ {
+     do_fmlal(vd, vn, vm, &env->vfp.fp_status_a64, desc,
+-             get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
++             get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a64));
+ }
+ void HELPER(sve2_fmlal_zzzw_s)(void *vd, void *vn, void *vm, void *va,
+@@ -XXX,XX +XXX,XX @@ void HELPER(sve2_fmlal_zzzw_s)(void *vd, void *vn, void *vm, void *va,
+     uint16_t negn = extract32(desc, SIMD_DATA_SHIFT, 1) << 15;
+     intptr_t sel = extract32(desc, SIMD_DATA_SHIFT + 1, 1) * sizeof(float16);
+     float_status *status = &env->vfp.fp_status_a64;
+-    bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16);
++    bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a64);
+     for (i = 0; i < oprsz; i += sizeof(float32)) {
+         float16 nn_16 = *(float16 *)(vn + H1_2(i + sel)) ^ negn;
+@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fmlal_idx_a64)(void *vd, void *vn, void *vm,
+                                 CPUARMState *env, uint32_t desc)
+ {
+     do_fmlal_idx(vd, vn, vm, &env->vfp.fp_status_a64, desc,
+-                 get_flush_inputs_to_zero(&env->vfp.fp_status_f16));
++                 get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a64));
+ }
+ void HELPER(sve2_fmlal_zzxw_s)(void *vd, void *vn, void *vm, void *va,
+@@ -XXX,XX +XXX,XX @@ void HELPER(sve2_fmlal_zzxw_s)(void *vd, void *vn, void *vm, void *va,
+     intptr_t sel = extract32(desc, SIMD_DATA_SHIFT + 1, 1) * sizeof(float16);
+     intptr_t idx = extract32(desc, SIMD_DATA_SHIFT + 2, 3) * sizeof(float16);
+     float_status *status = &env->vfp.fp_status_a64;
+-    bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16);
++    bool fz16 = get_flush_inputs_to_zero(&env->vfp.fp_status_f16_a64);
+     for (i = 0; i < oprsz; i += 16) {
+         float16 mm_16 = *(float16 *)(vm + i + idx);
+--
+.34.1

-New patch
+[PULL 28/36] target/arm: Use FPST_A32_F16 in A32 decoder
+In the A32 decoder, use FPST_A32_F16 rather than FPST_FPCR_F16.
+By doing an automated conversion of the whole file we avoid possibly
+using more than one fpst value in a set_rmode/op/restore_rmode
+sequence.
+Patch created with
+  perl -p -i -e 's/FPST_FPCR_F16(?!_)/FPST_A32_F16/g' target/arm/tcg/translate-vfp.c
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-17-peter.maydell@linaro.org
+---
+ target/arm/tcg/translate-vfp.c | 24 ++++++++++++------------
+file changed, 12 insertions(+), 12 deletions(-)
+diff --git a/target/arm/tcg/translate-vfp.c b/target/arm/tcg/translate-vfp.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/arm/tcg/translate-vfp.c
++++ b/target/arm/tcg/translate-vfp.c
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a)
+     }
+     if (sz == 1) {
+-        fpst = fpstatus_ptr(FPST_FPCR_F16);
++        fpst = fpstatus_ptr(FPST_A32_F16);
+     } else {
+         fpst = fpstatus_ptr(FPST_A32);
+     }
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT(DisasContext *s, arg_VCVT *a)
+     }
+     if (sz == 1) {
+-        fpst = fpstatus_ptr(FPST_FPCR_F16);
++        fpst = fpstatus_ptr(FPST_A32_F16);
+     } else {
+         fpst = fpstatus_ptr(FPST_A32);
+     }
+@@ -XXX,XX +XXX,XX @@ static bool do_vfp_3op_hp(DisasContext *s, VFPGen3OpSPFn *fn,
+     /*
+      * Do a half-precision operation. Functionally this is
+      * the same as do_vfp_3op_sp(), except:
+-     *  - it uses the FPST_FPCR_F16
++     *  - it uses the FPST_A32_F16
+      *  - it doesn't need the VFP vector handling (fp16 is a
+      *    v8 feature, and in v8 VFP vectors don't exist)
+      *  - it does the aa32_fp16_arith feature test
+@@ -XXX,XX +XXX,XX @@ static bool do_vfp_3op_hp(DisasContext *s, VFPGen3OpSPFn *fn,
+     f0 = tcg_temp_new_i32();
+     f1 = tcg_temp_new_i32();
+     fd = tcg_temp_new_i32();
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     vfp_load_reg16(f0, vn);
+     vfp_load_reg16(f1, vm);
+@@ -XXX,XX +XXX,XX @@ static bool do_vfm_hp(DisasContext *s, arg_VFMA_sp *a, bool neg_n, bool neg_d)
+         /* VFNMA, VFNMS */
+         gen_vfp_negh(vd, vd);
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     gen_helper_vfp_muladdh(vd, vn, vm, vd, fpst);
+     vfp_store_reg32(vd, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ DO_VFP_2OP(VNEG, dp, gen_vfp_negd, aa32_fpdp_v2)
+ static void gen_VSQRT_hp(TCGv_i32 vd, TCGv_i32 vm)
+ {
+-    gen_helper_vfp_sqrth(vd, vm, fpstatus_ptr(FPST_FPCR_F16));
++    gen_helper_vfp_sqrth(vd, vm, fpstatus_ptr(FPST_A32_F16));
+ }
+ static void gen_VSQRT_sp(TCGv_i32 vd, TCGv_i32 vm)
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTR_hp(DisasContext *s, arg_VRINTR_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg16(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     gen_helper_rinth(tmp, tmp, fpst);
+     vfp_store_reg32(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTZ_hp(DisasContext *s, arg_VRINTZ_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg16(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     tcg_rmode = gen_set_rmode(FPROUNDING_ZERO, fpst);
+     gen_helper_rinth(tmp, tmp, fpst);
+     gen_restore_rmode(tcg_rmode, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VRINTX_hp(DisasContext *s, arg_VRINTX_sp *a)
+     tmp = tcg_temp_new_i32();
+     vfp_load_reg16(tmp, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     gen_helper_rinth_exact(tmp, tmp, fpst);
+     vfp_store_reg32(tmp, a->vd);
+     return true;
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_int_hp(DisasContext *s, arg_VCVT_int_sp *a)
+     vm = tcg_temp_new_i32();
+     vfp_load_reg32(vm, a->vm);
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     if (a->s) {
+         /* i32 -> f16 */
+         gen_helper_vfp_sitoh(vm, vm, fpst);
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_fix_hp(DisasContext *s, arg_VCVT_fix_sp *a)
+     vd = tcg_temp_new_i32();
+     vfp_load_reg32(vd, a->vd);
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     shift = tcg_constant_i32(frac_bits);
+     /* Switch on op:U:sx bits */
+@@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_hp_int(DisasContext *s, arg_VCVT_sp_int *a)
+         return true;
+     }
+-    fpst = fpstatus_ptr(FPST_FPCR_F16);
++    fpst = fpstatus_ptr(FPST_A32_F16);
+     vm = tcg_temp_new_i32();
+     vfp_load_reg16(vm, a->vm);
+--
+.34.1

-[PULL 10/26] target/arm: Fault on invalid TCR_ELx.TxSZ
+[PULL 29/36] target/arm: Use FPST_A64_F16 in A64 decoder
-From: Richard Henderson <richard.henderson@linaro.org>
+In the A64 decoder, use FPST_A64_F16 rather than FPST_FPCR_F16.
 By doing an automated conversion of the whole file we avoid possibly
 using more than one fpst value in a set_rmode/op/restore_rmode
 sequence.
-Without FEAT_LVA, the behaviour of programming an invalid value
+Patch created with
-is IMPLEMENTATION DEFINED.  With FEAT_LVA, programming an invalid
+  perl -p -i -e 's/FPST_FPCR_F16(?!_)/FPST_A64_F16/g' target/arm/tcg/translate-{a64,sve,sme}.c
 minimum value requires a Translation fault.
-It is most self-consistent to choose to generate the fault always.
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20250124162836.2332150-18-peter.maydell@linaro.org
 ---
  target/arm/tcg/translate-a64.c | 32 ++++++++---------
  target/arm/tcg/translate-sve.c | 66 +++++++++++++++++-----------------
 files changed, 49 insertions(+), 49 deletions(-)
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
+diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c
 Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20220301215958.157011-4-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
  target/arm/internals.h |  1 +
  target/arm/helper.c    | 32 ++++++++++++++++++++++++++++----
 files changed, 29 insertions(+), 4 deletions(-)
 diff --git a/target/arm/internals.h b/target/arm/internals.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/internals.h
+--- a/target/arm/tcg/translate-a64.c
-+++ b/target/arm/internals.h
++++ b/target/arm/tcg/translate-a64.c
-@@ -XXX,XX +XXX,XX @@ typedef struct ARMVAParameters {
+@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3_fpst(DisasContext *s, bool is_q, int rd, int rn,
-     bool hpd        : 1;
+                               int rm, bool is_fp16, int data,
-     bool using16k   : 1;
+                               gen_helper_gvec_3_ptr *fn)
-     bool using64k   : 1;
+ {
-+    bool tsz_oob    : 1;  /* tsz has been clamped to legal range */
+-    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
- } ARMVAParameters;
++    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_A64_F16 : FPST_A64);
+     tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd),
- ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+                        vec_full_reg_offset(s, rn),
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+                        vec_full_reg_offset(s, rm), fpst,
@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op4_fpst(DisasContext *s, bool is_q, int rd, int rn,
                                int rm, int ra, bool is_fp16, int data,
                                gen_helper_gvec_4_ptr *fn)
  {
 -    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
 +    TCGv_ptr fpst = fpstatus_ptr(is_fp16 ? FPST_A64_F16 : FPST_A64);
      tcg_gen_gvec_4_ptr(vec_full_reg_offset(s, rd),
                         vec_full_reg_offset(s, rn),
                         vec_full_reg_offset(s, rm),
@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar(DisasContext *s, arg_rrr_e *a, const FPScalar *f)
          if (fp_access_check(s)) {
              TCGv_i32 t0 = read_fp_hreg(s, a->rn);
              TCGv_i32 t1 = read_fp_hreg(s, a->rm);
 -            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_FPCR_F16));
 +            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_A64_F16));
              write_fp_sreg(s, a->rd, t0);
          }
          break;
@@ -XXX,XX +XXX,XX @@ static bool do_fcmp0_s(DisasContext *s, arg_rr_e *a,
              TCGv_i32 t0 = read_fp_hreg(s, a->rn);
              TCGv_i32 t1 = tcg_constant_i32(0);
              if (swap) {
 -                f->gen_h(t0, t1, t0, fpstatus_ptr(FPST_FPCR_F16));
 +                f->gen_h(t0, t1, t0, fpstatus_ptr(FPST_A64_F16));
              } else {
 -                f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_FPCR_F16));
 +                f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_A64_F16));
              }
              write_fp_sreg(s, a->rd, t0);
          }
@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_idx(DisasContext *s, arg_rrx_e *a, const FPScalar *f)
              TCGv_i32 t1 = tcg_temp_new_i32();
              read_vec_element_i32(s, t1, a->rm, a->idx, MO_16);
 -            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_FPCR_F16));
 +            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_A64_F16));
              write_fp_sreg(s, a->rd, t0);
          }
          break;
@@ -XXX,XX +XXX,XX @@ static bool do_fmla_scalar_idx(DisasContext *s, arg_rrx_e *a, bool neg)
                  gen_vfp_negh(t1, t1);
              }
              gen_helper_advsimd_muladdh(t0, t1, t2, t0,
 -                                       fpstatus_ptr(FPST_FPCR_F16));
 +                                       fpstatus_ptr(FPST_A64_F16));
              write_fp_sreg(s, a->rd, t0);
          }
          break;
@@ -XXX,XX +XXX,XX @@ static bool do_fp3_scalar_pair(DisasContext *s, arg_rr_e *a, const FPScalar *f)
              read_vec_element_i32(s, t0, a->rn, 0, MO_16);
              read_vec_element_i32(s, t1, a->rn, 1, MO_16);
 -            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_FPCR_F16));
 +            f->gen_h(t0, t0, t1, fpstatus_ptr(FPST_A64_F16));
              write_fp_sreg(s, a->rd, t0);
          }
          break;
@@ -XXX,XX +XXX,XX @@ static bool do_fmadd(DisasContext *s, arg_rrrr_e *a, bool neg_a, bool neg_n)
              if (neg_n) {
                  gen_vfp_negh(tn, tn);
              }
 -            fpst = fpstatus_ptr(FPST_FPCR_F16);
 +            fpst = fpstatus_ptr(FPST_A64_F16);
              gen_helper_advsimd_muladdh(ta, tn, tm, ta, fpst);
              write_fp_sreg(s, a->rd, ta);
          }
@@ -XXX,XX +XXX,XX @@ static bool do_fp_reduction(DisasContext *s, arg_qrr_e *a,
      if (fp_access_check(s)) {
          MemOp esz = a->esz;
          int elts = (a->q ? 16 : 8) >> esz;
 -        TCGv_ptr fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +        TCGv_ptr fpst = fpstatus_ptr(esz == MO_16 ? FPST_A64_F16 : FPST_A64);
          TCGv_i32 res = do_reduction_op(s, a->rn, esz, 0, elts, fpst, fn);
          write_fp_sreg(s, a->rd, res);
      }
@@ -XXX,XX +XXX,XX @@ static void handle_fp_compare(DisasContext *s, int size,
                                bool cmp_with_zero, bool signal_all_nans)
  {
      TCGv_i64 tcg_flags = tcg_temp_new_i64();
 -    TCGv_ptr fpst = fpstatus_ptr(size == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    TCGv_ptr fpst = fpstatus_ptr(size == MO_16 ? FPST_A64_F16 : FPST_A64);
      if (size == MO_64) {
          TCGv_i64 tcg_vn, tcg_vm;
@@ -XXX,XX +XXX,XX @@ static bool do_fp1_scalar(DisasContext *s, arg_rr_e *a,
          return check == 0;
      }
 -    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      if (rmode >= 0) {
          tcg_rmode = gen_set_rmode(rmode, fpst);
      }
@@ -XXX,XX +XXX,XX @@ static bool do_cvtf_scalar(DisasContext *s, MemOp esz, int rd, int shift,
      TCGv_i32 tcg_shift, tcg_single;
      TCGv_i64 tcg_double;
 -    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      tcg_shift = tcg_constant_i32(shift);
      switch (esz) {
@@ -XXX,XX +XXX,XX @@ static void do_fcvt_scalar(DisasContext *s, MemOp out, MemOp esz,
      TCGv_ptr tcg_fpstatus;
      TCGv_i32 tcg_shift, tcg_rmode, tcg_single;
 -    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    tcg_fpstatus = fpstatus_ptr(esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      tcg_shift = tcg_constant_i32(shift);
      tcg_rmode = gen_set_rmode(rmode, tcg_fpstatus);
@@ -XXX,XX +XXX,XX @@ static bool do_fp1_vector(DisasContext *s, arg_qrr_e *a,
          return check == 0;
      }
 -    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      if (rmode >= 0) {
          tcg_rmode = gen_set_rmode(rmode, fpst);
      }
@@ -XXX,XX +XXX,XX @@ static bool do_gvec_op2_fpst(DisasContext *s, MemOp esz, bool is_q,
          return check == 0;
      }
 -    fpst = fpstatus_ptr(esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    fpst = fpstatus_ptr(esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      tcg_gen_gvec_2_ptr(vec_full_reg_offset(s, rd),
                         vec_full_reg_offset(s, rn), fpst,
                         is_q ? 16 : 8, vec_full_reg_size(s),
 diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/target/arm/tcg/translate-sve.c
-+++ b/target/arm/helper.c
++++ b/target/arm/tcg/translate-sve.c
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zz(DisasContext *s, gen_helper_gvec_2_ptr *fn,
-                                    ARMMMUIdx mmu_idx, bool data)
+                                  arg_rr_esz *a, int data)
  {
-     uint64_t tcr = regime_tcr(env, mmu_idx)->raw_tcr;
+     return gen_gvec_fpst_zz(s, fn, a->rd, a->rn, data,
--    bool epd, hpd, using16k, using64k;
+-                            a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
--    int select, tsz, tbi, max_tsz;
++                            a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
-+    bool epd, hpd, using16k, using64k, tsz_oob;
+ }
-+    int select, tsz, tbi, max_tsz, min_tsz;
+ /* Invoke an out-of-line helper on 3 Zregs. */
-     if (!regime_has_2_ranges(mmu_idx)) {
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zzz(DisasContext *s, gen_helper_gvec_3_ptr *fn,
-         select = 0;
+                                   arg_rrr_esz *a, int data)
-@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
+ {
-     } else {
+     return gen_gvec_fpst_zzz(s, fn, a->rd, a->rn, a->rm, data,
-         max_tsz = 39;
+-                             a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
-     }
++                             a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
-+    min_tsz = 16;  /* TODO: ARMv8.2-LVA  */
+ }
--    tsz = MIN(tsz, max_tsz);
+ /* Invoke an out-of-line helper on 4 Zregs. */
--    tsz = MAX(tsz, 16);  /* TODO: ARMv8.2-LVA  */
+@@ -XXX,XX +XXX,XX @@ static bool gen_gvec_fpst_arg_zpzz(DisasContext *s, gen_helper_gvec_4_ptr *fn,
-+    if (tsz > max_tsz) {
+                                    arg_rprr_esz *a)
-+        tsz = max_tsz;
+ {
-+        tsz_oob = true;
+     return gen_gvec_fpst_zzzp(s, fn, a->rd, a->rn, a->rm, a->pg, 0,
-+    } else if (tsz < min_tsz) {
+-                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
-+        tsz = min_tsz;
++                              a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
-+        tsz_oob = true;
+ }
-+    } else {
-+        tsz_oob = false;
+ /* Invoke a vector expander on two Zregs and an immediate.  */
-+    }
+@@ -XXX,XX +XXX,XX @@ static bool do_FMLA_zzxz(DisasContext *s, arg_rrxr_esz *a, bool sub)
      /* Present TBI as a composite with TBID.  */
      tbi = aa64_va_parameter_tbi(tcr, mmu_idx);
@@ -XXX,XX +XXX,XX @@ ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
          .hpd = hpd,
          .using16k = using16k,
          .using64k = using64k,
 +        .tsz_oob = tsz_oob,
      };
+     return gen_gvec_fpst_zzzz(s, fns[a->esz], a->rd, a->rn, a->rm, a->ra,
+                               (a->index << 1) | sub,
+-                              a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
++                              a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
  }
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
+ TRANS_FEAT(FMLA_zzxz, aa64_sve, do_FMLA_zzxz, a, false)
-         param = aa64_va_parameters(env, address, mmu_idx,
+@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const fmul_idx_fns[4] = {
-                                    access_type != MMU_INST_FETCH);
+ };
-         level = 0;
+ TRANS_FEAT(FMUL_zzx, aa64_sve, gen_gvec_fpst_zzz,
-+
+            fmul_idx_fns[a->esz], a->rd, a->rn, a->rm, a->index,
-+        /*
+-           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
-+         * If TxSZ is programmed to a value larger than the maximum,
++           a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
-+         * or smaller than the effective minimum, it is IMPLEMENTATION
-+         * DEFINED whether we behave as if the field were programmed
+ /*
-+         * within bounds, or if a level 0 Translation fault is generated.
+  *** SVE Floating Point Fast Reduction Group
-+         *
+@@ -XXX,XX +XXX,XX @@ static bool do_reduce(DisasContext *s, arg_rpr_esz *a,
-+         * With FEAT_LVA, fault on less than minimum becomes required,
-+         * so our choice is to always raise the fault.
+     tcg_gen_addi_ptr(t_zn, tcg_env, vec_full_reg_offset(s, a->rn));
-+         */
+     tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, a->pg));
-+        if (param.tsz_oob) {
+-    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
-+            fault_type = ARMFault_Translation;
++    status = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
-+            goto do_fault;
-+        }
+     fn(temp, t_zn, t_pg, status, t_desc);
-+
-         addrsize = 64 - 8 * param.tbi;
+@@ -XXX,XX +XXX,XX @@ static bool do_ppz_fp(DisasContext *s, arg_rpr_esz *a,
-         inputsize = 64 - param.tsz;
+     if (sve_access_check(s)) {
-     } else {
+         unsigned vsz = vec_full_reg_size(s);
          TCGv_ptr status =
 -            fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +            fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
          tcg_gen_gvec_3_ptr(pred_full_reg_offset(s, a->rd),
                             vec_full_reg_offset(s, a->rn),
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const ftmad_fns[4] = {
  };
  TRANS_FEAT_NONSTREAMING(FTMAD, aa64_sve, gen_gvec_fpst_zzz,
                          ftmad_fns[a->esz], a->rd, a->rn, a->rm, a->imm,
 -                        a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +                        a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  /*
   *** SVE Floating Point Accumulating Reduction Group
@@ -XXX,XX +XXX,XX @@ static bool trans_FADDA(DisasContext *s, arg_rprr_esz *a)
      t_pg = tcg_temp_new_ptr();
      tcg_gen_addi_ptr(t_rm, tcg_env, vec_full_reg_offset(s, a->rm));
      tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, a->pg));
 -    t_fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    t_fpst = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      t_desc = tcg_constant_i32(simd_desc(vsz, vsz, 0));
      fns[a->esz - 1](t_val, t_val, t_rm, t_pg, t_fpst, t_desc);
@@ -XXX,XX +XXX,XX @@ static void do_fp_scalar(DisasContext *s, int zd, int zn, int pg, bool is_fp16,
      tcg_gen_addi_ptr(t_zn, tcg_env, vec_full_reg_offset(s, zn));
      tcg_gen_addi_ptr(t_pg, tcg_env, pred_full_reg_offset(s, pg));
 -    status = fpstatus_ptr(is_fp16 ? FPST_FPCR_F16 : FPST_A64);
 +    status = fpstatus_ptr(is_fp16 ? FPST_A64_F16 : FPST_A64);
      desc = tcg_constant_i32(simd_desc(vsz, vsz, 0));
      fn(t_zd, t_zn, t_pg, scalar, status, desc);
  }
@@ -XXX,XX +XXX,XX @@ static bool do_fp_cmp(DisasContext *s, arg_rprr_esz *a,
      }
      if (sve_access_check(s)) {
          unsigned vsz = vec_full_reg_size(s);
 -        TCGv_ptr status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +        TCGv_ptr status = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
          tcg_gen_gvec_4_ptr(pred_full_reg_offset(s, a->rd),
                             vec_full_reg_offset(s, a->rn),
                             vec_full_reg_offset(s, a->rm),
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_4_ptr * const fcadd_fns[] = {
  };
  TRANS_FEAT(FCADD, aa64_sve, gen_gvec_fpst_zzzp, fcadd_fns[a->esz],
             a->rd, a->rn, a->rm, a->pg, a->rot,
 -           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  #define DO_FMLA(NAME, name) \
      static gen_helper_gvec_5_ptr * const name##_fns[4] = {              \
@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FCADD, aa64_sve, gen_gvec_fpst_zzzp, fcadd_fns[a->esz],
      };                                                                  \
      TRANS_FEAT(NAME, aa64_sve, gen_gvec_fpst_zzzzp, name##_fns[a->esz], \
                 a->rd, a->rn, a->rm, a->ra, a->pg, 0,                    \
 -               a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +               a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  DO_FMLA(FMLA_zpzzz, fmla_zpzzz)
  DO_FMLA(FMLS_zpzzz, fmls_zpzzz)
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_5_ptr * const fcmla_fns[4] = {
  };
  TRANS_FEAT(FCMLA_zpzzz, aa64_sve, gen_gvec_fpst_zzzzp, fcmla_fns[a->esz],
             a->rd, a->rn, a->rm, a->ra, a->pg, a->rot,
 -           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  static gen_helper_gvec_4_ptr * const fcmla_idx_fns[4] = {
      NULL, gen_helper_gvec_fcmlah_idx, gen_helper_gvec_fcmlas_idx, NULL
  };
  TRANS_FEAT(FCMLA_zzxz, aa64_sve, gen_gvec_fpst_zzzz, fcmla_idx_fns[a->esz],
             a->rd, a->rn, a->rm, a->ra, a->index * 4 + a->rot,
 -           a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  /*
   *** SVE Floating Point Unary Operations Predicated Group
@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FCVT_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
             gen_helper_sve_fcvt_sd, a, 0, FPST_A64)
  TRANS_FEAT(FCVTZS_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzs_hh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzs_hh, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZU_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzu_hh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzu_hh, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZS_hs, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzs_hs, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzs_hs, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZU_hs, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzu_hs, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzu_hs, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZS_hd, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzs_hd, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzs_hd, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZU_hd, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_fcvtzu_hd, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_fcvtzu_hd, a, 0, FPST_A64_F16)
  TRANS_FEAT(FCVTZS_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
             gen_helper_sve_fcvtzs_ss, a, 0, FPST_A64)
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frint_fns[] = {
      gen_helper_sve_frint_d
  };
  TRANS_FEAT(FRINTI, aa64_sve, gen_gvec_fpst_arg_zpz, frint_fns[a->esz],
 -           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a, 0, a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  static gen_helper_gvec_3_ptr * const frintx_fns[] = {
      NULL,
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frintx_fns[] = {
      gen_helper_sve_frintx_d
  };
  TRANS_FEAT(FRINTX, aa64_sve, gen_gvec_fpst_arg_zpz, frintx_fns[a->esz],
 -           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +           a, 0, a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
  static bool do_frint_mode(DisasContext *s, arg_rpr_esz *a,
                            ARMFPRounding mode, gen_helper_gvec_3_ptr *fn)
@@ -XXX,XX +XXX,XX @@ static bool do_frint_mode(DisasContext *s, arg_rpr_esz *a,
      }
      vsz = vec_full_reg_size(s);
 -    status = fpstatus_ptr(a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64);
 +    status = fpstatus_ptr(a->esz == MO_16 ? FPST_A64_F16 : FPST_A64);
      tmode = gen_set_rmode(mode, status);
      tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, a->rd),
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const frecpx_fns[] = {
      gen_helper_sve_frecpx_s, gen_helper_sve_frecpx_d,
  };
  TRANS_FEAT(FRECPX, aa64_sve, gen_gvec_fpst_arg_zpz, frecpx_fns[a->esz],
 -           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a, 0, a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  static gen_helper_gvec_3_ptr * const fsqrt_fns[] = {
      NULL,                   gen_helper_sve_fsqrt_h,
      gen_helper_sve_fsqrt_s, gen_helper_sve_fsqrt_d,
  };
  TRANS_FEAT(FSQRT, aa64_sve, gen_gvec_fpst_arg_zpz, fsqrt_fns[a->esz],
 -           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a, 0, a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  TRANS_FEAT(SCVTF_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_scvt_hh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_scvt_hh, a, 0, FPST_A64_F16)
  TRANS_FEAT(SCVTF_sh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_scvt_sh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_scvt_sh, a, 0, FPST_A64_F16)
  TRANS_FEAT(SCVTF_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_scvt_dh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_scvt_dh, a, 0, FPST_A64_F16)
  TRANS_FEAT(SCVTF_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
             gen_helper_sve_scvt_ss, a, 0, FPST_A64)
@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(SCVTF_dd, aa64_sve, gen_gvec_fpst_arg_zpz,
             gen_helper_sve_scvt_dd, a, 0, FPST_A64)
  TRANS_FEAT(UCVTF_hh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_ucvt_hh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_ucvt_hh, a, 0, FPST_A64_F16)
  TRANS_FEAT(UCVTF_sh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_ucvt_sh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_ucvt_sh, a, 0, FPST_A64_F16)
  TRANS_FEAT(UCVTF_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
 -           gen_helper_sve_ucvt_dh, a, 0, FPST_FPCR_F16)
 +           gen_helper_sve_ucvt_dh, a, 0, FPST_A64_F16)
  TRANS_FEAT(UCVTF_ss, aa64_sve, gen_gvec_fpst_arg_zpz,
             gen_helper_sve_ucvt_ss, a, 0, FPST_A64)
@@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const flogb_fns[] = {
      gen_helper_flogb_s, gen_helper_flogb_d
  };
  TRANS_FEAT(FLOGB, aa64_sve2, gen_gvec_fpst_arg_zpz, flogb_fns[a->esz],
 -           a, 0, a->esz == MO_16 ? FPST_FPCR_F16 : FPST_A64)
 +           a, 0, a->esz == MO_16 ? FPST_A64_F16 : FPST_A64)
  static bool do_FMLAL_zzzw(DisasContext *s, arg_rrrr_esz *a, bool sub, bool sel)
  {
 --
-.25.1
+.34.1

-[PULL 09/26] target/arm: Set TCR_EL1.TSZ for user-only
+[PULL 30/36] target/arm: Remove now-unused vfp.fp_status_f16 and FPST_FPCR_F16
-From: Richard Henderson <richard.henderson@linaro.org>
+Now we have moved all the uses of vfp.fp_status_f16 and FPST_FPCR_F16
 to the new A32 or A64 fields, we can remove these.
-Set this as the kernel would, to 48 bits, to keep the computation
+Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-of the address space correct for PAuth.
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
 Message-id: 20250124162836.2332150-19-peter.maydell@linaro.org
 ---
  target/arm/cpu.h           | 2 --
  target/arm/tcg/translate.h | 6 ------
  target/arm/cpu.c           | 1 -
  target/arm/vfp_helper.c    | 7 -------
 files changed, 16 deletions(-)
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
+diff --git a/target/arm/cpu.h b/target/arm/cpu.h
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
+index XXXXXXX..XXXXXXX 100644
-Message-id: 20220301215958.157011-3-richard.henderson@linaro.org
+--- a/target/arm/cpu.h
-Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
++++ b/target/arm/cpu.h
----
+@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
- target/arm/cpu.c | 3 ++-
+          *
-file changed, 2 insertions(+), 1 deletion(-)
+          *  fp_status_a32: is the "normal" fp status for AArch32 insns
+          *  fp_status_a64: is the "normal" fp status for AArch64 insns
 -         *  fp_status_fp16: used for half-precision calculations
           *  fp_status_fp16_a32: used for AArch32 half-precision calculations
           *  fp_status_fp16_a64: used for AArch64 half-precision calculations
           *  standard_fp_status : the ARM "Standard FPSCR Value"
@@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState {
           */
          float_status fp_status_a32;
          float_status fp_status_a64;
 -        float_status fp_status_f16;
          float_status fp_status_f16_a32;
          float_status fp_status_f16_a64;
          float_status standard_fp_status;
 diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/tcg/translate.h
 +++ b/target/arm/tcg/translate.h
@@ -XXX,XX +XXX,XX @@ static inline CPUARMTBFlags arm_tbflags_from_tb(const TranslationBlock *tb)
  typedef enum ARMFPStatusFlavour {
      FPST_A32,
      FPST_A64,
 -    FPST_FPCR_F16,
      FPST_A32_F16,
      FPST_A64_F16,
      FPST_STD,
@@ -XXX,XX +XXX,XX @@ typedef enum ARMFPStatusFlavour {
   *   for AArch32 non-FP16 operations controlled by the FPCR
   * FPST_A64
   *   for AArch64 non-FP16 operations controlled by the FPCR
 - * FPST_FPCR_F16
 - *   for operations controlled by the FPCR where FPCR.FZ16 is to be used
   * FPST_A32_F16
   *   for AArch32 operations controlled by the FPCR where FPCR.FZ16 is to be used
   * FPST_A64_F16
@@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour)
      case FPST_A64:
          offset = offsetof(CPUARMState, vfp.fp_status_a64);
          break;
 -    case FPST_FPCR_F16:
 -        offset = offsetof(CPUARMState, vfp.fp_status_f16);
 -        break;
      case FPST_A32_F16:
          offset = offsetof(CPUARMState, vfp.fp_status_f16_a32);
          break;
 diff --git a/target/arm/cpu.c b/target/arm/cpu.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/cpu.c
 +++ b/target/arm/cpu.c
-@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(DeviceState *dev)
+@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset_hold(Object *obj, ResetType type)
-                 aarch64_sve_zcr_get_valid_len(cpu, cpu->sve_default_vq - 1);
+     arm_set_default_fp_behaviours(&env->vfp.fp_status_a32);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_a64);
      arm_set_default_fp_behaviours(&env->vfp.standard_fp_status);
 -    arm_set_default_fp_behaviours(&env->vfp.fp_status_f16);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_f16_a32);
      arm_set_default_fp_behaviours(&env->vfp.fp_status_f16_a64);
      arm_set_default_fp_behaviours(&env->vfp.standard_fp_status_f16);
 diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static uint32_t vfp_get_fpsr_from_host(CPUARMState *env)
      i |= get_float_exception_flags(&env->vfp.fp_status_a64);
      i |= get_float_exception_flags(&env->vfp.standard_fp_status);
      /* FZ16 does not generate an input denormal exception.  */
 -    i |= (get_float_exception_flags(&env->vfp.fp_status_f16)
 -          & ~float_flag_input_denormal);
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a32)
            & ~float_flag_input_denormal);
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a64)
@@ -XXX,XX +XXX,XX @@ static void vfp_clear_float_status_exc_flags(CPUARMState *env)
       */
      set_float_exception_flags(0, &env->vfp.fp_status_a32);
      set_float_exception_flags(0, &env->vfp.fp_status_a64);
 -    set_float_exception_flags(0, &env->vfp.fp_status_f16);
      set_float_exception_flags(0, &env->vfp.fp_status_f16_a32);
      set_float_exception_flags(0, &env->vfp.fp_status_f16_a64);
      set_float_exception_flags(0, &env->vfp.standard_fp_status);
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
          }
-         /*
+         set_float_rounding_mode(i, &env->vfp.fp_status_a32);
-+         * Enable 48-bit address space (TODO: take reserved_va into account).
+         set_float_rounding_mode(i, &env->vfp.fp_status_a64);
-          * Enable TBI0 but not TBI1.
+-        set_float_rounding_mode(i, &env->vfp.fp_status_f16);
-          * Note that this must match useronly_clean_ptr.
+         set_float_rounding_mode(i, &env->vfp.fp_status_f16_a32);
-          */
+         set_float_rounding_mode(i, &env->vfp.fp_status_f16_a64);
--        env->cp15.tcr_el[1].raw_tcr = (1ULL << 37);
+     }
-+        env->cp15.tcr_el[1].raw_tcr = 5 | (1ULL << 37);
+     if (changed & FPCR_FZ16) {
+         bool ftz_enabled = val & FPCR_FZ16;
-         /* Enable MTE */
+-        set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
-         if (cpu_isar_feature(aa64_mte, cpu)) {
+         set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a32);
          set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a64);
          set_flush_to_zero(ftz_enabled, &env->vfp.standard_fp_status_f16);
 -        set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a32);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16_a64);
          set_flush_inputs_to_zero(ftz_enabled, &env->vfp.standard_fp_status_f16);
@@ -XXX,XX +XXX,XX @@ static void vfp_set_fpcr_to_host(CPUARMState *env, uint32_t val, uint32_t mask)
          bool dnan_enabled = val & FPCR_DN;
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a32);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_a64);
 -        set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16_a32);
          set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16_a64);
      }
 --
-.25.1
+.34.1

-[PULL 26/26] ui/cocoa.m: Remove unnecessary NSAutoreleasePools
+[PULL 31/36] fpu: Rename float_flag_input_denormal to float_flag_input_denormal_flushed
-In commit 6e657e64cdc478 in 2013 we added some autorelease pools to
+Our float_flag_input_denormal exception flag is set when the fpu code
-deal with complaints from macOS when we made calls into Cocoa from
+flushes an input denormal to zero.  This is what many guest
-threads that didn't have automatically created autorelease pools.
+architectures (eg classic Arm behaviour) require, but it is not the
-Later on, macOS got stricter about forbidding cross-thread Cocoa
+only denormal-related reason we might want to set an exception flag.
-calls, and in commit 5588840ff77800e839d8 we restructured the code to
+The x86 behaviour (which we do not currently model correctly) wants
-avoid them.  This left the autorelease pool creation in several
+to see an exception flag when a denormal input is *not* flushed to
-functions without any purpose; delete it.
+zero and is actually used in an arithmetic operation. Arm's FEAT_AFP
+also wants these semantics.
-We still need the pool in cocoa_refresh() for the clipboard related
-code which is called directly there.
+Rename float_flag_input_denormal to float_flag_input_denormal_flushed
 to make it clearer when it is set and to allow us to add a new
 float_flag_input_denormal_used next to it for the x86/FEAT_AFP
 semantics.
 Commit created with
  for f in `git grep -l float_flag_input_denormal`; do sed -i -e 's/float_flag_input_denormal/float_flag_input_denormal_flushed/' $f; done
 and manual editing of softfloat-types.h and softfloat.c to clean
 up the indentation afterwards and to fix a comment which wasn't
 using the full name of the flag.
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Akihiko Odaki <akihiko.odaki@gmail.com>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-Tested-by: Akihiko Odaki <akihiko.odaki@gmail.com>
+Message-id: 20250124162836.2332150-20-peter.maydell@linaro.org
 Message-id: 20220224101330.967429-3-peter.maydell@linaro.org
 ---
- ui/cocoa.m | 6 ------
+ include/fpu/softfloat-types.h |  5 +++--
-file changed, 6 deletions(-)
+ fpu/softfloat.c               |  4 ++--
+ target/arm/tcg/sve_helper.c   |  6 +++---
-diff --git a/ui/cocoa.m b/ui/cocoa.m
+ target/arm/vfp_helper.c       | 10 +++++-----
-index XXXXXXX..XXXXXXX 100644
+ target/i386/tcg/fpu_helper.c  |  6 +++---
---- a/ui/cocoa.m
+ target/mips/tcg/msa_helper.c  |  2 +-
-+++ b/ui/cocoa.m
+ target/rx/op_helper.c         |  2 +-
-@@ -XXX,XX +XXX,XX @@ int main (int argc, char **argv) {
+ fpu/softfloat-parts.c.inc     |  2 +-
- static void cocoa_update(DisplayChangeListener *dcl,
+files changed, 19 insertions(+), 18 deletions(-)
-                          int x, int y, int w, int h)
 diff --git a/include/fpu/softfloat-types.h b/include/fpu/softfloat-types.h
 index XXXXXXX..XXXXXXX 100644
 --- a/include/fpu/softfloat-types.h
 +++ b/include/fpu/softfloat-types.h
@@ -XXX,XX +XXX,XX @@ enum {
      float_flag_overflow        = 0x0004,
      float_flag_underflow       = 0x0008,
      float_flag_inexact         = 0x0010,
 -    float_flag_input_denormal  = 0x0020,
 +    /* We flushed an input denormal to 0 (because of flush_inputs_to_zero) */
 +    float_flag_input_denormal_flushed = 0x0020,
      float_flag_output_denormal = 0x0040,
      float_flag_invalid_isi     = 0x0080,  /* inf - inf */
      float_flag_invalid_imz     = 0x0100,  /* inf * 0 */
@@ -XXX,XX +XXX,XX @@ typedef struct float_status {
      bool tininess_before_rounding;
      /* should denormalised results go to zero and set the inexact flag? */
      bool flush_to_zero;
 -    /* should denormalised inputs go to zero and set the input_denormal flag? */
 +    /* should denormalised inputs go to zero and set input_denormal_flushed? */
      bool flush_inputs_to_zero;
      bool default_nan_mode;
      /*
 diff --git a/fpu/softfloat.c b/fpu/softfloat.c
 index XXXXXXX..XXXXXXX 100644
 --- a/fpu/softfloat.c
 +++ b/fpu/softfloat.c
@@ -XXX,XX +XXX,XX @@ this code that are retained.
          if (unlikely(soft_t ## _is_denormal(*a))) {                     \
              *a = soft_t ## _set_sign(soft_t ## _zero,                   \
                                       soft_t ## _is_neg(*a));            \
 -            float_raise(float_flag_input_denormal, s);                  \
 +            float_raise(float_flag_input_denormal_flushed, s);          \
          }                                                               \
      }
@@ -XXX,XX +XXX,XX @@ float128 float128_silence_nan(float128 a, float_status *status)
  static bool parts_squash_denormal(FloatParts64 p, float_status *status)
  {
--    NSAutoreleasePool * pool = [[NSAutoreleasePool alloc] init];
+     if (p.exp == 0 && p.frac != 0) {
--
+-        float_raise(float_flag_input_denormal, status);
-     COCOA_DEBUG("qemu_cocoa: cocoa_update\n");
++        float_raise(float_flag_input_denormal_flushed, status);
+         return true;
-     dispatch_async(dispatch_get_main_queue(), ^{
+     }
-@@ -XXX,XX +XXX,XX @@ static void cocoa_update(DisplayChangeListener *dcl,
-         }
+diff --git a/target/arm/tcg/sve_helper.c b/target/arm/tcg/sve_helper.c
-         [cocoaView setNeedsDisplayInRect:rect];
+index XXXXXXX..XXXXXXX 100644
-     });
+--- a/target/arm/tcg/sve_helper.c
--
++++ b/target/arm/tcg/sve_helper.c
--    [pool release];
+@@ -XXX,XX +XXX,XX @@ static int16_t do_float16_logb_as_int(float16 a, float_status *s)
                  return -15 - clz32(frac);
              }
              /* flush to zero */
 -            float_raise(float_flag_input_denormal, s);
 +            float_raise(float_flag_input_denormal_flushed, s);
          }
      } else if (unlikely(exp == 0x1f)) {
          if (frac == 0) {
@@ -XXX,XX +XXX,XX @@ static int32_t do_float32_logb_as_int(float32 a, float_status *s)
                  return -127 - clz32(frac);
              }
              /* flush to zero */
 -            float_raise(float_flag_input_denormal, s);
 +            float_raise(float_flag_input_denormal_flushed, s);
          }
      } else if (unlikely(exp == 0xff)) {
          if (frac == 0) {
@@ -XXX,XX +XXX,XX @@ static int64_t do_float64_logb_as_int(float64 a, float_status *s)
                  return -1023 - clz64(frac);
              }
              /* flush to zero */
 -            float_raise(float_flag_input_denormal, s);
 +            float_raise(float_flag_input_denormal_flushed, s);
          }
      } else if (unlikely(exp == 0x7ff)) {
          if (frac == 0) {
 diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static inline uint32_t vfp_exceptbits_from_host(int host_bits)
      if (host_bits & float_flag_inexact) {
          target_bits |= FPSR_IXC;
      }
 -    if (host_bits & float_flag_input_denormal) {
 +    if (host_bits & float_flag_input_denormal_flushed) {
          target_bits |= FPSR_IDC;
      }
      return target_bits;
@@ -XXX,XX +XXX,XX @@ static uint32_t vfp_get_fpsr_from_host(CPUARMState *env)
      i |= get_float_exception_flags(&env->vfp.standard_fp_status);
      /* FZ16 does not generate an input denormal exception.  */
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a32)
 -          & ~float_flag_input_denormal);
 +          & ~float_flag_input_denormal_flushed);
      i |= (get_float_exception_flags(&env->vfp.fp_status_f16_a64)
 -          & ~float_flag_input_denormal);
 +          & ~float_flag_input_denormal_flushed);
      i |= (get_float_exception_flags(&env->vfp.standard_fp_status_f16)
 -          & ~float_flag_input_denormal);
 +          & ~float_flag_input_denormal_flushed);
      return vfp_exceptbits_from_host(i);
  }
- static void cocoa_switch(DisplayChangeListener *dcl,
+@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(fjcvtzs)(float64 value, float_status *status)
-                          DisplaySurface *surface)
- {
+     /* Normal inexact, denormal with flush-to-zero, or overflow or NaN */
--    NSAutoreleasePool * pool = [[NSAutoreleasePool alloc] init];
+     inexact = e_new & (float_flag_inexact |
-     pixman_image_t *image = surface->image;
+-                       float_flag_input_denormal |
++                       float_flag_input_denormal_flushed |
-     COCOA_DEBUG("qemu_cocoa: cocoa_switch\n");
+                        float_flag_invalid);
-@@ -XXX,XX +XXX,XX @@ static void cocoa_switch(DisplayChangeListener *dcl,
-         [cocoaView updateUIInfo];
+     /* While not inexact for IEEE FP, -0.0 is inexact for JavaScript. */
-         [cocoaView switchSurface:image];
+diff --git a/target/i386/tcg/fpu_helper.c b/target/i386/tcg/fpu_helper.c
-     });
+index XXXXXXX..XXXXXXX 100644
--    [pool release];
+--- a/target/i386/tcg/fpu_helper.c
 +++ b/target/i386/tcg/fpu_helper.c
@@ -XXX,XX +XXX,XX @@ static void merge_exception_flags(CPUX86State *env, uint8_t old_flags)
                         (new_flags & float_flag_overflow ? FPUS_OE : 0) |
                         (new_flags & float_flag_underflow ? FPUS_UE : 0) |
                         (new_flags & float_flag_inexact ? FPUS_PE : 0) |
 -                       (new_flags & float_flag_input_denormal ? FPUS_DE : 0)));
 +                       (new_flags & float_flag_input_denormal_flushed ? FPUS_DE : 0)));
  }
- static void cocoa_refresh(DisplayChangeListener *dcl)
+ static inline floatx80 helper_fdiv(CPUX86State *env, floatx80 a, floatx80 b)
@@ -XXX,XX +XXX,XX @@ void helper_fxtract(CPUX86State *env)
              int shift = clz64(temp.l.lower);
              temp.l.lower <<= shift;
              expdif = 1 - EXPBIAS - shift;
 -            float_raise(float_flag_input_denormal, &env->fp_status);
 +            float_raise(float_flag_input_denormal_flushed, &env->fp_status);
          } else {
              expdif = EXPD(temp) - EXPBIAS;
          }
@@ -XXX,XX +XXX,XX @@ void update_mxcsr_from_sse_status(CPUX86State *env)
      uint8_t flags = get_float_exception_flags(&env->sse_status);
      /*
       * The MXCSR denormal flag has opposite semantics to
 -     * float_flag_input_denormal (the softfloat code sets that flag
 +     * float_flag_input_denormal_flushed (the softfloat code sets that flag
       * only when flushing input denormals to zero, but SSE sets it
       * only when not flushing them to zero), so is not converted
       * here.
 diff --git a/target/mips/tcg/msa_helper.c b/target/mips/tcg/msa_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/mips/tcg/msa_helper.c
 +++ b/target/mips/tcg/msa_helper.c
@@ -XXX,XX +XXX,XX @@ static inline int update_msacsr(CPUMIPSState *env, int action, int denormal)
      enable = GET_FP_ENABLE(env->active_tc.msacsr) | FP_UNIMPLEMENTED;
      /* Set Inexact (I) when flushing inputs to zero */
 -    if ((ieee_exception_flags & float_flag_input_denormal) &&
 +    if ((ieee_exception_flags & float_flag_input_denormal_flushed) &&
              (env->active_tc.msacsr & MSACSR_FS_MASK) != 0) {
          if (action & CLEAR_IS_INEXACT) {
              mips_exception_flags &= ~FP_INEXACT;
 diff --git a/target/rx/op_helper.c b/target/rx/op_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/rx/op_helper.c
 +++ b/target/rx/op_helper.c
@@ -XXX,XX +XXX,XX @@ static void update_fpsw(CPURXState *env, float32 ret, uintptr_t retaddr)
          if (xcpt & float_flag_inexact) {
              SET_FPSW(X);
          }
 -        if ((xcpt & (float_flag_input_denormal
 +        if ((xcpt & (float_flag_input_denormal_flushed
                       | float_flag_output_denormal))
              && !FIELD_EX32(env->fpsw, FPSW, DN)) {
              env->fpsw = FIELD_DP32(env->fpsw, FPSW, CE, 1);
 diff --git a/fpu/softfloat-parts.c.inc b/fpu/softfloat-parts.c.inc
 index XXXXXXX..XXXXXXX 100644
 --- a/fpu/softfloat-parts.c.inc
 +++ b/fpu/softfloat-parts.c.inc
@@ -XXX,XX +XXX,XX @@ static void partsN(canonicalize)(FloatPartsN *p, float_status *status,
          if (likely(frac_eqz(p))) {
              p->cls = float_class_zero;
          } else if (status->flush_inputs_to_zero) {
 -            float_raise(float_flag_input_denormal, status);
 +            float_raise(float_flag_input_denormal_flushed, status);
              p->cls = float_class_zero;
              frac_clear(p);
          } else {
 --
-.25.1
+.34.1

-[PULL 24/26] target/arm: Report KVM's actual PSCI version to guest in dtb
+[PULL 32/36] fpu: Rename float_flag_output_denormal to float_flag_output_denormal_flushed
-When we're using KVM, the PSCI implementation is provided by the
+Our float_flag_output_denormal exception flag is set when
-kernel, but QEMU has to tell the guest about it via the device tree.
+the fpu code flushes an output denormal to zero. Rename
-Currently we look at the KVM_CAP_ARM_PSCI_0_2 capability to determine
+it to float_flag_output_denormal_flushed:
-if the kernel is providing at least PSCI 0.2, but if the kernel
+ * this keeps it parallel with the flag for flushing
-provides a newer version than that we will still only tell the guest
+   input denormals, which we just renamed
-it has PSCI 0.2.  (This is fairly harmless; it just means the guest
+ * it makes it clearer that it doesn't mean "set when
-won't use newer parts of the PSCI API.)
+   the output is a denormal"
-The kernel exposes the specific PSCI version it is implementing via
+Commit created with
-the ONE_REG API; use this to report in the dtb that the PSCI
+ for f in `git grep -l float_flag_output_denormal`; do sed -i -e 's/float_flag_output_denormal/float_flag_output_denormal_flushed/' $f; done
 implementation is 1.0-compatible if appropriate.  (The device tree
 binding currently only distinguishes "pre-0.2", "0.2-compatible" and
 "1.0-compatible".)
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Marc Zyngier <maz@kernel.org>
-Reviewed-by: Akihiko Odaki <akihiko.odaki@gmail.com>
 Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-Reviewed-by: Andrew Jones <drjones@redhat.com>
+Message-id: 20250124162836.2332150-21-peter.maydell@linaro.org
 Message-id: 20220224134655.1207865-1-peter.maydell@linaro.org
 ---
- target/arm/kvm-consts.h |  1 +
+ include/fpu/softfloat-types.h | 3 ++-
- hw/arm/boot.c           |  5 ++---
+ fpu/softfloat.c               | 2 +-
- target/arm/kvm64.c      | 12 ++++++++++++
+ target/arm/vfp_helper.c       | 2 +-
-files changed, 15 insertions(+), 3 deletions(-)
+ target/i386/tcg/fpu_helper.c  | 2 +-
  target/m68k/fpu_helper.c      | 2 +-
  target/mips/tcg/msa_helper.c  | 2 +-
  target/rx/op_helper.c         | 2 +-
  target/tricore/fpu_helper.c   | 6 +++---
  fpu/softfloat-parts.c.inc     | 2 +-
 files changed, 12 insertions(+), 11 deletions(-)
-diff --git a/target/arm/kvm-consts.h b/target/arm/kvm-consts.h
+diff --git a/include/fpu/softfloat-types.h b/include/fpu/softfloat-types.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/kvm-consts.h
+--- a/include/fpu/softfloat-types.h
-+++ b/target/arm/kvm-consts.h
++++ b/include/fpu/softfloat-types.h
-@@ -XXX,XX +XXX,XX @@ MISMATCH_CHECK(QEMU_PSCI_1_0_FN_PSCI_FEATURES, PSCI_1_0_FN_PSCI_FEATURES);
+@@ -XXX,XX +XXX,XX @@ enum {
+     float_flag_inexact         = 0x0010,
- #define QEMU_PSCI_VERSION_0_1                     0x00001
+     /* We flushed an input denormal to 0 (because of flush_inputs_to_zero) */
- #define QEMU_PSCI_VERSION_0_2                     0x00002
+     float_flag_input_denormal_flushed = 0x0020,
-+#define QEMU_PSCI_VERSION_1_0                     0x10000
+-    float_flag_output_denormal = 0x0040,
- #define QEMU_PSCI_VERSION_1_1                     0x10001
++    /* We flushed an output denormal to 0 (because of flush_to_zero) */
++    float_flag_output_denormal_flushed = 0x0040,
- MISMATCH_CHECK(QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED, PSCI_0_2_TOS_MP);
+     float_flag_invalid_isi     = 0x0080,  /* inf - inf */
-diff --git a/hw/arm/boot.c b/hw/arm/boot.c
+     float_flag_invalid_imz     = 0x0100,  /* inf * 0 */
      float_flag_invalid_idi     = 0x0200,  /* inf / inf */
 diff --git a/fpu/softfloat.c b/fpu/softfloat.c
 index XXXXXXX..XXXXXXX 100644
---- a/hw/arm/boot.c
+--- a/fpu/softfloat.c
-+++ b/hw/arm/boot.c
++++ b/fpu/softfloat.c
-@@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt)
+@@ -XXX,XX +XXX,XX @@ floatx80 roundAndPackFloatx80(FloatX80RoundPrec roundingPrecision, bool zSign,
          }
          if ( zExp <= 0 ) {
              if (status->flush_to_zero) {
 -                float_raise(float_flag_output_denormal, status);
 +                float_raise(float_flag_output_denormal_flushed, status);
                  return packFloatx80(zSign, 0, 0);
              }
              isTiny = status->tininess_before_rounding
 diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/vfp_helper.c
 +++ b/target/arm/vfp_helper.c
@@ -XXX,XX +XXX,XX @@ static inline uint32_t vfp_exceptbits_from_host(int host_bits)
      if (host_bits & float_flag_overflow) {
          target_bits |= FPSR_OFC;
      }
+-    if (host_bits & (float_flag_underflow | float_flag_output_denormal)) {
-     qemu_fdt_add_subnode(fdt, "/psci");
++    if (host_bits & (float_flag_underflow | float_flag_output_denormal_flushed)) {
--    if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2 ||
+         target_bits |= FPSR_UFC;
--        armcpu->psci_version == QEMU_PSCI_VERSION_1_1) {
+     }
--        if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2) {
+     if (host_bits & float_flag_inexact) {
-+    if (armcpu->psci_version >= QEMU_PSCI_VERSION_0_2) {
+diff --git a/target/i386/tcg/fpu_helper.c b/target/i386/tcg/fpu_helper.c
 +        if (armcpu->psci_version < QEMU_PSCI_VERSION_1_0) {
              const char comp[] = "arm,psci-0.2\0arm,psci";
              qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
          } else {
 diff --git a/target/arm/kvm64.c b/target/arm/kvm64.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/kvm64.c
+--- a/target/i386/tcg/fpu_helper.c
-+++ b/target/arm/kvm64.c
++++ b/target/i386/tcg/fpu_helper.c
-@@ -XXX,XX +XXX,XX @@ int kvm_arch_init_vcpu(CPUState *cs)
+@@ -XXX,XX +XXX,XX @@ void update_mxcsr_from_sse_status(CPUX86State *env)
-     uint64_t mpidr;
+                    (flags & float_flag_overflow ? FPUS_OE : 0) |
-     ARMCPU *cpu = ARM_CPU(cs);
+                    (flags & float_flag_underflow ? FPUS_UE : 0) |
-     CPUARMState *env = &cpu->env;
+                    (flags & float_flag_inexact ? FPUS_PE : 0) |
-+    uint64_t psciver;
+-                   (flags & float_flag_output_denormal ? FPUS_UE | FPUS_PE :
++                   (flags & float_flag_output_denormal_flushed ? FPUS_UE | FPUS_PE :
-     if (cpu->kvm_target == QEMU_KVM_ARM_TARGET_NONE ||
+));
-         !object_dynamic_cast(OBJECT(cpu), TYPE_AARCH64_CPU)) {
+ }
-@@ -XXX,XX +XXX,XX @@ int kvm_arch_init_vcpu(CPUState *cs)
 diff --git a/target/m68k/fpu_helper.c b/target/m68k/fpu_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/m68k/fpu_helper.c
 +++ b/target/m68k/fpu_helper.c
@@ -XXX,XX +XXX,XX @@ static int cpu_m68k_exceptbits_from_host(int host_bits)
      if (host_bits & float_flag_overflow) {
          target_bits |= 0x40;
      }
 -    if (host_bits & (float_flag_underflow | float_flag_output_denormal)) {
 +    if (host_bits & (float_flag_underflow | float_flag_output_denormal_flushed)) {
          target_bits |= 0x20;
      }
      if (host_bits & float_flag_divbyzero) {
 diff --git a/target/mips/tcg/msa_helper.c b/target/mips/tcg/msa_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/mips/tcg/msa_helper.c
 +++ b/target/mips/tcg/msa_helper.c
@@ -XXX,XX +XXX,XX @@ static inline int update_msacsr(CPUMIPSState *env, int action, int denormal)
      }
      /* Set Inexact (I) and Underflow (U) when flushing outputs to zero */
 -    if ((ieee_exception_flags & float_flag_output_denormal) &&
 +    if ((ieee_exception_flags & float_flag_output_denormal_flushed) &&
              (env->active_tc.msacsr & MSACSR_FS_MASK) != 0) {
          mips_exception_flags |= FP_INEXACT;
          if (action & CLEAR_FS_UNDERFLOW) {
 diff --git a/target/rx/op_helper.c b/target/rx/op_helper.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/rx/op_helper.c
 +++ b/target/rx/op_helper.c
@@ -XXX,XX +XXX,XX @@ static void update_fpsw(CPURXState *env, float32 ret, uintptr_t retaddr)
              SET_FPSW(X);
          }
+         if ((xcpt & (float_flag_input_denormal_flushed
+-                     | float_flag_output_denormal))
++                     | float_flag_output_denormal_flushed))
+             && !FIELD_EX32(env->fpsw, FPSW, DN)) {
+             env->fpsw = FIELD_DP32(env->fpsw, FPSW, CE, 1);
+         }
+diff --git a/target/tricore/fpu_helper.c b/target/tricore/fpu_helper.c
+index XXXXXXX..XXXXXXX 100644
+--- a/target/tricore/fpu_helper.c
++++ b/target/tricore/fpu_helper.c
+@@ -XXX,XX +XXX,XX @@ static inline uint8_t f_get_excp_flags(CPUTriCoreState *env)
+            & (float_flag_invalid
+               | float_flag_overflow
+               | float_flag_underflow
+-              | float_flag_output_denormal
++              | float_flag_output_denormal_flushed
+               | float_flag_divbyzero
+               | float_flag_inexact);
+ }
+@@ -XXX,XX +XXX,XX @@ static void f_update_psw_flags(CPUTriCoreState *env, uint8_t flags)
+         some_excp = 1;
      }
-+    /*
+-    if (flags & float_flag_underflow || flags & float_flag_output_denormal) {
-+     * KVM reports the exact PSCI version it is implementing via a
++    if (flags & float_flag_underflow || flags & float_flag_output_denormal_flushed) {
-+     * special sysreg. If it is present, use its contents to determine
+         env->FPU_FU = 1 << 31;
-+     * what to report to the guest in the dtb (it is the PSCI version,
+         some_excp = 1;
-+     * in the same 15-bits major 16-bits minor format that PSCI_VERSION
+     }
-+     * returns).
+@@ -XXX,XX +XXX,XX @@ static void f_update_psw_flags(CPUTriCoreState *env, uint8_t flags)
-+     */
+         some_excp = 1;
-+    if (!kvm_get_one_reg(cs, KVM_REG_ARM_PSCI_VERSION, &psciver)) {
+     }
-+        cpu->psci_version = psciver;
-+    }
+-    if (flags & float_flag_inexact || flags & float_flag_output_denormal) {
-+
++    if (flags & float_flag_inexact || flags & float_flag_output_denormal_flushed) {
-     /*
+         env->PSW |= 1 << 26;
-      * When KVM is in use, PSCI is emulated in-kernel and not by qemu.
+         some_excp = 1;
-      * Currently KVM has its own idea about MPIDR assignment, so we
+     }
 diff --git a/fpu/softfloat-parts.c.inc b/fpu/softfloat-parts.c.inc
 index XXXXXXX..XXXXXXX 100644
 --- a/fpu/softfloat-parts.c.inc
 +++ b/fpu/softfloat-parts.c.inc
@@ -XXX,XX +XXX,XX @@ static void partsN(uncanon_normal)(FloatPartsN *p, float_status *s,
          }
          frac_shr(p, frac_shift);
      } else if (s->flush_to_zero) {
 -        flags |= float_flag_output_denormal;
 +        flags |= float_flag_output_denormal_flushed;
          p->cls = float_class_zero;
          exp = 0;
          frac_clear(p);
 --
-.25.1
+.34.1

-[PULL 02/26] hw/arm/mps2-tz.c: Update AN547 documentation URL
+[PULL 33/36] fpu: Fix a comment in softfloat-types.h
-The AN547 application note URL has changed: update our comment
+In softfloat-types.h a comment documents that if the float_status
-accordingly. (Rev B is still downloadable from the old URL,
+field flush_to_zero is set then we flush denormalised results to 0
-but there is a new Rev C of the document now.)
+and set the inexact flag.  This isn't correct: the status flag that
 we set when flush_to_zero causes us to flush an output to zero is
 float_flag_output_denormal_flushed.
 Correct the comment.
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-Tested-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
+Message-id: 20250124162836.2332150-22-peter.maydell@linaro.org
 Message-id: 20220221094144.426191-1-peter.maydell@linaro.org
 ---
- hw/arm/mps2-tz.c | 2 +-
+ include/fpu/softfloat-types.h | 2 +-
 file changed, 1 insertion(+), 1 deletion(-)
-diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c
+diff --git a/include/fpu/softfloat-types.h b/include/fpu/softfloat-types.h
 index XXXXXXX..XXXXXXX 100644
---- a/hw/arm/mps2-tz.c
+--- a/include/fpu/softfloat-types.h
-+++ b/hw/arm/mps2-tz.c
++++ b/include/fpu/softfloat-types.h
-@@ -XXX,XX +XXX,XX @@
+@@ -XXX,XX +XXX,XX @@ typedef struct float_status {
-  * Application Note AN524:
+     Float3NaNPropRule float_3nan_prop_rule;
-  * https://developer.arm.com/documentation/dai0524/latest/
+     FloatInfZeroNaNRule float_infzeronan_rule;
-  * Application Note AN547:
+     bool tininess_before_rounding;
-- * https://developer.arm.com/-/media/Arm%20Developer%20Community/PDF/DAI0547B_SSE300_PLUS_U55_FPGA_for_mps3.pdf
+-    /* should denormalised results go to zero and set the inexact flag? */
-+ * https://developer.arm.com/documentation/dai0547/latest/
++    /* should denormalised results go to zero and set output_denormal_flushed? */
-  *
+     bool flush_to_zero;
-  * The AN505 defers to the Cortex-M33 processor ARMv8M IoT Kit FVP User Guide
+     /* should denormalised inputs go to zero and set input_denormal_flushed? */
-  * (ARM ECM0601256) for the details of some of the device layout:
+     bool flush_inputs_to_zero;
 --
-.25.1
+.34.1

-[PULL 25/26] ui/cocoa.m: Fix updateUIInfo threading issues
+[PULL 34/36] target/arm: Remove redundant advsimd float16 helpers
-The updateUIInfo method makes Cocoa API calls.  It also calls back
+The advsimd_addh etc helpers defined in helper-a64.c are identical to
-into QEMU functions like dpy_set_ui_info().  To do this safely, we
+the vfp_addh etc helpers defined in helper-vfp.c: both take two
-need to follow two rules:
+float16 inputs (in a uint32_t type) plus a float_status* and are
- * Cocoa API calls are made on the Cocoa UI thread
+simple wrappers around the softfloat float16_* functions.
  * When calling back into QEMU we must hold the iothread lock
-Fix the places where we got this wrong, by taking the iothread lock
+(The duplication seems to be a historical accident: we added the
-while executing updateUIInfo, and moving the call in cocoa_switch()
+advsimd helpers in 2018 as part of the A64 implementation, and at
-inside the dispatch_async block.
+that time there was no f16 emulation in A32.  Then later we added the
 A32 f16 handling by extending the existing VFP helper macros to
 generate f16 versions as well as f32 and f64, and didn't realise we
 could clean things up.)
-Some of the Cocoa UI methods which call updateUIInfo are invoked as
+Remove the now-unnecessary advsimd helpers and make the places that
-part of the initial application startup, while we're still doing the
+generated calls to them use the vfp helpers instead. Many of the
-little cross-thread dance described in the comment just above
+helper functions were already unused.
-call_qemu_main().  This meant they were calling back into the QEMU UI
-layer before we'd actually finished initializing our display and
+(The remaining advsimd_ helpers are those which don't have vfp
-registered the DisplayChangeListener, which isn't really valid.  Once
+versions.)
 updateUIInfo takes the iothread lock, we no longer get away with
 this, because during this startup phase the iothread lock is held by
 the QEMU main-loop thread which is waiting for us to finish our
 display initialization.  So we must suppress updateUIInfo until
 applicationDidFinishLaunching allows the QEMU main-loop thread to
 continue.
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
-Reviewed-by: Akihiko Odaki <akihiko.odaki@gmail.com>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
-Tested-by: Akihiko Odaki <akihiko.odaki@gmail.com>
+Message-id: 20250124162836.2332150-26-peter.maydell@linaro.org
 Message-id: 20220224101330.967429-2-peter.maydell@linaro.org
 ---
- ui/cocoa.m | 25 ++++++++++++++++++++++---
+ target/arm/tcg/helper-a64.h    |  8 --------
-file changed, 22 insertions(+), 3 deletions(-)
+ target/arm/tcg/helper-a64.c    |  9 ---------
  target/arm/tcg/translate-a64.c | 16 ++++++++--------
 files changed, 8 insertions(+), 25 deletions(-)
-diff --git a/ui/cocoa.m b/ui/cocoa.m
+diff --git a/target/arm/tcg/helper-a64.h b/target/arm/tcg/helper-a64.h
 index XXXXXXX..XXXXXXX 100644
---- a/ui/cocoa.m
+--- a/target/arm/tcg/helper-a64.h
-+++ b/ui/cocoa.m
++++ b/target/arm/tcg/helper-a64.h
-@@ -XXX,XX +XXX,XX @@ QemuCocoaView *cocoaView;
+@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_2(frecpx_f16, TCG_CALL_NO_RWG, f16, f16, fpst)
-     }
+ DEF_HELPER_FLAGS_2(fcvtx_f64_to_f32, TCG_CALL_NO_RWG, f32, f64, fpst)
  DEF_HELPER_FLAGS_3(crc32_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32)
  DEF_HELPER_FLAGS_3(crc32c_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32)
 -DEF_HELPER_FLAGS_3(advsimd_maxh, TCG_CALL_NO_RWG, f16, f16, f16, fpst)
 -DEF_HELPER_FLAGS_3(advsimd_minh, TCG_CALL_NO_RWG, f16, f16, f16, fpst)
 -DEF_HELPER_FLAGS_3(advsimd_maxnumh, TCG_CALL_NO_RWG, f16, f16, f16, fpst)
 -DEF_HELPER_FLAGS_3(advsimd_minnumh, TCG_CALL_NO_RWG, f16, f16, f16, fpst)
 -DEF_HELPER_3(advsimd_addh, f16, f16, f16, fpst)
 -DEF_HELPER_3(advsimd_subh, f16, f16, f16, fpst)
 -DEF_HELPER_3(advsimd_mulh, f16, f16, f16, fpst)
 -DEF_HELPER_3(advsimd_divh, f16, f16, f16, fpst)
  DEF_HELPER_3(advsimd_ceq_f16, i32, f16, f16, fpst)
  DEF_HELPER_3(advsimd_cge_f16, i32, f16, f16, fpst)
  DEF_HELPER_3(advsimd_cgt_f16, i32, f16, f16, fpst)
 diff --git a/target/arm/tcg/helper-a64.c b/target/arm/tcg/helper-a64.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/tcg/helper-a64.c
 +++ b/target/arm/tcg/helper-a64.c
@@ -XXX,XX +XXX,XX @@ uint32_t ADVSIMD_HELPER(name, h)(uint32_t a, uint32_t b, float_status *fpst) \
      return float16_ ## name(a, b, fpst);    \
  }
--- (void) updateUIInfo
+-ADVSIMD_HALFOP(add)
-+- (void) updateUIInfoLocked
+-ADVSIMD_HALFOP(sub)
- {
+-ADVSIMD_HALFOP(mul)
-+    /* Must be called with the iothread lock, i.e. via updateUIInfo */
+-ADVSIMD_HALFOP(div)
-     NSSize frameSize;
+-ADVSIMD_HALFOP(min)
-     QemuUIInfo info;
+-ADVSIMD_HALFOP(max)
+-ADVSIMD_HALFOP(minnum)
-@@ -XXX,XX +XXX,XX @@ QemuCocoaView *cocoaView;
+-ADVSIMD_HALFOP(maxnum)
-     dpy_set_ui_info(dcl.con, &info, TRUE);
+-
  #define ADVSIMD_TWOHALFOP(name)                                         \
  uint32_t ADVSIMD_HELPER(name, 2h)(uint32_t two_a, uint32_t two_b,       \
                                    float_status *fpst)                   \
 diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c
 index XXXXXXX..XXXXXXX 100644
 --- a/target/arm/tcg/translate-a64.c
 +++ b/target/arm/tcg/translate-a64.c
@@ -XXX,XX +XXX,XX @@ static const FPScalar f_scalar_fmul = {
  TRANS(FMUL_s, do_fp3_scalar, a, &f_scalar_fmul)
  static const FPScalar f_scalar_fmax = {
 -    gen_helper_advsimd_maxh,
 +    gen_helper_vfp_maxh,
      gen_helper_vfp_maxs,
      gen_helper_vfp_maxd,
  };
  TRANS(FMAX_s, do_fp3_scalar, a, &f_scalar_fmax)
  static const FPScalar f_scalar_fmin = {
 -    gen_helper_advsimd_minh,
 +    gen_helper_vfp_minh,
      gen_helper_vfp_mins,
      gen_helper_vfp_mind,
  };
  TRANS(FMIN_s, do_fp3_scalar, a, &f_scalar_fmin)
  static const FPScalar f_scalar_fmaxnm = {
 -    gen_helper_advsimd_maxnumh,
 +    gen_helper_vfp_maxnumh,
      gen_helper_vfp_maxnums,
      gen_helper_vfp_maxnumd,
  };
  TRANS(FMAXNM_s, do_fp3_scalar, a, &f_scalar_fmaxnm)
  static const FPScalar f_scalar_fminnm = {
 -    gen_helper_advsimd_minnumh,
 +    gen_helper_vfp_minnumh,
      gen_helper_vfp_minnums,
      gen_helper_vfp_minnumd,
  };
@@ -XXX,XX +XXX,XX @@ static bool do_fp_reduction(DisasContext *s, arg_qrr_e *a,
      return true;
  }
-+- (void) updateUIInfo
+-TRANS_FEAT(FMAXNMV_h, aa64_fp16, do_fp_reduction, a, gen_helper_advsimd_maxnumh)
-+{
+-TRANS_FEAT(FMINNMV_h, aa64_fp16, do_fp_reduction, a, gen_helper_advsimd_minnumh)
-+    if (!allow_events) {
+-TRANS_FEAT(FMAXV_h, aa64_fp16, do_fp_reduction, a, gen_helper_advsimd_maxh)
-+        /*
+-TRANS_FEAT(FMINV_h, aa64_fp16, do_fp_reduction, a, gen_helper_advsimd_minh)
-+         * Don't try to tell QEMU about UI information in the application
++TRANS_FEAT(FMAXNMV_h, aa64_fp16, do_fp_reduction, a, gen_helper_vfp_maxnumh)
-+         * startup phase -- we haven't yet registered dcl with the QEMU UI
++TRANS_FEAT(FMINNMV_h, aa64_fp16, do_fp_reduction, a, gen_helper_vfp_minnumh)
-+         * layer, and also trying to take the iothread lock would deadlock.
++TRANS_FEAT(FMAXV_h, aa64_fp16, do_fp_reduction, a, gen_helper_vfp_maxh)
-+         * When cocoa_display_init() does register the dcl, the UI layer
++TRANS_FEAT(FMINV_h, aa64_fp16, do_fp_reduction, a, gen_helper_vfp_minh)
-+         * will call cocoa_switch(), which will call updateUIInfo, so
-+         * we don't lose any information here.
+ TRANS(FMAXNMV_s, do_fp_reduction, a, gen_helper_vfp_maxnums)
-+         */
+ TRANS(FMINNMV_s, do_fp_reduction, a, gen_helper_vfp_minnums)
 +        return;
 +    }
 +
 +    with_iothread_lock(^{
 +        [self updateUIInfoLocked];
 +    });
 +}
 +
  - (void)viewDidMoveToWindow
  {
      [self updateUIInfo];
@@ -XXX,XX +XXX,XX @@ static void cocoa_switch(DisplayChangeListener *dcl,
      COCOA_DEBUG("qemu_cocoa: cocoa_switch\n");
 -    [cocoaView updateUIInfo];
 -
      // The DisplaySurface will be freed as soon as this callback returns.
      // We take a reference to the underlying pixman image here so it does
      // not disappear from under our feet; the switchSurface method will
@@ -XXX,XX +XXX,XX @@ static void cocoa_switch(DisplayChangeListener *dcl,
      pixman_image_ref(image);
      dispatch_async(dispatch_get_main_queue(), ^{
 +        [cocoaView updateUIInfo];
          [cocoaView switchSurface:image];
      });
      [pool release];
 --
-.25.1
+.34.1

-[PULL 12/26] target/arm: Pass outputsize down to check_s2_mmu_setup
+[PULL 35/36] target/arm: Use FPST_A64_F16 for halfprec-to-other conversions
-From: Richard Henderson <richard.henderson@linaro.org>
+We should be using the F16-specific float_status for conversions from
 half-precision, because halfprec inputs never set Input Denormal.
-Pass down the width of the output address from translation.
+Without FEAT_AHP, using the wrong fpst here had no effect, because
-For now this is still just PAMax, but a subsequent patch will
+the only difference between the A64_F16 and A64 fpst is its handling
-compute the correct value from TCR_ELx.{I}PS.
+of flush-to-zero on input and output, and the helper functions
 vfp_fcvt_f16_to_* and vfp_fcvt_*_to_f16 all explicitly squash the
 relevant flushing flags, and flush_inputs_to_zero was the only way
 that IDC could be set.
-Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
+With FEAT_AHP, the FPCR.AH=1 behaviour sets IDC for
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
+input_denormal_used, which we will only ignore in
-Message-id: 20220301215958.157011-6-richard.henderson@linaro.org
+vfp_get_fpsr_from_host() for the A64_F16 fpst; so it matters that we
 use that one for f16 inputs (and the normal one for single/double to
 f16 conversions).
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
+Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
+Message-id: 20250124162836.2332150-27-peter.maydell@linaro.org
 ---
- target/arm/helper.c | 21 ++++++++++-----------
+ target/arm/tcg/translate-a64.c | 9 ++++++---
-file changed, 10 insertions(+), 11 deletions(-)
+ target/arm/tcg/translate-sve.c | 4 ++--
 files changed, 8 insertions(+), 5 deletions(-)
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/target/arm/tcg/translate-a64.c
-+++ b/target/arm/helper.c
++++ b/target/arm/tcg/translate-a64.c
-@@ -XXX,XX +XXX,XX @@ do_fault:
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_sh(DisasContext *s, arg_rr *a)
-  * false otherwise.
+     if (fp_access_check(s)) {
-  */
+         TCGv_i32 tcg_rn = read_fp_hreg(s, a->rn);
- static bool check_s2_mmu_setup(ARMCPU *cpu, bool is_aa64, int level,
+         TCGv_i32 tcg_rd = tcg_temp_new_i32();
--                               int inputsize, int stride)
+-        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64);
-+                               int inputsize, int stride, int outputsize)
++        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64_F16);
- {
+         TCGv_i32 tcg_ahp = get_ahp_flag();
-     const int grainsize = stride + 3;
-     int startsizecheck;
+         gen_helper_vfp_fcvt_f16_to_f32(tcg_rd, tcg_rn, tcg_fpst, tcg_ahp);
-@@ -XXX,XX +XXX,XX @@ static bool check_s2_mmu_setup(ARMCPU *cpu, bool is_aa64, int level,
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVT_s_dh(DisasContext *s, arg_rr *a)
      if (fp_access_check(s)) {
          TCGv_i32 tcg_rn = read_fp_hreg(s, a->rn);
          TCGv_i64 tcg_rd = tcg_temp_new_i64();
 -        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64);
 +        TCGv_ptr tcg_fpst = fpstatus_ptr(FPST_A64_F16);
          TCGv_i32 tcg_ahp = get_ahp_flag();
          gen_helper_vfp_fcvt_f16_to_f64(tcg_rd, tcg_rn, tcg_fpst, tcg_ahp);
@@ -XXX,XX +XXX,XX @@ static bool trans_FCVTL_v(DisasContext *s, arg_qrr_e *a)
          return true;
      }
-     if (is_aa64) {
+-    fpst = fpstatus_ptr(FPST_A64);
--        CPUARMState *env = &cpu->env;
+     if (a->esz == MO_64) {
--        unsigned int pamax = arm_pamax(cpu);
+         /* 32 -> 64 bit fp conversion */
--
+         TCGv_i64 tcg_res[2];
-         switch (stride) {
+         TCGv_i32 tcg_op = tcg_temp_new_i32();
-         case 13: /* 64KB Pages.  */
+         int srcelt = a->q ? 2 : 0;
--            if (level == 0 || (level == 1 && pamax <= 42)) {
-+            if (level == 0 || (level == 1 && outputsize <= 42)) {
++        fpst = fpstatus_ptr(FPST_A64);
-                 return false;
++
-             }
+         for (pass = 0; pass < 2; pass++) {
-             break;
+             tcg_res[pass] = tcg_temp_new_i64();
-         case 11: /* 16KB Pages.  */
+             read_vec_element_i32(s, tcg_op, a->rn, srcelt + pass, MO_32);
--            if (level == 0 || (level == 1 && pamax <= 40)) {
+@@ -XXX,XX +XXX,XX @@ static bool trans_FCVTL_v(DisasContext *s, arg_qrr_e *a)
-+            if (level == 0 || (level == 1 && outputsize <= 40)) {
+         TCGv_i32 tcg_res[4];
-                 return false;
+         TCGv_i32 ahp = get_ahp_flag();
-             }
-             break;
++        fpst = fpstatus_ptr(FPST_A64_F16);
-         case 9: /* 4KB Pages.  */
++
--            if (level == 0 && pamax <= 42) {
+         for (pass = 0; pass < 4; pass++) {
-+            if (level == 0 && outputsize <= 42) {
+             tcg_res[pass] = tcg_temp_new_i32();
-                 return false;
+             read_vec_element_i32(s, tcg_res[pass], a->rn, srcelt + pass, MO_16);
-             }
+diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c
-             break;
+index XXXXXXX..XXXXXXX 100644
-@@ -XXX,XX +XXX,XX @@ static bool check_s2_mmu_setup(ARMCPU *cpu, bool is_aa64, int level,
+--- a/target/arm/tcg/translate-sve.c
-         }
++++ b/target/arm/tcg/translate-sve.c
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FCMLA_zzxz, aa64_sve, gen_gvec_fpst_zzzz, fcmla_idx_fns[a->esz],
-         /* Inputsize checks.  */
+ TRANS_FEAT(FCVT_sh, aa64_sve, gen_gvec_fpst_arg_zpz,
--        if (inputsize > pamax &&
+            gen_helper_sve_fcvt_sh, a, 0, FPST_A64)
--            (arm_el_is_aa64(env, 1) || inputsize > 40)) {
+ TRANS_FEAT(FCVT_hs, aa64_sve, gen_gvec_fpst_arg_zpz,
-+        if (inputsize > outputsize &&
+-           gen_helper_sve_fcvt_hs, a, 0, FPST_A64)
-+            (arm_el_is_aa64(&cpu->env, 1) || inputsize > 40)) {
++           gen_helper_sve_fcvt_hs, a, 0, FPST_A64_F16)
-             /* This is CONSTRAINED UNPREDICTABLE and we choose to fault.  */
-             return false;
+ TRANS_FEAT(BFCVT, aa64_sve_bf16, gen_gvec_fpst_arg_zpz,
-         }
+            gen_helper_sve_bfcvt, a, 0, FPST_A64)
-@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
+@@ -XXX,XX +XXX,XX @@ TRANS_FEAT(BFCVT, aa64_sve_bf16, gen_gvec_fpst_arg_zpz,
-     target_ulong page_size;
+ TRANS_FEAT(FCVT_dh, aa64_sve, gen_gvec_fpst_arg_zpz,
-     uint32_t attrs;
+            gen_helper_sve_fcvt_dh, a, 0, FPST_A64)
-     int32_t stride;
+ TRANS_FEAT(FCVT_hd, aa64_sve, gen_gvec_fpst_arg_zpz,
--    int addrsize, inputsize;
+-           gen_helper_sve_fcvt_hd, a, 0, FPST_A64)
-+    int addrsize, inputsize, outputsize;
++           gen_helper_sve_fcvt_hd, a, 0, FPST_A64_F16)
-     TCR *tcr = regime_tcr(env, mmu_idx);
+ TRANS_FEAT(FCVT_ds, aa64_sve, gen_gvec_fpst_arg_zpz,
-     int ap, ns, xn, pxn;
+            gen_helper_sve_fcvt_ds, a, 0, FPST_A64)
-     uint32_t el = regime_el(env, mmu_idx);
+ TRANS_FEAT(FCVT_sd, aa64_sve, gen_gvec_fpst_arg_zpz,
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
          addrsize = 64 - 8 * param.tbi;
          inputsize = 64 - param.tsz;
 +        outputsize = arm_pamax(cpu);
      } else {
          param = aa32_va_parameters(env, address, mmu_idx);
          level = 1;
          addrsize = (mmu_idx == ARMMMUIdx_Stage2 ? 40 : 32);
          inputsize = addrsize - param.tsz;
 +        outputsize = 40;
      }
      /*
@@ -XXX,XX +XXX,XX @@ static bool get_phys_addr_lpae(CPUARMState *env, uint64_t address,
          /* Check that the starting level is valid. */
          ok = check_s2_mmu_setup(cpu, aarch64, startlevel,
 -                                inputsize, stride);
 +                                inputsize, stride, outputsize);
          if (!ok) {
              fault_type = ARMFault_Translation;
              goto do_fault;
 --
-.25.1
+.34.1

-[PULL 15/26] target/arm: Prepare DBGBVR and DBGWVR for FEAT_LVA
+[PULL 36/36] hw/usb/canokey: Fix buffer overflow for OUT packet
-From: Richard Henderson <richard.henderson@linaro.org>
+From: Hongren Zheng <i@zenithal.me>
-The original A.a revision of the AArch64 ARM required that we
+When USBPacket in OUT direction has larger payload
-force-extend the addresses in these registers from 49 bits.
+than the ep_out_buffer (of size 512), a buffer overflow
-This language has been loosened via a combination of IMPLEMENTATION
+would occur.
 DEFINED and CONSTRAINED UNPREDICTABLE to allow consideration of
 the entire aligned address.
-This means that we do not have to consider whether or not FEAT_LVA
+It could be fixed by limiting the size of usb_packet_copy
-is enabled, and decide from which bit an address might need to be
+to be at most buffer size. Further optimization gets rid
-extended.
+of the ep_out_buffer and directly uses ep_out as the target
 buffer.
+This is reported by a security researcher who artificially
+constructed an OUT packet of size 2047. The report has gone
+through the QEMU security process, and as this device is for
+testing purposes and no deployment of it in a virtualization
+environment has been observed, it is triaged not to be a security bug.
+Cc: qemu-stable@nongnu.org
+Fixes: d7d34918551dc48 ("hw/usb: Add CanoKey Implementation")
+Reported-by: Juan Jose Lopez Jaimez <thatjiaozi@gmail.com>
+Signed-off-by: Hongren Zheng <i@zenithal.me>
+Message-id: Z4TfMOrZz6IQYl_h@Sun
 Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
-Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
-Message-id: 20220301215958.157011-9-richard.henderson@linaro.org
 Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
 ---
- target/arm/helper.c | 32 ++++++++++++++++++++++++--------
+ hw/usb/canokey.h | 4 ----
-file changed, 24 insertions(+), 8 deletions(-)
+ hw/usb/canokey.c | 6 +++---
 files changed, 3 insertions(+), 7 deletions(-)
-diff --git a/target/arm/helper.c b/target/arm/helper.c
+diff --git a/hw/usb/canokey.h b/hw/usb/canokey.h
 index XXXXXXX..XXXXXXX 100644
---- a/target/arm/helper.c
+--- a/hw/usb/canokey.h
-+++ b/target/arm/helper.c
++++ b/hw/usb/canokey.h
-@@ -XXX,XX +XXX,XX @@ static void dbgwvr_write(CPUARMState *env, const ARMCPRegInfo *ri,
+@@ -XXX,XX +XXX,XX @@
-     ARMCPU *cpu = env_archcpu(env);
+ #define CANOKEY_EP_NUM 3
-     int i = ri->crm;
+ /* BULK/INTR IN can be up to 1352 bytes, e.g. get key info */
+ #define CANOKEY_EP_IN_BUFFER_SIZE 2048
--    /* Bits [63:49] are hardwired to the value of bit [48]; that is, the
+-/* BULK OUT can be up to 270 bytes, e.g. PIV import cert */
--     * register reads and behaves as if values written are sign extended.
+-#define CANOKEY_EP_OUT_BUFFER_SIZE 512
-+    /*
-      * Bits [1:0] are RES0.
+ typedef enum {
-+     *
+     CANOKEY_EP_IN_WAIT,
-+     * It is IMPLEMENTATION DEFINED whether [63:49] ([63:53] with FEAT_LVA)
+@@ -XXX,XX +XXX,XX @@ typedef struct CanoKeyState {
-+     * are hardwired to the value of bit [48] ([52] with FEAT_LVA), or if
+     /* OUT pointer to canokey recv buffer */
-+     * they contain the value written.  It is CONSTRAINED UNPREDICTABLE
+     uint8_t *ep_out[CANOKEY_EP_NUM];
-+     * whether the RESS bits are ignored when comparing an address.
+     uint32_t ep_out_size[CANOKEY_EP_NUM];
-+     *
+-    /* For large BULK OUT, multiple write to ep_out is needed */
-+     * Therefore we are allowed to compare the entire register, which lets
+-    uint8_t ep_out_buffer[CANOKEY_EP_NUM][CANOKEY_EP_OUT_BUFFER_SIZE];
-+     * us avoid considering whether or not FEAT_LVA is actually enabled.
-      */
+     /* Properties */
--    value = sextract64(value, 0, 49) & ~3ULL;
+     char *file; /* canokey-file */
-+    value &= ~3ULL;
+diff --git a/hw/usb/canokey.c b/hw/usb/canokey.c
+index XXXXXXX..XXXXXXX 100644
-     raw_write(env, ri, value);
+--- a/hw/usb/canokey.c
-     hw_watchpoint_update(cpu, i);
++++ b/hw/usb/canokey.c
-@@ -XXX,XX +XXX,XX @@ void hw_breakpoint_update(ARMCPU *cpu, int n)
+@@ -XXX,XX +XXX,XX @@ static void canokey_handle_data(USBDevice *dev, USBPacket *p)
-     case 0: /* unlinked address match */
+     switch (p->pid) {
-     case 1: /* linked address match */
+     case USB_TOKEN_OUT:
-     {
+         trace_canokey_handle_data_out(ep_out, p->iov.size);
--        /* Bits [63:49] are hardwired to the value of bit [48]; that is,
+-        usb_packet_copy(p, key->ep_out_buffer[ep_out], p->iov.size);
--         * we behave as if the register was sign extended. Bits [1:0] are
+         out_pos = 0;
--         * RES0. The BAS field is used to allow setting breakpoints on 16
++        /* segment packet into (possibly multiple) ep_out */
--         * bit wide instructions; it is CONSTRAINED UNPREDICTABLE whether
+         while (out_pos != p->iov.size) {
-+        /*
+             /*
-+         * Bits [1:0] are RES0.
+              * key->ep_out[ep_out] set by prepare_receive
-+         *
+@@ -XXX,XX +XXX,XX @@ static void canokey_handle_data(USBDevice *dev, USBPacket *p)
-+         * It is IMPLEMENTATION DEFINED whether bits [63:49]
+              * to be the buffer length
-+         * ([63:53] for FEAT_LVA) are hardwired to a copy of the sign bit
+              */
-+         * of the VA field ([48] or [52] for FEAT_LVA), or whether the
+             out_len = MIN(p->iov.size - out_pos, key->ep_out_size[ep_out]);
-+         * value is read as written.  It is CONSTRAINED UNPREDICTABLE
+-            memcpy(key->ep_out[ep_out],
-+         * whether the RESS bits are ignored when comparing an address.
+-                    key->ep_out_buffer[ep_out] + out_pos, out_len);
-+         * Therefore we are allowed to compare the entire register, which
++            /* usb_packet_copy would update the pos offset internally */
-+         * lets us avoid considering whether FEAT_LVA is actually enabled.
++            usb_packet_copy(p, key->ep_out[ep_out], out_len);
-+         *
+             out_pos += out_len;
-+         * The BAS field is used to allow setting breakpoints on 16-bit
+             /* update ep_out_size to actual len */
-+         * wide instructions; it is CONSTRAINED UNPREDICTABLE whether
+             key->ep_out_size[ep_out] = out_len;
           * a bp will fire if the addresses covered by the bp and the addresses
           * covered by the insn overlap but the insn doesn't start at the
           * start of the bp address range. We choose to require the insn and
@@ -XXX,XX +XXX,XX @@ void hw_breakpoint_update(ARMCPU *cpu, int n)
           * See also figure D2-3 in the v8 ARM ARM (DDI0487A.c).
           */
          int bas = extract64(bcr, 5, 4);
 -        addr = sextract64(bvr, 0, 49) & ~3ULL;
 +        addr = bvr & ~3ULL;
          if (bas == 0) {
              return;
          }
 --
-.25.1
+.34.1

The following changes since commit 64ada298b98a51eb2512607f6e6180cb330c47b1:

Merge remote-tracking branch 'remotes/legoater/tags/pull-ppc-20220302' into staging (2022-03-02 12:38:46 +0000)

are available in the Git repository at:

https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20220302

for you to fetch changes up to 268c11984e67867c22f53beb3c7f8b98900d66b2:

ui/cocoa.m: Remove unnecessary NSAutoreleasePools (2022-03-02 19:27:37 +0000)

----------------------------------------------------------------
target-arm queue:
 * mps3-an547: Add missing user ahb interfaces
 * hw/arm/mps2-tz.c: Update AN547 documentation URL
 * hw/input/tsc210x: Don't abort on bad SPI word widths
 * hw/i2c: flatten pca954x mux device
 * target/arm: Support PSCI 1.1 and SMCCC 1.0
 * target/arm: Fix early free of TCG temp in handle_simd_shift_fpint_conv()
 * tests/qtest: add qtests for npcm7xx sdhci
 * Implement FEAT_LVA
 * Implement FEAT_LPA
 * Implement FEAT_LPA2 (but do not enable it yet)
 * Report KVM's actual PSCI version to guest in dtb
 * ui/cocoa.m: Fix updateUIInfo threading issues
 * ui/cocoa.m: Remove unnecessary NSAutoreleasePools

----------------------------------------------------------------
Akihiko Odaki (1):
      target/arm: Support PSCI 1.1 and SMCCC 1.0

Jimmy Brisson (1):
      mps3-an547: Add missing user ahb interfaces

Patrick Venture (1):
      hw/i2c: flatten pca954x mux device

Peter Maydell (5):
      hw/arm/mps2-tz.c: Update AN547 documentation URL
      hw/input/tsc210x: Don't abort on bad SPI word widths
      target/arm: Report KVM's actual PSCI version to guest in dtb
      ui/cocoa.m: Fix updateUIInfo threading issues
      ui/cocoa.m: Remove unnecessary NSAutoreleasePools

Richard Henderson (16):
      hw/registerfields: Add FIELD_SEX<N> and FIELD_SDP<N>
      target/arm: Set TCR_EL1.TSZ for user-only
      target/arm: Fault on invalid TCR_ELx.TxSZ
      target/arm: Move arm_pamax out of line
      target/arm: Pass outputsize down to check_s2_mmu_setup
      target/arm: Use MAKE_64BIT_MASK to compute indexmask
      target/arm: Honor TCR_ELx.{I}PS
      target/arm: Prepare DBGBVR and DBGWVR for FEAT_LVA
      target/arm: Implement FEAT_LVA
      target/arm: Implement FEAT_LPA
      target/arm: Extend arm_fi_to_lfsc to level -1
      target/arm: Introduce tlbi_aa64_get_range
      target/arm: Fix TLBIRange.base for 16k and 64k pages
      target/arm: Validate tlbi TG matches translation granule in use
      target/arm: Advertise all page sizes for -cpu max
      target/arm: Implement FEAT_LPA2

Shengtan Mao (1):
      tests/qtest: add qtests for npcm7xx sdhci

Wentao_Liang (1):
      target/arm: Fix early free of TCG temp in handle_simd_shift_fpint_conv()

From: Jimmy Brisson <jimmy.brisson@linaro.org>

With these interfaces missing, TFM would delegate peripherals 0, 1,
2, 3 and 8, and qemu would ignore the delegation of interface 8, as
it thought interface 4 was eth & USB.

This patch corrects this behavior and allows TFM to delegate the
eth & USB peripheral to NS mode.

(The old QEMU behaviour was based on revision B of the AN547
appnote; revision C corrects this error in the documentation,
and this commit brings QEMU into line with how the FPGA
image really behaves.)

Signed-off-by: Jimmy Brisson <jimmy.brisson@linaro.org>
Message-id: 20220210210227.3203883-1-jimmy.brisson@linaro.org
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
[PMM: added commit message note clarifying that the old behaviour
was a docs issue, not because there were two different versions
of the FPGA image]
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
---
 hw/arm/mps2-tz.c | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/arm/mps2-tz.c
+++ b/hw/arm/mps2-tz.c
@@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine)
                 { "gpio1", make_unimp_dev, &mms->gpio[1], 0x41101000, 0x1000 },
                 { "gpio2", make_unimp_dev, &mms->gpio[2], 0x41102000, 0x1000 },
                 { "gpio3", make_unimp_dev, &mms->gpio[3], 0x41103000, 0x1000 },
+                { /* port 4 USER AHB interface 0 */ },
+                { /* port 5 USER AHB interface 1 */ },
+                { /* port 6 USER AHB interface 2 */ },
+                { /* port 7 USER AHB interface 3 */ },
                 { "eth-usb", make_eth_usb, NULL, 0x41400000, 0x200000, { 49 } },
             },
         },
-- 
2.25.1

The AN547 application note URL has changed: update our comment
accordingly. (Rev B is still downloadable from the old URL,
but there is a new Rev C of the document now.)

Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Tested-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Message-id: 20220221094144.426191-1-peter.maydell@linaro.org
---
 hw/arm/mps2-tz.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/arm/mps2-tz.c
+++ b/hw/arm/mps2-tz.c
@@ -XXX,XX +XXX,XX @@
  * Application Note AN524:
  * https://developer.arm.com/documentation/dai0524/latest/
  * Application Note AN547:
- * https://developer.arm.com/-/media/Arm%20Developer%20Community/PDF/DAI0547B_SSE300_PLUS_U55_FPGA_for_mps3.pdf
+ * https://developer.arm.com/documentation/dai0547/latest/
  *
  * The AN505 defers to the Cortex-M33 processor ARMv8M IoT Kit FVP User Guide
  * (ARM ECM0601256) for the details of some of the device layout:
-- 
2.25.1

The tsc210x doesn't support anything other than 16-bit reads on the
SPI bus, but the guest can program the SPI controller to attempt
them anyway. If this happens, don't abort QEMU, just log this as
a guest error.

This fixes our machine_arm_n8x0.py:N8x0Machine.test_n800
acceptance test, which hits this assertion.

The reason we hit the assertion is because the guest kernel thinks
there is a TSC2005 on this SPI bus address, not a TSC210x.  (The n810
*does* have a TSC2005 at this address.) The TSC2005 supports the
24-bit accesses which the guest driver makes, and the TSC210x does
not (that is, our TSC210x emulation is not missing support for a word
width the hardware can handle).  It's not clear whether the problem
here is that the guest kernel incorrectly thinks the n800 has the
same device at this SPI bus address as the n810, or that QEMU's n810
board model doesn't get the SPI devices right.  At this late date
there no longer appears to be any reliable information on the web
about the hardware behaviour, but I am inclined to think this is a
guest kernel bug.  In any case, we prefer not to abort QEMU for
guest-triggerable conditions, so logging the error is the right thing
to do.

Resolves: https://gitlab.com/qemu-project/qemu/-/issues/736
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Message-id: 20220221140750.514557-1-peter.maydell@linaro.org
---
 hw/input/tsc210x.c | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/hw/input/tsc210x.c b/hw/input/tsc210x.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/input/tsc210x.c
+++ b/hw/input/tsc210x.c
@@ -XXX,XX +XXX,XX @@
 #include "hw/hw.h"
 #include "audio/audio.h"
 #include "qemu/timer.h"
+#include "qemu/log.h"
 #include "sysemu/reset.h"
 #include "ui/console.h"
 #include "hw/arm/omap.h"            /* For I2SCodec */
@@ -XXX,XX +XXX,XX @@ uint32_t tsc210x_txrx(void *opaque, uint32_t value, int len)
     TSC210xState *s = opaque;
     uint32_t ret = 0;
 
-    if (len != 16)
-        hw_error("%s: FIXME: bad SPI word width %i\n", __func__, len);
+    if (len != 16) {
+        qemu_log_mask(LOG_GUEST_ERROR,
+                      "%s: bad SPI word width %i\n", __func__, len);
+        return 0;
+    }
 
     /* TODO: sequential reads etc - how do we make sure the host doesn't
      * unintentionally read out a conversion result from a register while
-- 
2.25.1

From: Patrick Venture <venture@google.com>

Previously this device created N subdevices which each owned an i2c bus.
Now this device simply owns the N i2c busses directly.

Tested: Verified devices behind mux are still accessible via qmp and i2c
from within an arm32 SoC.

Reviewed-by: Hao Wu <wuhaotsh@google.com>
Signed-off-by: Patrick Venture <venture@google.com>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Tested-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Message-id: 20220202164533.1283668-1-venture@google.com
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
---
 hw/i2c/i2c_mux_pca954x.c | 77 +++++++---------------------------------
 1 file changed, 13 insertions(+), 64 deletions(-)

diff --git a/hw/i2c/i2c_mux_pca954x.c b/hw/i2c/i2c_mux_pca954x.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/i2c/i2c_mux_pca954x.c
+++ b/hw/i2c/i2c_mux_pca954x.c
@@ -XXX,XX +XXX,XX @@
 #define PCA9548_CHANNEL_COUNT 8
 #define PCA9546_CHANNEL_COUNT 4
 
-/*
- * struct Pca954xChannel - The i2c mux device will have N of these states
- * that own the i2c channel bus.
- * @bus: The owned channel bus.
- * @enabled: Is this channel active?
- */
-typedef struct Pca954xChannel {
-    SysBusDevice parent;
-
-    I2CBus       *bus;
-
-    bool         enabled;
-} Pca954xChannel;
-
-#define TYPE_PCA954X_CHANNEL "pca954x-channel"
-#define PCA954X_CHANNEL(obj) \
-    OBJECT_CHECK(Pca954xChannel, (obj), TYPE_PCA954X_CHANNEL)
-
 /*
  * struct Pca954xState - The pca954x state object.
  * @control: The value written to the mux control.
@@ -XXX,XX +XXX,XX @@ typedef struct Pca954xState {
 
     uint8_t control;
 
-    /* The channel i2c buses. */
-    Pca954xChannel channel[PCA9548_CHANNEL_COUNT];
+    bool enabled[PCA9548_CHANNEL_COUNT];
+    I2CBus *bus[PCA9548_CHANNEL_COUNT];
 } Pca954xState;
 
 /*
@@ -XXX,XX +XXX,XX @@ static bool pca954x_match(I2CSlave *candidate, uint8_t address,
     }
 
     for (i = 0; i < mc->nchans; i++) {
-        if (!mux->channel[i].enabled) {
+        if (!mux->enabled[i]) {
             continue;
         }
 
-        if (i2c_scan_bus(mux->channel[i].bus, address, broadcast,
+        if (i2c_scan_bus(mux->bus[i], address, broadcast,
                          current_devs)) {
             if (!broadcast) {
                 return true;
@@ -XXX,XX +XXX,XX @@ static void pca954x_enable_channel(Pca954xState *s, uint8_t enable_mask)
      */
     for (i = 0; i < mc->nchans; i++) {
         if (enable_mask & (1 << i)) {
-            s->channel[i].enabled = true;
+            s->enabled[i] = true;
         } else {
-            s->channel[i].enabled = false;
+            s->enabled[i] = false;
         }
     }
 }
@@ -XXX,XX +XXX,XX @@ I2CBus *pca954x_i2c_get_bus(I2CSlave *mux, uint8_t channel)
     Pca954xState *pca954x = PCA954X(mux);
 
     g_assert(channel < pc->nchans);
-    return I2C_BUS(qdev_get_child_bus(DEVICE(&pca954x->channel[channel]),
-                                      "i2c-bus"));
-}
-
-static void pca954x_channel_init(Object *obj)
-{
-    Pca954xChannel *s = PCA954X_CHANNEL(obj);
-    s->bus = i2c_init_bus(DEVICE(s), "i2c-bus");
-
-    /* Start all channels as disabled. */
-    s->enabled = false;
-}
-
-static void pca954x_channel_class_init(ObjectClass *klass, void *data)
-{
-    DeviceClass *dc = DEVICE_CLASS(klass);
-    dc->desc = "Pca954x Channel";
+    return pca954x->bus[channel];
 }
 
 static void pca9546_class_init(ObjectClass *klass, void *data)
@@ -XXX,XX +XXX,XX @@ static void pca9548_class_init(ObjectClass *klass, void *data)
     s->nchans = PCA9548_CHANNEL_COUNT;
 }
 
-static void pca954x_realize(DeviceState *dev, Error **errp)
-{
-    Pca954xState *s = PCA954X(dev);
-    Pca954xClass *c = PCA954X_GET_CLASS(s);
-    int i;
-
-    /* SMBus modules. Cannot fail. */
-    for (i = 0; i < c->nchans; i++) {
-        sysbus_realize(SYS_BUS_DEVICE(&s->channel[i]), &error_abort);
-    }
-}
-
 static void pca954x_init(Object *obj)
 {
     Pca954xState *s = PCA954X(obj);
     Pca954xClass *c = PCA954X_GET_CLASS(obj);
     int i;
 
-    /* Only initialize the children we expect. */
+    /* SMBus modules. Cannot fail. */
     for (i = 0; i < c->nchans; i++) {
-        object_initialize_child(obj, "channel[*]", &s->channel[i],
-                                TYPE_PCA954X_CHANNEL);
+        g_autofree gchar *bus_name = g_strdup_printf("i2c.%d", i);
+
+        /* start all channels as disabled. */
+        s->enabled[i] = false;
+        s->bus[i] = i2c_init_bus(DEVICE(s), bus_name);
     }
 }
 
@@ -XXX,XX +XXX,XX @@ static void pca954x_class_init(ObjectClass *klass, void *data)
     rc->phases.enter = pca954x_enter_reset;
 
     dc->desc = "Pca954x i2c-mux";
-    dc->realize = pca954x_realize;
 
     k->write_data = pca954x_write_data;
     k->receive_byte = pca954x_read_byte;
@@ -XXX,XX +XXX,XX @@ static const TypeInfo pca954x_info[] = {
         .parent        = TYPE_PCA954X,
         .class_init    = pca9548_class_init,
     },
-    {
-        .name = TYPE_PCA954X_CHANNEL,
-        .parent = TYPE_SYS_BUS_DEVICE,
-        .class_init = pca954x_channel_class_init,
-        .instance_size = sizeof(Pca954xChannel),
-        .instance_init = pca954x_channel_init,
-    }
 };
 
 DEFINE_TYPES(pca954x_info)
-- 
2.25.1

From: Akihiko Odaki <akihiko.odaki@gmail.com>

Support the latest PSCI on TCG and HVF. A 64-bit function called from
AArch32 now returns NOT_SUPPORTED, which is necessary to adhere to SMC
Calling Convention 1.0. The implementation is still not compliant with
SMCCC 1.3, since TCG and HVF do not implement its mandatory functions.

Signed-off-by: Akihiko Odaki <akihiko.odaki@gmail.com>
Message-id: 20220213035753.34577-1-akihiko.odaki@gmail.com
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
[PMM: update MISMATCH_CHECK checks on PSCI_VERSION macros to match]
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
---
 target/arm/kvm-consts.h | 13 +++++++++----
 hw/arm/boot.c           | 12 +++++++++---
 target/arm/cpu.c        |  5 +++--
 target/arm/hvf/hvf.c    | 27 ++++++++++++++++++++++++++-
 target/arm/kvm64.c      |  2 +-
 target/arm/psci.c       | 35 ++++++++++++++++++++++++++++++++---
 6 files changed, 80 insertions(+), 14 deletions(-)

diff --git a/target/arm/kvm-consts.h b/target/arm/kvm-consts.h
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/kvm-consts.h
+++ b/target/arm/kvm-consts.h
@@ -XXX,XX +XXX,XX @@ MISMATCH_CHECK(QEMU_PSCI_0_1_FN_MIGRATE, KVM_PSCI_FN_MIGRATE);
 #define QEMU_PSCI_0_2_FN64_AFFINITY_INFO QEMU_PSCI_0_2_FN64(4)
 #define QEMU_PSCI_0_2_FN64_MIGRATE QEMU_PSCI_0_2_FN64(5)
 
+#define QEMU_PSCI_1_0_FN_PSCI_FEATURES QEMU_PSCI_0_2_FN(10)
+
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_SUSPEND, PSCI_0_2_FN_CPU_SUSPEND);
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_OFF, PSCI_0_2_FN_CPU_OFF);
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN_CPU_ON, PSCI_0_2_FN_CPU_ON);
@@ -XXX,XX +XXX,XX @@ MISMATCH_CHECK(QEMU_PSCI_0_2_FN_MIGRATE, PSCI_0_2_FN_MIGRATE);
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_CPU_SUSPEND, PSCI_0_2_FN64_CPU_SUSPEND);
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_CPU_ON, PSCI_0_2_FN64_CPU_ON);
 MISMATCH_CHECK(QEMU_PSCI_0_2_FN64_MIGRATE, PSCI_0_2_FN64_MIGRATE);
+MISMATCH_CHECK(QEMU_PSCI_1_0_FN_PSCI_FEATURES, PSCI_1_0_FN_PSCI_FEATURES);
 
 /* PSCI v0.2 return values used by TCG emulation of PSCI */
 
 /* No Trusted OS migration to worry about when offlining CPUs */
 #define QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED        2
 
-/* We implement version 0.2 only */
-#define QEMU_PSCI_0_2_RET_VERSION_0_2                       2
+#define QEMU_PSCI_VERSION_0_1                     0x00001
+#define QEMU_PSCI_VERSION_0_2                     0x00002
+#define QEMU_PSCI_VERSION_1_1                     0x10001
 
 MISMATCH_CHECK(QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED, PSCI_0_2_TOS_MP);
-MISMATCH_CHECK(QEMU_PSCI_0_2_RET_VERSION_0_2,
-               (PSCI_VERSION_MAJOR(0) | PSCI_VERSION_MINOR(2)));
+/* We don't bother to check every possible version value */
+MISMATCH_CHECK(QEMU_PSCI_VERSION_0_2, PSCI_VERSION(0, 2));
+MISMATCH_CHECK(QEMU_PSCI_VERSION_1_1, PSCI_VERSION(1, 1));
 
 /* PSCI return values (inclusive of all PSCI versions) */
 #define QEMU_PSCI_RET_SUCCESS                     0
diff --git a/hw/arm/boot.c b/hw/arm/boot.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/arm/boot.c
+++ b/hw/arm/boot.c
@@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt)
     }
 
     qemu_fdt_add_subnode(fdt, "/psci");
-    if (armcpu->psci_version == 2) {
-        const char comp[] = "arm,psci-0.2\0arm,psci";
-        qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
+    if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2 ||
+        armcpu->psci_version == QEMU_PSCI_VERSION_1_1) {
+        if (armcpu->psci_version == QEMU_PSCI_VERSION_0_2) {
+            const char comp[] = "arm,psci-0.2\0arm,psci";
+            qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
+        } else {
+            const char comp[] = "arm,psci-1.0\0arm,psci-0.2\0arm,psci";
+            qemu_fdt_setprop(fdt, "/psci", "compatible", comp, sizeof(comp));
+        }
 
         cpu_off_fn = QEMU_PSCI_0_2_FN_CPU_OFF;
         if (arm_feature(&armcpu->env, ARM_FEATURE_AARCH64)) {
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/cpu.c
+++ b/target/arm/cpu.c
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_initfn(Object *obj)
      * picky DTB consumer will also provide a helpful error message.
      */
     cpu->dtb_compatible = "qemu,unknown";
-    cpu->psci_version = 1; /* By default assume PSCI v0.1 */
+    cpu->psci_version = QEMU_PSCI_VERSION_0_1; /* By default assume PSCI v0.1 */
     cpu->kvm_target = QEMU_KVM_ARM_TARGET_NONE;
 
     if (tcg_enabled() || hvf_enabled()) {
-        cpu->psci_version = 2; /* TCG and HVF implement PSCI 0.2 */
+        /* TCG and HVF implement PSCI 1.1 */
+        cpu->psci_version = QEMU_PSCI_VERSION_1_1;
     }
 }
 
diff --git a/target/arm/hvf/hvf.c b/target/arm/hvf/hvf.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/hvf/hvf.c
+++ b/target/arm/hvf/hvf.c
@@ -XXX,XX +XXX,XX @@ static bool hvf_handle_psci_call(CPUState *cpu)
 
     switch (param[0]) {
     case QEMU_PSCI_0_2_FN_PSCI_VERSION:
-        ret = QEMU_PSCI_0_2_RET_VERSION_0_2;
+        ret = QEMU_PSCI_VERSION_1_1;
         break;
     case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
         ret = QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED; /* No trusted OS */
@@ -XXX,XX +XXX,XX @@ static bool hvf_handle_psci_call(CPUState *cpu)
     case QEMU_PSCI_0_2_FN_MIGRATE:
         ret = QEMU_PSCI_RET_NOT_SUPPORTED;
         break;
+    case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
+        switch (param[1]) {
+        case QEMU_PSCI_0_2_FN_PSCI_VERSION:
+        case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
+        case QEMU_PSCI_0_2_FN_AFFINITY_INFO:
+        case QEMU_PSCI_0_2_FN64_AFFINITY_INFO:
+        case QEMU_PSCI_0_2_FN_SYSTEM_RESET:
+        case QEMU_PSCI_0_2_FN_SYSTEM_OFF:
+        case QEMU_PSCI_0_1_FN_CPU_ON:
+        case QEMU_PSCI_0_2_FN_CPU_ON:
+        case QEMU_PSCI_0_2_FN64_CPU_ON:
+        case QEMU_PSCI_0_1_FN_CPU_OFF:
+        case QEMU_PSCI_0_2_FN_CPU_OFF:
+        case QEMU_PSCI_0_1_FN_CPU_SUSPEND:
+        case QEMU_PSCI_0_2_FN_CPU_SUSPEND:
+        case QEMU_PSCI_0_2_FN64_CPU_SUSPEND:
+        case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
+            ret = 0;
+            break;
+        case QEMU_PSCI_0_1_FN_MIGRATE:
+        case QEMU_PSCI_0_2_FN_MIGRATE:
+        default:
+            ret = QEMU_PSCI_RET_NOT_SUPPORTED;
+        }
+        break;
     default:
         return false;
     }
diff --git a/target/arm/kvm64.c b/target/arm/kvm64.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/kvm64.c
+++ b/target/arm/kvm64.c
@@ -XXX,XX +XXX,XX @@ int kvm_arch_init_vcpu(CPUState *cs)
         cpu->kvm_init_features[0] |= 1 << KVM_ARM_VCPU_POWER_OFF;
     }
     if (kvm_check_extension(cs->kvm_state, KVM_CAP_ARM_PSCI_0_2)) {
-        cpu->psci_version = 2;
+        cpu->psci_version = QEMU_PSCI_VERSION_0_2;
         cpu->kvm_init_features[0] |= 1 << KVM_ARM_VCPU_PSCI_0_2;
     }
     if (!arm_feature(&cpu->env, ARM_FEATURE_AARCH64)) {
diff --git a/target/arm/psci.c b/target/arm/psci.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/psci.c
+++ b/target/arm/psci.c
@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
 {
     /*
      * This function partially implements the logic for dispatching Power State
-     * Coordination Interface (PSCI) calls (as described in ARM DEN 0022B.b),
+     * Coordination Interface (PSCI) calls (as described in ARM DEN 0022D.b),
      * to the extent required for bringing up and taking down secondary cores,
      * and for handling reset and poweroff requests.
      * Additional information about the calling convention used is available in
@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
     }
 
     if ((param[0] & QEMU_PSCI_0_2_64BIT) && !is_a64(env)) {
-        ret = QEMU_PSCI_RET_INVALID_PARAMS;
+        ret = QEMU_PSCI_RET_NOT_SUPPORTED;
         goto err;
     }
 
@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
         ARMCPU *target_cpu;
 
     case QEMU_PSCI_0_2_FN_PSCI_VERSION:
-        ret = QEMU_PSCI_0_2_RET_VERSION_0_2;
+        ret = QEMU_PSCI_VERSION_1_1;
         break;
     case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
         ret = QEMU_PSCI_0_2_RET_TOS_MIGRATION_NOT_REQUIRED; /* No trusted OS */
@@ -XXX,XX +XXX,XX @@ void arm_handle_psci_call(ARMCPU *cpu)
         }
         helper_wfi(env, 4);
         break;
+    case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
+        switch (param[1]) {
+        case QEMU_PSCI_0_2_FN_PSCI_VERSION:
+        case QEMU_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
+        case QEMU_PSCI_0_2_FN_AFFINITY_INFO:
+        case QEMU_PSCI_0_2_FN64_AFFINITY_INFO:
+        case QEMU_PSCI_0_2_FN_SYSTEM_RESET:
+        case QEMU_PSCI_0_2_FN_SYSTEM_OFF:
+        case QEMU_PSCI_0_1_FN_CPU_ON:
+        case QEMU_PSCI_0_2_FN_CPU_ON:
+        case QEMU_PSCI_0_2_FN64_CPU_ON:
+        case QEMU_PSCI_0_1_FN_CPU_OFF:
+        case QEMU_PSCI_0_2_FN_CPU_OFF:
+        case QEMU_PSCI_0_1_FN_CPU_SUSPEND:
+        case QEMU_PSCI_0_2_FN_CPU_SUSPEND:
+        case QEMU_PSCI_0_2_FN64_CPU_SUSPEND:
+        case QEMU_PSCI_1_0_FN_PSCI_FEATURES:
+            if (!(param[1] & QEMU_PSCI_0_2_64BIT) || is_a64(env)) {
+                ret = 0;
+                break;
+            }
+            /* fallthrough */
+        case QEMU_PSCI_0_1_FN_MIGRATE:
+        case QEMU_PSCI_0_2_FN_MIGRATE:
+        default:
+            ret = QEMU_PSCI_RET_NOT_SUPPORTED;
+            break;
+        }
+        break;
     case QEMU_PSCI_0_1_FN_MIGRATE:
     case QEMU_PSCI_0_2_FN_MIGRATE:
     default:
-- 
2.25.1

From: Wentao_Liang <Wentao_Liang_g@163.com>

handle_simd_shift_fpint_conv() was accidentally freeing the TCG
temporary tcg_fpstatus too early, before the last use of it.  Move
the free down to where it belongs.

Signed-off-by: Wentao_Liang <Wentao_Liang_g@163.com>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
[PMM: cleaned up commit message]
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
---
 target/arm/translate-a64.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/translate-a64.c
+++ b/target/arm/translate-a64.c
@@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
         }
     }
 
-    tcg_temp_free_ptr(tcg_fpstatus);
     tcg_temp_free_i32(tcg_shift);
     gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
+    tcg_temp_free_ptr(tcg_fpstatus);
     tcg_temp_free_i32(tcg_rmode);
 }
 
-- 
2.25.1

From: Shengtan Mao <stmao@google.com>

Reviewed-by: Hao Wu <wuhaotsh@google.com>
Reviewed-by: Chris Rauer <crauer@google.com>
Signed-off-by: Shengtan Mao <stmao@google.com>
Signed-off-by: Patrick Venture <venture@google.com>
Message-id: 20220225174451.192304-1-wuhaotsh@google.com
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
---
 tests/qtest/npcm7xx_sdhci-test.c | 215 +++++++++++++++++++++++++++++++
 tests/qtest/meson.build          |   1 +
 2 files changed, 216 insertions(+)
 create mode 100644 tests/qtest/npcm7xx_sdhci-test.c

diff --git a/tests/qtest/npcm7xx_sdhci-test.c b/tests/qtest/npcm7xx_sdhci-test.c
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/tests/qtest/npcm7xx_sdhci-test.c
@@ -XXX,XX +XXX,XX @@
+/*
+ * QTests for NPCM7xx SD-3.0 / MMC-4.51 Host Controller
+ *
+ * Copyright (c) 2022 Google LLC
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License as published by the
+ * Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ */
+
+#include "qemu/osdep.h"
+#include "hw/sd/npcm7xx_sdhci.h"
+
+#include "libqos/libqtest.h"
+#include "libqtest-single.h"
+#include "libqos/sdhci-cmd.h"
+
+#define NPCM7XX_REG_SIZE 0x100
+#define NPCM7XX_MMC_BA 0xF0842000
+#define NPCM7XX_BLK_SIZE 512
+#define NPCM7XX_TEST_IMAGE_SIZE (1 << 30)
+
+/*
+ * Path of the temporary raw image that backs the emulated SD card.
+ * Set by drive_create() and unlinked/freed by drive_destroy().
+ * Only used inside this test program, so keep it file-local.
+ */
+static char *sd_path;
+
+/*
+ * Start a QEMU instance for the kudo-bmc machine with an sd-card device
+ * backed by the raw image at sd_path, then bring the controller and card
+ * up so that the read/write tests can transfer data.
+ *
+ * Returns the new QTestState; the caller must release it with qtest_quit().
+ */
+static QTestState *setup_sd_card(void)
+{
+    QTestState *qts = qtest_initf(
+        "-machine kudo-bmc "
+        "-device sd-card,drive=drive0 "
+        "-drive id=drive0,if=none,file=%s,format=raw,auto-read-only=off",
+        sd_path);
+
+    /* Reset the controller, then turn its clocks on. */
+    qtest_writew(qts, NPCM7XX_MMC_BA + SDHC_SWRST, SDHC_RESET_ALL);
+    qtest_writew(qts, NPCM7XX_MMC_BA + SDHC_CLKCON,
+                 SDHC_CLOCK_SDCLK_EN | SDHC_CLOCK_INT_STABLE |
+                     SDHC_CLOCK_INT_EN);
+    /*
+     * Card bring-up command sequence; the order matters.
+     * NOTE(review): (41 << 8) is presumably ACMD41 encoded in the command
+     * register, and 0x45670000 presumably carries the card's relative
+     * address in its upper half -- confirm against libqos/sdhci-cmd.h.
+     */
+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_APP_CMD);
+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0x41200000, 0, (41 << 8));
+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_ALL_SEND_CID);
+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0, 0, SDHC_SEND_RELATIVE_ADDR);
+    sdhci_cmd_regs(qts, NPCM7XX_MMC_BA, 0, 0, 0x45670000, 0,
+                   SDHC_SELECT_DESELECT_CARD);
+
+    return qts;
+}
+
+/*
+ * Write @msg (without its NUL terminator) straight into the backing image
+ * file, then read the same number of bytes back through the SDHCI
+ * controller and assert that both copies match.
+ *
+ * @qts: running QEMU instance, as returned by setup_sd_card()
+ * @msg: NUL-terminated string to store on the card
+ */
+static void write_sdread(QTestState *qts, const char *msg)
+{
+    int fd, ret;
+    size_t len = strlen(msg);
+    char *rmsg = g_malloc(len);
+
+    /* write message to sd */
+    /* The file is freshly opened without O_APPEND, so this lands at offset 0 */
+    fd = open(sd_path, O_WRONLY);
+    g_assert(fd >= 0);
+    ret = write(fd, msg, len);
+    close(fd);
+    g_assert(ret == len);
+
+    /* read message using sdhci */
+    ret = sdhci_read_cmd(qts, NPCM7XX_MMC_BA, rmsg, len);
+    g_assert(ret == len);
+    g_assert(!memcmp(rmsg, msg, len));
+
+    g_free(rmsg);
+}
+
+/*
+ * Check that the MMC controller can read data from the SD card: two
+ * different messages are placed in the backing file one after the other,
+ * and each must be read back unchanged through the controller.
+ */
+static void test_read_sd(void)
+{
+    QTestState *qts = setup_sd_card();
+
+    write_sdread(qts, "hello world");
+    write_sdread(qts, "goodbye");
+
+    qtest_quit(qts);
+}
+
+/*
+ * Write @msg (without its NUL terminator) to the card through the SDHCI
+ * controller, then read the same number of bytes directly from the start
+ * of the backing image file and assert that both copies match.
+ *
+ * @qts: running QEMU instance, as returned by setup_sd_card()
+ * @msg: NUL-terminated string to store on the card
+ */
+static void sdwrite_read(QTestState *qts, const char *msg)
+{
+    int fd, ret;
+    size_t len = strlen(msg);
+    char *rmsg = g_malloc(len);
+
+    /* write message using sdhci */
+    sdhci_write_cmd(qts, NPCM7XX_MMC_BA, msg, len, NPCM7XX_BLK_SIZE);
+
+    /* read message from sd */
+    fd = open(sd_path, O_RDONLY);
+    g_assert(fd >= 0);
+    ret = read(fd, rmsg, len);
+    close(fd);
+    g_assert(ret == len);
+
+    g_assert(!memcmp(rmsg, msg, len));
+
+    g_free(rmsg);
+}
+
+/*
+ * Check that the MMC controller can write data to the SD card: two
+ * different messages are written through the controller one after the
+ * other, and each must then be found unchanged in the backing file.
+ */
+static void test_write_sd(void)
+{
+    QTestState *qts = setup_sd_card();
+
+    sdwrite_read(qts, "hello world");
+    sdwrite_read(qts, "goodbye");
+
+    qtest_quit(qts);
+}
+
+/*
+ * Check SDHCI has correct default values.
+ *
+ * Walks the register window [NPCM7XX_MMC_BA, NPCM7XX_MMC_BA +
+ * NPCM7XX_REG_SIZE) on a freshly started kudo-bmc machine (no SD card
+ * attached).  Registers with a dedicated reset value are read at the
+ * access width used below and compared against that value; every other
+ * byte in the window is expected to read as zero.
+ */
+static void test_reset(void)
+{
+    QTestState *qts = qtest_init("-machine kudo-bmc");
+    uint64_t addr = NPCM7XX_MMC_BA;
+    uint64_t end_addr = addr + NPCM7XX_REG_SIZE;
+    /*
+     * Expected 16-bit values for consecutive NPCM7XX_PRSTVALS slots.
+     * NOTE(review): assumes NPCM7XX_PRSTVALS_SIZE is at most 6, the number
+     * of entries listed here -- confirm against hw/sd/npcm7xx_sdhci.h.
+     */
+    uint16_t prstvals_resets[] = {NPCM7XX_PRSTVALS_0_RESET,
+                                  NPCM7XX_PRSTVALS_1_RESET,
+                                  0,
+                                  NPCM7XX_PRSTVALS_3_RESET,
+                                  0,
+                                  0};
+    int i;
+    uint32_t mask;
+
+    /* Each case advances addr by the width of the register it checked. */
+    while (addr < end_addr) {
+        switch (addr - NPCM7XX_MMC_BA) {
+        case SDHC_PRNSTS:
+            /*
+             * ignores bits 20 to 24: they are changed when reading registers
+             * (the mask is OR'ed into both sides of the comparison)
+             */
+            mask = 0x1f00000;
+            g_assert_cmphex(qtest_readl(qts, addr) | mask, ==,
+                            NPCM7XX_PRSNTS_RESET | mask);
+            addr += 4;
+            break;
+        case SDHC_BLKGAP:
+            g_assert_cmphex(qtest_readb(qts, addr), ==, NPCM7XX_BLKGAP_RESET);
+            addr += 1;
+            break;
+        case SDHC_CAPAB:
+            g_assert_cmphex(qtest_readq(qts, addr), ==, NPCM7XX_CAPAB_RESET);
+            addr += 8;
+            break;
+        case SDHC_MAXCURR:
+            g_assert_cmphex(qtest_readq(qts, addr), ==, NPCM7XX_MAXCURR_RESET);
+            addr += 8;
+            break;
+        case SDHC_HCVER:
+            g_assert_cmphex(qtest_readw(qts, addr), ==, NPCM7XX_HCVER_RESET);
+            addr += 2;
+            break;
+        case NPCM7XX_PRSTVALS:
+            /* Array of 16-bit registers, checked slot by slot. */
+            for (i = 0; i < NPCM7XX_PRSTVALS_SIZE; ++i) {
+                g_assert_cmphex(qtest_readw(qts, addr + 2 * i), ==,
+                                prstvals_resets[i]);
+            }
+            addr += NPCM7XX_PRSTVALS_SIZE * 2;
+            break;
+        default:
+            /* Anything without a dedicated reset value must read as zero. */
+            g_assert_cmphex(qtest_readb(qts, addr), ==, 0);
+            addr += 1;
+        }
+    }
+
+    qtest_quit(qts);
+}
+
+/* Delete the temporary SD card image and free the string holding its path. */
+static void drive_destroy(void)
+{
+    unlink(sd_path);
+    g_free(sd_path);
+}
+
+/*
+ * Create the temporary raw image that backs the emulated SD card and
+ * extend it to NPCM7XX_TEST_IMAGE_SIZE bytes.  The path of the new file
+ * is stored in sd_path; drive_destroy() removes the file again.
+ *
+ * Any failure aborts the test program.
+ */
+static void drive_create(void)
+{
+    int fd, ret;
+    GError *error = NULL;
+
+    /* Create a temporary raw image */
+    fd = g_file_open_tmp("sdhci_XXXXXX", &sd_path, &error);
+    if (fd == -1) {
+        fprintf(stderr, "unable to create sdhci file: %s\n", error->message);
+        g_error_free(error);
+    }
+    /*
+     * Stop right here on failure instead of relying on sd_path having been
+     * left untouched, so that an invalid fd never reaches ftruncate().
+     */
+    g_assert(fd >= 0);
+    g_assert(sd_path != NULL);
+
+    ret = ftruncate(fd, NPCM7XX_TEST_IMAGE_SIZE);
+    g_assert_cmpint(ret, ==, 0);
+    g_message("%s", sd_path);
+    close(fd);
+}
+
+/*
+ * Test entry point: create the backing image, register the three SDHCI
+ * test cases, run them, then remove the image again.  Returns the value
+ * reported by g_test_run().
+ */
+int main(int argc, char **argv)
+{
+    int ret;
+
+    /* The image must exist before any test starts QEMU with it. */
+    drive_create();
+
+    g_test_init(&argc, &argv, NULL);
+
+    qtest_add_func("npcm7xx_sdhci/reset", test_reset);
+    qtest_add_func("npcm7xx_sdhci/write_sd", test_write_sd);
+    qtest_add_func("npcm7xx_sdhci/read_sd", test_read_sd);
+
+    ret = g_test_run();
+    drive_destroy();
+    return ret;
+}
diff --git a/tests/qtest/meson.build b/tests/qtest/meson.build
index XXXXXXX..XXXXXXX 100644
--- a/tests/qtest/meson.build
+++ b/tests/qtest/meson.build
@@ -XXX,XX +XXX,XX @@ qtests_npcm7xx = \
    'npcm7xx_gpio-test',
    'npcm7xx_pwm-test',
    'npcm7xx_rng-test',
+   'npcm7xx_sdhci-test',
    'npcm7xx_smbus-test',
    'npcm7xx_timer-test',
    'npcm7xx_watchdog_timer-test'] + \
-- 
2.25.1