1 | The following changes since commit 5a67d7735d4162630769ef495cf813244fc850df: | 1 | The following changes since commit eae587e8e3694b1aceab23239493fb4c7e1a80f5: |
---|---|---|---|
2 | 2 | ||
3 | Merge remote-tracking branch 'remotes/berrange-gitlab/tags/tls-deps-pull-request' into staging (2021-07-02 08:22:39 +0100) | 3 | Merge remote-tracking branch 'remotes/armbru/tags/pull-qapi-2021-09-13' into staging (2021-09-13 11:00:30 +0100) |
4 | 4 | ||
5 | are available in the Git repository at: | 5 | are available in the Git repository at: |
6 | 6 | ||
7 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20210702 | 7 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20210913 |
8 | 8 | ||
9 | for you to fetch changes up to 04ea4d3cfd0a21b248ece8eb7a9436a3d9898dd8: | 9 | for you to fetch changes up to 9a2b2ecf4d25a3943918c95d2db4508b304161b5: |
10 | 10 | ||
11 | target/arm: Implement MVE shifts by register (2021-07-02 11:48:38 +0100) | 11 | hw/arm/mps2.c: Mark internal-only I2C buses as 'full' (2021-09-13 17:09:28 +0100) |
12 | 12 | ||
13 | ---------------------------------------------------------------- | 13 | ---------------------------------------------------------------- |
14 | target-arm queue: | 14 | target-arm queue: |
15 | * more MVE instructions | 15 | * mark MPS2/MPS3 board-internal i2c buses as 'full' so that command |
16 | * hw/gpio/gpio_pwr: use shutdown function for reboot | 16 | line user-created devices are not plugged into them |
17 | * target/arm: Check NaN mode before silencing NaN | 17 | * Take an exception if PSTATE.IL is set |
18 | * tests: Boot and halt a Linux guest on the Raspberry Pi 2 machine | 18 | * Support an emulated ITS in the virt board |
19 | * hw/arm: Add basic power management to raspi. | 19 | * Add support for kudo-bmc board |
20 | * docs/system/arm: Add quanta-gbs-bmc, quanta-q7l1-bmc | 20 | * Probe for KVM_CAP_ARM_VM_IPA_SIZE when creating scratch VM |
21 | * cadence_uart: Fix clock handling issues that prevented | ||
22 | u-boot from running | ||
21 | 23 | ||
22 | ---------------------------------------------------------------- | 24 | ---------------------------------------------------------------- |
23 | Joe Komlodi (1): | 25 | Bin Meng (6): |
24 | target/arm: Check NaN mode before silencing NaN | 26 | hw/misc: zynq_slcr: Correctly compute output clocks in the reset exit phase |
27 | hw/char: cadence_uart: Disable transmit when input clock is disabled | ||
28 | hw/char: cadence_uart: Move clock/reset check to uart_can_receive() | ||
29 | hw/char: cadence_uart: Convert to memop_with_attrs() ops | ||
30 | hw/char: cadence_uart: Ignore access when unclocked or in reset for uart_{read, write}() | ||
31 | hw/char: cadence_uart: Log a guest error when device is unclocked or in reset | ||
25 | 32 | ||
26 | Maxim Uvarov (1): | 33 | Chris Rauer (1): |
27 | hw/gpio/gpio_pwr: use shutdown function for reboot | 34 | hw/arm: Add support for kudo-bmc board. |
28 | 35 | ||
29 | Nolan Leake (1): | 36 | Marc Zyngier (1): |
30 | hw/arm: Add basic power management to raspi. | 37 | hw/arm/virt: KVM: Probe for KVM_CAP_ARM_VM_IPA_SIZE when creating scratch VM |
31 | 38 | ||
32 | Patrick Venture (2): | 39 | Peter Maydell (5): |
33 | docs/system/arm: Add quanta-q7l1-bmc reference | 40 | target/arm: Take an exception if PSTATE.IL is set |
34 | docs/system/arm: Add quanta-gbs-bmc reference | 41 | qdev: Support marking individual buses as 'full' |
42 | hw/arm/mps2-tz.c: Add extra data parameter to MakeDevFn | ||
43 | hw/arm/mps2-tz.c: Mark internal-only I2C buses as 'full' | ||
44 | hw/arm/mps2.c: Mark internal-only I2C buses as 'full' | ||
35 | 45 | ||
36 | Peter Maydell (18): | 46 | Richard Henderson (1): |
37 | target/arm: Fix MVE widening/narrowing VLDR/VSTR offset calculation | 47 | target/arm: Merge disas_a64_insn into aarch64_tr_translate_insn |
38 | target/arm: Fix bugs in MVE VRMLALDAVH, VRMLSLDAVH | ||
39 | target/arm: Make asimd_imm_const() public | ||
40 | target/arm: Use asimd_imm_const for A64 decode | ||
41 | target/arm: Use dup_const() instead of bitfield_replicate() | ||
42 | target/arm: Implement MVE logical immediate insns | ||
43 | target/arm: Implement MVE vector shift left by immediate insns | ||
44 | target/arm: Implement MVE vector shift right by immediate insns | ||
45 | target/arm: Implement MVE VSHLL | ||
46 | target/arm: Implement MVE VSRI, VSLI | ||
47 | target/arm: Implement MVE VSHRN, VRSHRN | ||
48 | target/arm: Implement MVE saturating narrowing shifts | ||
49 | target/arm: Implement MVE VSHLC | ||
50 | target/arm: Implement MVE VADDLV | ||
51 | target/arm: Implement MVE long shifts by immediate | ||
52 | target/arm: Implement MVE long shifts by register | ||
53 | target/arm: Implement MVE shifts by immediate | ||
54 | target/arm: Implement MVE shifts by register | ||
55 | 48 | ||
56 | Philippe Mathieu-Daudé (1): | 49 | Shashi Mallela (9): |
57 | tests: Boot and halt a Linux guest on the Raspberry Pi 2 machine | 50 | hw/intc: GICv3 ITS initial framework |
51 | hw/intc: GICv3 ITS register definitions added | ||
52 | hw/intc: GICv3 ITS command queue framework | ||
53 | hw/intc: GICv3 ITS Command processing | ||
54 | hw/intc: GICv3 ITS Feature enablement | ||
55 | hw/intc: GICv3 redistributor ITS processing | ||
56 | tests/data/acpi/virt: Add IORT files for ITS | ||
57 | hw/arm/virt: add ITS support in virt GIC | ||
58 | tests/data/acpi/virt: Update IORT files for ITS | ||
58 | 59 | ||
59 | docs/system/arm/aspeed.rst | 1 + | 60 | docs/system/arm/nuvoton.rst | 1 + |
60 | docs/system/arm/nuvoton.rst | 5 +- | 61 | hw/intc/gicv3_internal.h | 188 ++++- |
61 | include/hw/arm/bcm2835_peripherals.h | 3 +- | 62 | include/hw/arm/virt.h | 2 + |
62 | include/hw/misc/bcm2835_powermgt.h | 29 ++ | 63 | include/hw/intc/arm_gicv3_common.h | 13 + |
63 | target/arm/helper-mve.h | 108 +++++++ | 64 | include/hw/intc/arm_gicv3_its_common.h | 32 +- |
64 | target/arm/translate.h | 41 +++ | 65 | include/hw/qdev-core.h | 24 + |
65 | target/arm/mve.decode | 177 ++++++++++- | 66 | target/arm/cpu.h | 1 + |
66 | target/arm/t32.decode | 71 ++++- | 67 | target/arm/kvm_arm.h | 4 +- |
67 | hw/arm/bcm2835_peripherals.c | 13 +- | 68 | target/arm/syndrome.h | 5 + |
68 | hw/gpio/gpio_pwr.c | 2 +- | 69 | target/arm/translate.h | 2 + |
69 | hw/misc/bcm2835_powermgt.c | 160 ++++++++++ | 70 | hw/arm/mps2-tz.c | 92 ++- |
70 | target/arm/helper-a64.c | 12 +- | 71 | hw/arm/mps2.c | 12 +- |
71 | target/arm/mve_helper.c | 524 +++++++++++++++++++++++++++++++-- | 72 | hw/arm/npcm7xx_boards.c | 34 + |
72 | target/arm/translate-a64.c | 86 +----- | 73 | hw/arm/virt.c | 29 +- |
73 | target/arm/translate-mve.c | 261 +++++++++++++++- | 74 | hw/char/cadence_uart.c | 61 +- |
74 | target/arm/translate-neon.c | 81 ----- | 75 | hw/intc/arm_gicv3.c | 14 + |
75 | target/arm/translate.c | 327 +++++++++++++++++++- | 76 | hw/intc/arm_gicv3_common.c | 13 + |
76 | target/arm/vfp_helper.c | 24 +- | 77 | hw/intc/arm_gicv3_cpuif.c | 7 +- |
77 | hw/misc/meson.build | 1 + | 78 | hw/intc/arm_gicv3_dist.c | 5 +- |
78 | tests/acceptance/boot_linux_console.py | 43 +++ | 79 | hw/intc/arm_gicv3_its.c | 1322 ++++++++++++++++++++++++++++++++ |
79 | 20 files changed, 1760 insertions(+), 209 deletions(-) | 80 | hw/intc/arm_gicv3_its_common.c | 7 +- |
80 | create mode 100644 include/hw/misc/bcm2835_powermgt.h | 81 | hw/intc/arm_gicv3_its_kvm.c | 2 +- |
81 | create mode 100644 hw/misc/bcm2835_powermgt.c | 82 | hw/intc/arm_gicv3_redist.c | 153 +++- |
83 | hw/misc/zynq_slcr.c | 31 +- | ||
84 | softmmu/qdev-monitor.c | 7 +- | ||
85 | target/arm/helper-a64.c | 1 + | ||
86 | target/arm/helper.c | 8 + | ||
87 | target/arm/kvm.c | 7 +- | ||
88 | target/arm/translate-a64.c | 255 +++--- | ||
89 | target/arm/translate.c | 21 + | ||
90 | hw/intc/meson.build | 1 + | ||
91 | tests/data/acpi/virt/IORT | Bin 0 -> 124 bytes | ||
92 | tests/data/acpi/virt/IORT.memhp | Bin 0 -> 124 bytes | ||
93 | tests/data/acpi/virt/IORT.numamem | Bin 0 -> 124 bytes | ||
94 | tests/data/acpi/virt/IORT.pxb | Bin 0 -> 124 bytes | ||
95 | 35 files changed, 2144 insertions(+), 210 deletions(-) | ||
96 | create mode 100644 hw/intc/arm_gicv3_its.c | ||
97 | create mode 100644 tests/data/acpi/virt/IORT | ||
98 | create mode 100644 tests/data/acpi/virt/IORT.memhp | ||
99 | create mode 100644 tests/data/acpi/virt/IORT.numamem | ||
100 | create mode 100644 tests/data/acpi/virt/IORT.pxb | ||
82 | 101 | diff view generated by jsdifflib |
1 | The MVE extension to v8.1M includes some new shift instructions which | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | sit entirely within the non-coprocessor part of the encoding space | ||
3 | and which operate only on general-purpose registers. They take up | ||
4 | the space which was previously UNPREDICTABLE MOVS and ORRS encodings | ||
5 | with Rm == 13 or 15. | ||
6 | 2 | ||
7 | Implement the long shifts by immediate, which perform shifts on a | 3 | As of today, when booting upstream U-Boot for Xilinx Zynq, the UART |
8 | pair of general-purpose registers treated as a 64-bit quantity, with | 4 | does not receive anything. Debugging shows that the UART input clock |
9 | an immediate shift count between 1 and 32. | 5 | frequency is zero which prevents the UART from receiving anything as |
6 | per the logic in uart_receive(). | ||
10 | 7 | ||
11 | Awkwardly, because the MOVS and ORRS trans functions do not UNDEF for | 8 | From zynq_slcr_reset_exit() comment, it intends to compute output |
12 | the Rm==13,15 case, we need to explicitly emit code to UNDEF for the | 9 | clocks according to ps_clk and registers. zynq_slcr_compute_clocks() |
13 | cases where v8.1M now requires that. (Trying to change MOVS and ORRS | 10 | is called to accomplish the task, inside which device_is_in_reset() |
14 | is too difficult, because the functions that generate the code are | 11 | is called to actually make the attempt in vain. |
15 | shared between a dozen different kinds of arithmetic or logical | ||
16 | instruction for all A32, T16 and T32 encodings, and for some insns | ||
17 | and some encodings Rm==13,15 are valid.) | ||
18 | 12 | ||
19 | We make the helper functions we need for UQSHLL and SQSHLL take | 13 | Rework reset_hold() and reset_exit() so that in the reset exit phase, |
20 | a 32-bit value which the helper casts to int8_t because we'll need | 14 | the logic can really compute output clocks in reset_exit(). |
21 | these helpers also for the shift-by-register insns, where the shift | ||
22 | count might be < 0 or > 32. | ||
23 | 15 | ||
16 | With this change, upstream U-Boot boots properly again with: | ||
17 | |||
18 | $ qemu-system-arm -M xilinx-zynq-a9 -m 1G -display none -serial null -serial stdio \ | ||
19 | -device loader,file=u-boot-dtb.bin,addr=0x4000000,cpu-num=0 | ||
20 | |||
21 | Fixes: 38867cb7ec90 ("hw/misc/zynq_slcr: add clock generation for uarts") | ||
22 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> | ||
23 | Acked-by: Alistair Francis <alistair.francis@wdc.com> | ||
24 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
25 | Message-id: 20210901124521.30599-2-bmeng.cn@gmail.com | ||
24 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 26 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
25 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
26 | Message-id: 20210628135835.6690-16-peter.maydell@linaro.org | ||
27 | --- | 27 | --- |
28 | target/arm/helper-mve.h | 3 ++ | 28 | hw/misc/zynq_slcr.c | 31 ++++++++++++++++++------------- |
29 | target/arm/translate.h | 1 + | 29 | 1 file changed, 18 insertions(+), 13 deletions(-) |
30 | target/arm/t32.decode | 28 +++++++++++++ | ||
31 | target/arm/mve_helper.c | 10 +++++ | ||
32 | target/arm/translate.c | 90 +++++++++++++++++++++++++++++++++++++++++ | ||
33 | 5 files changed, 132 insertions(+) | ||
34 | 30 | ||
35 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 31 | diff --git a/hw/misc/zynq_slcr.c b/hw/misc/zynq_slcr.c |
36 | index XXXXXXX..XXXXXXX 100644 | 32 | index XXXXXXX..XXXXXXX 100644 |
37 | --- a/target/arm/helper-mve.h | 33 | --- a/hw/misc/zynq_slcr.c |
38 | +++ b/target/arm/helper-mve.h | 34 | +++ b/hw/misc/zynq_slcr.c |
39 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vqrshruntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 35 | @@ -XXX,XX +XXX,XX @@ static uint64_t zynq_slcr_compute_clock(const uint64_t periods[], |
40 | DEF_HELPER_FLAGS_4(mve_vqrshrunth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 36 | zynq_slcr_compute_clock((plls), (state)->regs[reg], \ |
41 | 37 | reg ## _ ## enable_field ## _SHIFT) | |
42 | DEF_HELPER_FLAGS_4(mve_vshlc, TCG_CALL_NO_WG, i32, env, ptr, i32, i32) | 38 | |
39 | +static void zynq_slcr_compute_clocks_internal(ZynqSLCRState *s, uint64_t ps_clk) | ||
40 | +{ | ||
41 | + uint64_t io_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_IO_PLL_CTRL]); | ||
42 | + uint64_t arm_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_ARM_PLL_CTRL]); | ||
43 | + uint64_t ddr_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_DDR_PLL_CTRL]); | ||
43 | + | 44 | + |
44 | +DEF_HELPER_FLAGS_3(mve_sqshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | 45 | + uint64_t uart_mux[4] = {io_pll, io_pll, arm_pll, ddr_pll}; |
45 | +DEF_HELPER_FLAGS_3(mve_uqshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
46 | diff --git a/target/arm/translate.h b/target/arm/translate.h | ||
47 | index XXXXXXX..XXXXXXX 100644 | ||
48 | --- a/target/arm/translate.h | ||
49 | +++ b/target/arm/translate.h | ||
50 | @@ -XXX,XX +XXX,XX @@ typedef void CryptoTwoOpFn(TCGv_ptr, TCGv_ptr); | ||
51 | typedef void CryptoThreeOpIntFn(TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
52 | typedef void CryptoThreeOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr); | ||
53 | typedef void AtomicThreeOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGArg, MemOp); | ||
54 | +typedef void WideShiftImmFn(TCGv_i64, TCGv_i64, int64_t shift); | ||
55 | |||
56 | /** | ||
57 | * arm_tbflags_from_tb: | ||
58 | diff --git a/target/arm/t32.decode b/target/arm/t32.decode | ||
59 | index XXXXXXX..XXXXXXX 100644 | ||
60 | --- a/target/arm/t32.decode | ||
61 | +++ b/target/arm/t32.decode | ||
62 | @@ -XXX,XX +XXX,XX @@ | ||
63 | &mcr !extern cp opc1 crn crm opc2 rt | ||
64 | &mcrr !extern cp opc1 crm rt rt2 | ||
65 | |||
66 | +&mve_shl_ri rdalo rdahi shim | ||
67 | + | 46 | + |
68 | +# rdahi: bits [3:1] from insn, bit 0 is 1 | 47 | + /* compute uartX reference clocks */ |
69 | +# rdalo: bits [3:1] from insn, bit 0 is 0 | 48 | + clock_set(s->uart0_ref_clk, |
70 | +%rdahi_9 9:3 !function=times_2_plus_1 | 49 | + ZYNQ_COMPUTE_CLK(s, uart_mux, R_UART_CLK_CTRL, CLKACT0)); |
71 | +%rdalo_17 17:3 !function=times_2 | 50 | + clock_set(s->uart1_ref_clk, |
72 | + | 51 | + ZYNQ_COMPUTE_CLK(s, uart_mux, R_UART_CLK_CTRL, CLKACT1)); |
73 | # Data-processing (register) | ||
74 | |||
75 | %imm5_12_6 12:3 6:2 | ||
76 | @@ -XXX,XX +XXX,XX @@ | ||
77 | @S_xrr_shi ....... .... . rn:4 .... .... .. shty:2 rm:4 \ | ||
78 | &s_rrr_shi shim=%imm5_12_6 s=1 rd=0 | ||
79 | |||
80 | +@mve_shl_ri ....... .... . ... . . ... ... . .. .. .... \ | ||
81 | + &mve_shl_ri shim=%imm5_12_6 rdalo=%rdalo_17 rdahi=%rdahi_9 | ||
82 | + | ||
83 | { | ||
84 | TST_xrri 1110101 0000 1 .... 0 ... 1111 .... .... @S_xrr_shi | ||
85 | AND_rrri 1110101 0000 . .... 0 ... .... .... .... @s_rrr_shi | ||
86 | } | ||
87 | BIC_rrri 1110101 0001 . .... 0 ... .... .... .... @s_rrr_shi | ||
88 | { | ||
89 | + # The v8.1M MVE shift insns overlap in encoding with MOVS/ORRS | ||
90 | + # and are distinguished by having Rm==13 or 15. Those are UNPREDICTABLE | ||
91 | + # cases for MOVS/ORRS. We decode the MVE cases first, ensuring that | ||
92 | + # they explicitly call unallocated_encoding() for cases that must UNDEF | ||
93 | + # (eg "using a new shift insn on a v8.1M CPU without MVE"), and letting | ||
94 | + # the rest fall through (where ORR_rrri and MOV_rxri will end up | ||
95 | + # handling them as r13 and r15 accesses with the same semantics as A32). | ||
96 | + [ | ||
97 | + LSLL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
98 | + LSRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
99 | + ASRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 10 1111 @mve_shl_ri | ||
100 | + | ||
101 | + UQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
102 | + URSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
103 | + SRSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 10 1111 @mve_shl_ri | ||
104 | + SQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 11 1111 @mve_shl_ri | ||
105 | + ] | ||
106 | + | ||
107 | MOV_rxri 1110101 0010 . 1111 0 ... .... .... .... @s_rxr_shi | ||
108 | ORR_rrri 1110101 0010 . .... 0 ... .... .... .... @s_rrr_shi | ||
109 | } | ||
110 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
111 | index XXXXXXX..XXXXXXX 100644 | ||
112 | --- a/target/arm/mve_helper.c | ||
113 | +++ b/target/arm/mve_helper.c | ||
114 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(mve_vshlc)(CPUARMState *env, void *vd, uint32_t rdm, | ||
115 | mve_advance_vpt(env); | ||
116 | return rdm; | ||
117 | } | ||
118 | + | ||
119 | +uint64_t HELPER(mve_sqshll)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
120 | +{ | ||
121 | + return do_sqrshl_d(n, (int8_t)shift, false, &env->QF); | ||
122 | +} | 52 | +} |
123 | + | 53 | + |
124 | +uint64_t HELPER(mve_uqshll)(CPUARMState *env, uint64_t n, uint32_t shift) | 54 | /** |
125 | +{ | 55 | * Compute and set the ouputs clocks periods. |
126 | + return do_uqrshl_d(n, (int8_t)shift, false, &env->QF); | 56 | * But do not propagate them further. Connected clocks |
127 | +} | 57 | @@ -XXX,XX +XXX,XX @@ static void zynq_slcr_compute_clocks(ZynqSLCRState *s) |
128 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 58 | ps_clk = 0; |
129 | index XXXXXXX..XXXXXXX 100644 | 59 | } |
130 | --- a/target/arm/translate.c | 60 | |
131 | +++ b/target/arm/translate.c | 61 | - uint64_t io_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_IO_PLL_CTRL]); |
132 | @@ -XXX,XX +XXX,XX @@ static bool trans_MOVT(DisasContext *s, arg_MOVW *a) | 62 | - uint64_t arm_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_ARM_PLL_CTRL]); |
133 | return true; | 63 | - uint64_t ddr_pll = zynq_slcr_compute_pll(ps_clk, s->regs[R_DDR_PLL_CTRL]); |
64 | - | ||
65 | - uint64_t uart_mux[4] = {io_pll, io_pll, arm_pll, ddr_pll}; | ||
66 | - | ||
67 | - /* compute uartX reference clocks */ | ||
68 | - clock_set(s->uart0_ref_clk, | ||
69 | - ZYNQ_COMPUTE_CLK(s, uart_mux, R_UART_CLK_CTRL, CLKACT0)); | ||
70 | - clock_set(s->uart1_ref_clk, | ||
71 | - ZYNQ_COMPUTE_CLK(s, uart_mux, R_UART_CLK_CTRL, CLKACT1)); | ||
72 | + zynq_slcr_compute_clocks_internal(s, ps_clk); | ||
134 | } | 73 | } |
135 | 74 | ||
136 | +/* | 75 | /** |
137 | + * v8.1M MVE wide-shifts | 76 | @@ -XXX,XX +XXX,XX @@ static void zynq_slcr_reset_hold(Object *obj) |
138 | + */ | 77 | ZynqSLCRState *s = ZYNQ_SLCR(obj); |
139 | +static bool do_mve_shl_ri(DisasContext *s, arg_mve_shl_ri *a, | 78 | |
140 | + WideShiftImmFn *fn) | 79 | /* will disable all output clocks */ |
141 | +{ | 80 | - zynq_slcr_compute_clocks(s); |
142 | + TCGv_i64 rda; | 81 | + zynq_slcr_compute_clocks_internal(s, 0); |
143 | + TCGv_i32 rdalo, rdahi; | 82 | zynq_slcr_propagate_clocks(s); |
144 | + | 83 | } |
145 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_1M)) { | 84 | |
146 | + /* Decode falls through to ORR/MOV UNPREDICTABLE handling */ | 85 | @@ -XXX,XX +XXX,XX @@ static void zynq_slcr_reset_exit(Object *obj) |
147 | + return false; | 86 | ZynqSLCRState *s = ZYNQ_SLCR(obj); |
148 | + } | 87 | |
149 | + if (a->rdahi == 15) { | 88 | /* will compute output clocks according to ps_clk and registers */ |
150 | + /* These are a different encoding (SQSHL/SRSHR/UQSHL/URSHR) */ | 89 | - zynq_slcr_compute_clocks(s); |
151 | + return false; | 90 | + zynq_slcr_compute_clocks_internal(s, clock_get(s->ps_clk)); |
152 | + } | 91 | zynq_slcr_propagate_clocks(s); |
153 | + if (!dc_isar_feature(aa32_mve, s) || | 92 | } |
154 | + !arm_dc_feature(s, ARM_FEATURE_M_MAIN) || | 93 | |
155 | + a->rdahi == 13) { | ||
156 | + /* RdaHi == 13 is UNPREDICTABLE; we choose to UNDEF */ | ||
157 | + unallocated_encoding(s); | ||
158 | + return true; | ||
159 | + } | ||
160 | + | ||
161 | + if (a->shim == 0) { | ||
162 | + a->shim = 32; | ||
163 | + } | ||
164 | + | ||
165 | + rda = tcg_temp_new_i64(); | ||
166 | + rdalo = load_reg(s, a->rdalo); | ||
167 | + rdahi = load_reg(s, a->rdahi); | ||
168 | + tcg_gen_concat_i32_i64(rda, rdalo, rdahi); | ||
169 | + | ||
170 | + fn(rda, rda, a->shim); | ||
171 | + | ||
172 | + tcg_gen_extrl_i64_i32(rdalo, rda); | ||
173 | + tcg_gen_extrh_i64_i32(rdahi, rda); | ||
174 | + store_reg(s, a->rdalo, rdalo); | ||
175 | + store_reg(s, a->rdahi, rdahi); | ||
176 | + tcg_temp_free_i64(rda); | ||
177 | + | ||
178 | + return true; | ||
179 | +} | ||
180 | + | ||
181 | +static bool trans_ASRL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
182 | +{ | ||
183 | + return do_mve_shl_ri(s, a, tcg_gen_sari_i64); | ||
184 | +} | ||
185 | + | ||
186 | +static bool trans_LSLL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
187 | +{ | ||
188 | + return do_mve_shl_ri(s, a, tcg_gen_shli_i64); | ||
189 | +} | ||
190 | + | ||
191 | +static bool trans_LSRL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
192 | +{ | ||
193 | + return do_mve_shl_ri(s, a, tcg_gen_shri_i64); | ||
194 | +} | ||
195 | + | ||
196 | +static void gen_mve_sqshll(TCGv_i64 r, TCGv_i64 n, int64_t shift) | ||
197 | +{ | ||
198 | + gen_helper_mve_sqshll(r, cpu_env, n, tcg_constant_i32(shift)); | ||
199 | +} | ||
200 | + | ||
201 | +static bool trans_SQSHLL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
202 | +{ | ||
203 | + return do_mve_shl_ri(s, a, gen_mve_sqshll); | ||
204 | +} | ||
205 | + | ||
206 | +static void gen_mve_uqshll(TCGv_i64 r, TCGv_i64 n, int64_t shift) | ||
207 | +{ | ||
208 | + gen_helper_mve_uqshll(r, cpu_env, n, tcg_constant_i32(shift)); | ||
209 | +} | ||
210 | + | ||
211 | +static bool trans_UQSHLL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
212 | +{ | ||
213 | + return do_mve_shl_ri(s, a, gen_mve_uqshll); | ||
214 | +} | ||
215 | + | ||
216 | +static bool trans_SRSHRL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
217 | +{ | ||
218 | + return do_mve_shl_ri(s, a, gen_srshr64_i64); | ||
219 | +} | ||
220 | + | ||
221 | +static bool trans_URSHRL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
222 | +{ | ||
223 | + return do_mve_shl_ri(s, a, gen_urshr64_i64); | ||
224 | +} | ||
225 | + | ||
226 | /* | ||
227 | * Multiply and multiply accumulate | ||
228 | */ | ||
229 | -- | 94 | -- |
230 | 2.20.1 | 95 | 2.20.1 |
231 | 96 | ||
232 | 97 | diff view generated by jsdifflib |
1 | Implement the MVE VADDLV insn; this is similar to VADDV, except | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | that it accumulates 32-bit elements into a 64-bit accumulator | ||
3 | stored in a pair of general-purpose registers. | ||
4 | 2 | ||
3 | At present when input clock is disabled, any character transmitted | ||
4 | to tx fifo can still show on the serial line, which is wrong. | ||
5 | |||
6 | Fixes: b636db306e06 ("hw/char/cadence_uart: add clock support") | ||
7 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> | ||
8 | Reviewed-by: Alistair Francis <alistair.francis@wdc.com> | ||
9 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
10 | Message-id: 20210901124521.30599-3-bmeng.cn@gmail.com | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20210628135835.6690-15-peter.maydell@linaro.org | ||
8 | --- | 12 | --- |
9 | target/arm/helper-mve.h | 3 ++ | 13 | hw/char/cadence_uart.c | 5 +++++ |
10 | target/arm/mve.decode | 6 +++- | 14 | 1 file changed, 5 insertions(+) |
11 | target/arm/mve_helper.c | 19 ++++++++++++ | ||
12 | target/arm/translate-mve.c | 63 ++++++++++++++++++++++++++++++++++++++ | ||
13 | 4 files changed, 90 insertions(+), 1 deletion(-) | ||
14 | 15 | ||
15 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 16 | diff --git a/hw/char/cadence_uart.c b/hw/char/cadence_uart.c |
16 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-mve.h | 18 | --- a/hw/char/cadence_uart.c |
18 | +++ b/target/arm/helper-mve.h | 19 | +++ b/hw/char/cadence_uart.c |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_vaddvuh, TCG_CALL_NO_WG, i32, env, ptr, i32) | 20 | @@ -XXX,XX +XXX,XX @@ static gboolean cadence_uart_xmit(void *do_not_use, GIOCondition cond, |
20 | DEF_HELPER_FLAGS_3(mve_vaddvsw, TCG_CALL_NO_WG, i32, env, ptr, i32) | 21 | static void uart_write_tx_fifo(CadenceUARTState *s, const uint8_t *buf, |
21 | DEF_HELPER_FLAGS_3(mve_vaddvuw, TCG_CALL_NO_WG, i32, env, ptr, i32) | 22 | int size) |
22 | 23 | { | |
23 | +DEF_HELPER_FLAGS_3(mve_vaddlv_s, TCG_CALL_NO_WG, i64, env, ptr, i64) | 24 | + /* ignore characters when unclocked or in reset */ |
24 | +DEF_HELPER_FLAGS_3(mve_vaddlv_u, TCG_CALL_NO_WG, i64, env, ptr, i64) | 25 | + if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
25 | + | 26 | + return; |
26 | DEF_HELPER_FLAGS_3(mve_vmovi, TCG_CALL_NO_WG, void, env, ptr, i64) | ||
27 | DEF_HELPER_FLAGS_3(mve_vandi, TCG_CALL_NO_WG, void, env, ptr, i64) | ||
28 | DEF_HELPER_FLAGS_3(mve_vorri, TCG_CALL_NO_WG, void, env, ptr, i64) | ||
29 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/mve.decode | ||
32 | +++ b/target/arm/mve.decode | ||
33 | @@ -XXX,XX +XXX,XX @@ VQDMULH_scalar 1110 1110 0 . .. ... 1 ... 0 1110 . 110 .... @2scalar | ||
34 | VQRDMULH_scalar 1111 1110 0 . .. ... 1 ... 0 1110 . 110 .... @2scalar | ||
35 | |||
36 | # Vector add across vector | ||
37 | -VADDV 111 u:1 1110 1111 size:2 01 ... 0 1111 0 0 a:1 0 qm:3 0 rda=%rdalo | ||
38 | +{ | ||
39 | + VADDV 111 u:1 1110 1111 size:2 01 ... 0 1111 0 0 a:1 0 qm:3 0 rda=%rdalo | ||
40 | + VADDLV 111 u:1 1110 1 ... 1001 ... 0 1111 00 a:1 0 qm:3 0 \ | ||
41 | + rdahi=%rdahi rdalo=%rdalo | ||
42 | +} | ||
43 | |||
44 | # Predicate operations | ||
45 | %mask_22_13 22:1 13:3 | ||
46 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
47 | index XXXXXXX..XXXXXXX 100644 | ||
48 | --- a/target/arm/mve_helper.c | ||
49 | +++ b/target/arm/mve_helper.c | ||
50 | @@ -XXX,XX +XXX,XX @@ DO_VADDV(vaddvub, 1, uint8_t) | ||
51 | DO_VADDV(vaddvuh, 2, uint16_t) | ||
52 | DO_VADDV(vaddvuw, 4, uint32_t) | ||
53 | |||
54 | +#define DO_VADDLV(OP, TYPE, LTYPE) \ | ||
55 | + uint64_t HELPER(glue(mve_, OP))(CPUARMState *env, void *vm, \ | ||
56 | + uint64_t ra) \ | ||
57 | + { \ | ||
58 | + uint16_t mask = mve_element_mask(env); \ | ||
59 | + unsigned e; \ | ||
60 | + TYPE *m = vm; \ | ||
61 | + for (e = 0; e < 16 / 4; e++, mask >>= 4) { \ | ||
62 | + if (mask & 1) { \ | ||
63 | + ra += (LTYPE)m[H4(e)]; \ | ||
64 | + } \ | ||
65 | + } \ | ||
66 | + mve_advance_vpt(env); \ | ||
67 | + return ra; \ | ||
68 | + } \ | ||
69 | + | ||
70 | +DO_VADDLV(vaddlv_s, int32_t, int64_t) | ||
71 | +DO_VADDLV(vaddlv_u, uint32_t, uint64_t) | ||
72 | + | ||
73 | /* Shifts by immediate */ | ||
74 | #define DO_2SHIFT(OP, ESIZE, TYPE, FN) \ | ||
75 | void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
76 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
77 | index XXXXXXX..XXXXXXX 100644 | ||
78 | --- a/target/arm/translate-mve.c | ||
79 | +++ b/target/arm/translate-mve.c | ||
80 | @@ -XXX,XX +XXX,XX @@ static bool trans_VADDV(DisasContext *s, arg_VADDV *a) | ||
81 | return true; | ||
82 | } | ||
83 | |||
84 | +static bool trans_VADDLV(DisasContext *s, arg_VADDLV *a) | ||
85 | +{ | ||
86 | + /* | ||
87 | + * Vector Add Long Across Vector: accumulate the 32-bit | ||
88 | + * elements of the vector into a 64-bit result stored in | ||
89 | + * a pair of general-purpose registers. | ||
90 | + * No need to check Qm's bank: it is only 3 bits in decode. | ||
91 | + */ | ||
92 | + TCGv_ptr qm; | ||
93 | + TCGv_i64 rda; | ||
94 | + TCGv_i32 rdalo, rdahi; | ||
95 | + | ||
96 | + if (!dc_isar_feature(aa32_mve, s)) { | ||
97 | + return false; | ||
98 | + } | ||
99 | + /* | ||
100 | + * rdahi == 13 is UNPREDICTABLE; rdahi == 15 is a related | ||
101 | + * encoding; rdalo always has bit 0 clear so cannot be 13 or 15. | ||
102 | + */ | ||
103 | + if (a->rdahi == 13 || a->rdahi == 15) { | ||
104 | + return false; | ||
105 | + } | ||
106 | + if (!mve_eci_check(s) || !vfp_access_check(s)) { | ||
107 | + return true; | ||
108 | + } | 27 | + } |
109 | + | 28 | + |
110 | + /* | 29 | if ((s->r[R_CR] & UART_CR_TX_DIS) || !(s->r[R_CR] & UART_CR_TX_EN)) { |
111 | + * This insn is subject to beat-wise execution. Partial execution | 30 | return; |
112 | + * of an A=0 (no-accumulate) insn which does not execute the first | 31 | } |
113 | + * beat must start with the current value of RdaHi:RdaLo, not zero. | ||
114 | + */ | ||
115 | + if (a->a || mve_skip_first_beat(s)) { | ||
116 | + /* Accumulate input from RdaHi:RdaLo */ | ||
117 | + rda = tcg_temp_new_i64(); | ||
118 | + rdalo = load_reg(s, a->rdalo); | ||
119 | + rdahi = load_reg(s, a->rdahi); | ||
120 | + tcg_gen_concat_i32_i64(rda, rdalo, rdahi); | ||
121 | + tcg_temp_free_i32(rdalo); | ||
122 | + tcg_temp_free_i32(rdahi); | ||
123 | + } else { | ||
124 | + /* Accumulate starting at zero */ | ||
125 | + rda = tcg_const_i64(0); | ||
126 | + } | ||
127 | + | ||
128 | + qm = mve_qreg_ptr(a->qm); | ||
129 | + if (a->u) { | ||
130 | + gen_helper_mve_vaddlv_u(rda, cpu_env, qm, rda); | ||
131 | + } else { | ||
132 | + gen_helper_mve_vaddlv_s(rda, cpu_env, qm, rda); | ||
133 | + } | ||
134 | + tcg_temp_free_ptr(qm); | ||
135 | + | ||
136 | + rdalo = tcg_temp_new_i32(); | ||
137 | + rdahi = tcg_temp_new_i32(); | ||
138 | + tcg_gen_extrl_i64_i32(rdalo, rda); | ||
139 | + tcg_gen_extrh_i64_i32(rdahi, rda); | ||
140 | + store_reg(s, a->rdalo, rdalo); | ||
141 | + store_reg(s, a->rdahi, rdahi); | ||
142 | + tcg_temp_free_i64(rda); | ||
143 | + mve_update_eci(s); | ||
144 | + return true; | ||
145 | +} | ||
146 | + | ||
147 | static bool do_1imm(DisasContext *s, arg_1imm *a, MVEGenOneOpImmFn *fn) | ||
148 | { | ||
149 | TCGv_ptr qd; | ||
150 | -- | 32 | -- |
151 | 2.20.1 | 33 | 2.20.1 |
152 | 34 | ||
153 | 35 | diff view generated by jsdifflib |
1 | Implement the MVE long shifts by register, which perform shifts on a | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | pair of general-purpose registers treated as a 64-bit quantity, with | ||
3 | the shift count in another general-purpose register, which might be | ||
4 | either positive or negative. | ||
5 | 2 | ||
6 | Like the long-shifts-by-immediate, these encodings sit in the space | 3 | Currently the clock/reset check is done in uart_receive(), but we |
7 | that was previously the UNPREDICTABLE MOVS/ORRS with Rm==13,15. | 4 | can move the check to uart_can_receive() which is earlier. |
8 | Because LSLL_rr and ASRL_rr overlap with both MOV_rxri/ORR_rrri and | ||
9 | also with CSEL (as one of the previously-UNPREDICTABLE Rm==13 cases), | ||
10 | we have to move the CSEL pattern into the same decodetree group. | ||
11 | 5 | ||
6 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> | ||
7 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
8 | Reviewed-by: Alistair Francis <alistair.francis@wdc.com> | ||
9 | Message-id: 20210901124521.30599-4-bmeng.cn@gmail.com | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
13 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
14 | Message-id: 20210628135835.6690-17-peter.maydell@linaro.org | ||
15 | --- | 11 | --- |
16 | target/arm/helper-mve.h | 6 +++ | 12 | hw/char/cadence_uart.c | 17 ++++++++++------- |
17 | target/arm/translate.h | 1 + | 13 | 1 file changed, 10 insertions(+), 7 deletions(-) |
18 | target/arm/t32.decode | 16 +++++-- | ||
19 | target/arm/mve_helper.c | 93 +++++++++++++++++++++++++++++++++++++++++ | ||
20 | target/arm/translate.c | 69 ++++++++++++++++++++++++++++++ | ||
21 | 5 files changed, 182 insertions(+), 3 deletions(-) | ||
22 | 14 | ||
23 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 15 | diff --git a/hw/char/cadence_uart.c b/hw/char/cadence_uart.c |
24 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
25 | --- a/target/arm/helper-mve.h | 17 | --- a/hw/char/cadence_uart.c |
26 | +++ b/target/arm/helper-mve.h | 18 | +++ b/hw/char/cadence_uart.c |
27 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vqrshrunth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 19 | @@ -XXX,XX +XXX,XX @@ static void uart_parameters_setup(CadenceUARTState *s) |
28 | 20 | static int uart_can_receive(void *opaque) | |
29 | DEF_HELPER_FLAGS_4(mve_vshlc, TCG_CALL_NO_WG, i32, env, ptr, i32, i32) | ||
30 | |||
31 | +DEF_HELPER_FLAGS_3(mve_sshrl, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
32 | +DEF_HELPER_FLAGS_3(mve_ushll, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
33 | DEF_HELPER_FLAGS_3(mve_sqshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
34 | DEF_HELPER_FLAGS_3(mve_uqshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
35 | +DEF_HELPER_FLAGS_3(mve_sqrshrl, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
36 | +DEF_HELPER_FLAGS_3(mve_uqrshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
37 | +DEF_HELPER_FLAGS_3(mve_sqrshrl48, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
38 | +DEF_HELPER_FLAGS_3(mve_uqrshll48, TCG_CALL_NO_RWG, i64, env, i64, i32) | ||
39 | diff --git a/target/arm/translate.h b/target/arm/translate.h | ||
40 | index XXXXXXX..XXXXXXX 100644 | ||
41 | --- a/target/arm/translate.h | ||
42 | +++ b/target/arm/translate.h | ||
43 | @@ -XXX,XX +XXX,XX @@ typedef void CryptoThreeOpIntFn(TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
44 | typedef void CryptoThreeOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr); | ||
45 | typedef void AtomicThreeOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGArg, MemOp); | ||
46 | typedef void WideShiftImmFn(TCGv_i64, TCGv_i64, int64_t shift); | ||
47 | +typedef void WideShiftFn(TCGv_i64, TCGv_ptr, TCGv_i64, TCGv_i32); | ||
48 | |||
49 | /** | ||
50 | * arm_tbflags_from_tb: | ||
51 | diff --git a/target/arm/t32.decode b/target/arm/t32.decode | ||
52 | index XXXXXXX..XXXXXXX 100644 | ||
53 | --- a/target/arm/t32.decode | ||
54 | +++ b/target/arm/t32.decode | ||
55 | @@ -XXX,XX +XXX,XX @@ | ||
56 | &mcrr !extern cp opc1 crm rt rt2 | ||
57 | |||
58 | &mve_shl_ri rdalo rdahi shim | ||
59 | +&mve_shl_rr rdalo rdahi rm | ||
60 | |||
61 | # rdahi: bits [3:1] from insn, bit 0 is 1 | ||
62 | # rdalo: bits [3:1] from insn, bit 0 is 0 | ||
63 | @@ -XXX,XX +XXX,XX @@ | ||
64 | |||
65 | @mve_shl_ri ....... .... . ... . . ... ... . .. .. .... \ | ||
66 | &mve_shl_ri shim=%imm5_12_6 rdalo=%rdalo_17 rdahi=%rdahi_9 | ||
67 | +@mve_shl_rr ....... .... . ... . rm:4 ... . .. .. .... \ | ||
68 | + &mve_shl_rr rdalo=%rdalo_17 rdahi=%rdahi_9 | ||
69 | |||
70 | { | 21 | { |
71 | TST_xrri 1110101 0000 1 .... 0 ... 1111 .... .... @S_xrr_shi | 22 | CadenceUARTState *s = opaque; |
72 | @@ -XXX,XX +XXX,XX @@ BIC_rrri 1110101 0001 . .... 0 ... .... .... .... @s_rrr_shi | 23 | - int ret = MAX(CADENCE_UART_RX_FIFO_SIZE, CADENCE_UART_TX_FIFO_SIZE); |
73 | URSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 01 1111 @mve_shl_ri | 24 | - uint32_t ch_mode = s->r[R_MR] & UART_MR_CHMODE; |
74 | SRSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 10 1111 @mve_shl_ri | 25 | + int ret; |
75 | SQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 11 1111 @mve_shl_ri | 26 | + uint32_t ch_mode; |
76 | + | 27 | + |
77 | + LSLL_rr 1110101 0010 1 ... 0 .... ... 1 0000 1101 @mve_shl_rr | 28 | + /* ignore characters when unclocked or in reset */ |
78 | + ASRL_rr 1110101 0010 1 ... 0 .... ... 1 0010 1101 @mve_shl_rr | 29 | + if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
79 | + UQRSHLL64_rr 1110101 0010 1 ... 1 .... ... 1 0000 1101 @mve_shl_rr | ||
80 | + SQRSHRL64_rr 1110101 0010 1 ... 1 .... ... 1 0010 1101 @mve_shl_rr | ||
81 | + UQRSHLL48_rr 1110101 0010 1 ... 1 .... ... 1 1000 1101 @mve_shl_rr | ||
82 | + SQRSHRL48_rr 1110101 0010 1 ... 1 .... ... 1 1010 1101 @mve_shl_rr | ||
83 | ] | ||
84 | |||
85 | MOV_rxri 1110101 0010 . 1111 0 ... .... .... .... @s_rxr_shi | ||
86 | ORR_rrri 1110101 0010 . .... 0 ... .... .... .... @s_rrr_shi | ||
87 | + | ||
88 | + # v8.1M CSEL and friends | ||
89 | + CSEL 1110101 0010 1 rn:4 10 op:2 rd:4 fcond:4 rm:4 | ||
90 | } | ||
91 | { | ||
92 | MVN_rxri 1110101 0011 . 1111 0 ... .... .... .... @s_rxr_shi | ||
93 | @@ -XXX,XX +XXX,XX @@ SBC_rrri 1110101 1011 . .... 0 ... .... .... .... @s_rrr_shi | ||
94 | } | ||
95 | RSB_rrri 1110101 1110 . .... 0 ... .... .... .... @s_rrr_shi | ||
96 | |||
97 | -# v8.1M CSEL and friends | ||
98 | -CSEL 1110101 0010 1 rn:4 10 op:2 rd:4 fcond:4 rm:4 | ||
99 | - | ||
100 | # Data-processing (register-shifted register) | ||
101 | |||
102 | MOV_rxrr 1111 1010 0 shty:2 s:1 rm:4 1111 rd:4 0000 rs:4 \ | ||
103 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
104 | index XXXXXXX..XXXXXXX 100644 | ||
105 | --- a/target/arm/mve_helper.c | ||
106 | +++ b/target/arm/mve_helper.c | ||
107 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(mve_vshlc)(CPUARMState *env, void *vd, uint32_t rdm, | ||
108 | return rdm; | ||
109 | } | ||
110 | |||
111 | +uint64_t HELPER(mve_sshrl)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
112 | +{ | ||
113 | + return do_sqrshl_d(n, -(int8_t)shift, false, NULL); | ||
114 | +} | ||
115 | + | ||
116 | +uint64_t HELPER(mve_ushll)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
117 | +{ | ||
118 | + return do_uqrshl_d(n, (int8_t)shift, false, NULL); | ||
119 | +} | ||
120 | + | ||
121 | uint64_t HELPER(mve_sqshll)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
122 | { | ||
123 | return do_sqrshl_d(n, (int8_t)shift, false, &env->QF); | ||
124 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(mve_uqshll)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
125 | { | ||
126 | return do_uqrshl_d(n, (int8_t)shift, false, &env->QF); | ||
127 | } | ||
128 | + | ||
129 | +uint64_t HELPER(mve_sqrshrl)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
130 | +{ | ||
131 | + return do_sqrshl_d(n, -(int8_t)shift, true, &env->QF); | ||
132 | +} | ||
133 | + | ||
134 | +uint64_t HELPER(mve_uqrshll)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
135 | +{ | ||
136 | + return do_uqrshl_d(n, (int8_t)shift, true, &env->QF); | ||
137 | +} | ||
138 | + | ||
139 | +/* Operate on 64-bit values, but saturate at 48 bits */ | ||
140 | +static inline int64_t do_sqrshl48_d(int64_t src, int64_t shift, | ||
141 | + bool round, uint32_t *sat) | ||
142 | +{ | ||
143 | + if (shift <= -48) { | ||
144 | + /* Rounding the sign bit always produces 0. */ | ||
145 | + if (round) { | ||
146 | + return 0; | ||
147 | + } | ||
148 | + return src >> 63; | ||
149 | + } else if (shift < 0) { | ||
150 | + if (round) { | ||
151 | + src >>= -shift - 1; | ||
152 | + return (src >> 1) + (src & 1); | ||
153 | + } | ||
154 | + return src >> -shift; | ||
155 | + } else if (shift < 48) { | ||
156 | + int64_t val = src << shift; | ||
157 | + int64_t extval = sextract64(val, 0, 48); | ||
158 | + if (!sat || val == extval) { | ||
159 | + return extval; | ||
160 | + } | ||
161 | + } else if (!sat || src == 0) { | ||
162 | + return 0; | 30 | + return 0; |
163 | + } | 31 | + } |
164 | + | 32 | + |
165 | + *sat = 1; | 33 | + ret = MAX(CADENCE_UART_RX_FIFO_SIZE, CADENCE_UART_TX_FIFO_SIZE); |
166 | + return (1ULL << 47) - (src >= 0); | 34 | + ch_mode = s->r[R_MR] & UART_MR_CHMODE; |
167 | +} | 35 | |
168 | + | 36 | if (ch_mode == NORMAL_MODE || ch_mode == ECHO_MODE) { |
169 | +/* Operate on 64-bit values, but saturate at 48 bits */ | 37 | ret = MIN(ret, CADENCE_UART_RX_FIFO_SIZE - s->rx_count); |
170 | +static inline uint64_t do_uqrshl48_d(uint64_t src, int64_t shift, | 38 | @@ -XXX,XX +XXX,XX @@ static void uart_receive(void *opaque, const uint8_t *buf, int size) |
171 | + bool round, uint32_t *sat) | 39 | CadenceUARTState *s = opaque; |
172 | +{ | 40 | uint32_t ch_mode = s->r[R_MR] & UART_MR_CHMODE; |
173 | + uint64_t val, extval; | 41 | |
174 | + | 42 | - /* ignore characters when unclocked or in reset */ |
175 | + if (shift <= -(48 + round)) { | 43 | - if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
176 | + return 0; | 44 | - return; |
177 | + } else if (shift < 0) { | 45 | - } |
178 | + if (round) { | 46 | - |
179 | + val = src >> (-shift - 1); | 47 | if (ch_mode == NORMAL_MODE || ch_mode == ECHO_MODE) { |
180 | + val = (val >> 1) + (val & 1); | 48 | uart_write_rx_fifo(opaque, buf, size); |
181 | + } else { | 49 | } |
182 | + val = src >> -shift; | ||
183 | + } | ||
184 | + extval = extract64(val, 0, 48); | ||
185 | + if (!sat || val == extval) { | ||
186 | + return extval; | ||
187 | + } | ||
188 | + } else if (shift < 48) { | ||
189 | + uint64_t val = src << shift; | ||
190 | + uint64_t extval = extract64(val, 0, 48); | ||
191 | + if (!sat || val == extval) { | ||
192 | + return extval; | ||
193 | + } | ||
194 | + } else if (!sat || src == 0) { | ||
195 | + return 0; | ||
196 | + } | ||
197 | + | ||
198 | + *sat = 1; | ||
199 | + return MAKE_64BIT_MASK(0, 48); | ||
200 | +} | ||
201 | + | ||
202 | +uint64_t HELPER(mve_sqrshrl48)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
203 | +{ | ||
204 | + return do_sqrshl48_d(n, -(int8_t)shift, true, &env->QF); | ||
205 | +} | ||
206 | + | ||
207 | +uint64_t HELPER(mve_uqrshll48)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
208 | +{ | ||
209 | + return do_uqrshl48_d(n, (int8_t)shift, true, &env->QF); | ||
210 | +} | ||
211 | diff --git a/target/arm/translate.c b/target/arm/translate.c | ||
212 | index XXXXXXX..XXXXXXX 100644 | ||
213 | --- a/target/arm/translate.c | ||
214 | +++ b/target/arm/translate.c | ||
215 | @@ -XXX,XX +XXX,XX @@ static bool trans_URSHRL_ri(DisasContext *s, arg_mve_shl_ri *a) | ||
216 | return do_mve_shl_ri(s, a, gen_urshr64_i64); | ||
217 | } | ||
218 | |||
219 | +static bool do_mve_shl_rr(DisasContext *s, arg_mve_shl_rr *a, WideShiftFn *fn) | ||
220 | +{ | ||
221 | + TCGv_i64 rda; | ||
222 | + TCGv_i32 rdalo, rdahi; | ||
223 | + | ||
224 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_1M)) { | ||
225 | + /* Decode falls through to ORR/MOV UNPREDICTABLE handling */ | ||
226 | + return false; | ||
227 | + } | ||
228 | + if (a->rdahi == 15) { | ||
229 | + /* These are a different encoding (SQSHL/SRSHR/UQSHL/URSHR) */ | ||
230 | + return false; | ||
231 | + } | ||
232 | + if (!dc_isar_feature(aa32_mve, s) || | ||
233 | + !arm_dc_feature(s, ARM_FEATURE_M_MAIN) || | ||
234 | + a->rdahi == 13 || a->rm == 13 || a->rm == 15 || | ||
235 | + a->rm == a->rdahi || a->rm == a->rdalo) { | ||
236 | + /* These rdahi/rdalo/rm cases are UNPREDICTABLE; we choose to UNDEF */ | ||
237 | + unallocated_encoding(s); | ||
238 | + return true; | ||
239 | + } | ||
240 | + | ||
241 | + rda = tcg_temp_new_i64(); | ||
242 | + rdalo = load_reg(s, a->rdalo); | ||
243 | + rdahi = load_reg(s, a->rdahi); | ||
244 | + tcg_gen_concat_i32_i64(rda, rdalo, rdahi); | ||
245 | + | ||
246 | + /* The helper takes care of the sign-extension of the low 8 bits of Rm */ | ||
247 | + fn(rda, cpu_env, rda, cpu_R[a->rm]); | ||
248 | + | ||
249 | + tcg_gen_extrl_i64_i32(rdalo, rda); | ||
250 | + tcg_gen_extrh_i64_i32(rdahi, rda); | ||
251 | + store_reg(s, a->rdalo, rdalo); | ||
252 | + store_reg(s, a->rdahi, rdahi); | ||
253 | + tcg_temp_free_i64(rda); | ||
254 | + | ||
255 | + return true; | ||
256 | +} | ||
257 | + | ||
258 | +static bool trans_LSLL_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
259 | +{ | ||
260 | + return do_mve_shl_rr(s, a, gen_helper_mve_ushll); | ||
261 | +} | ||
262 | + | ||
263 | +static bool trans_ASRL_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
264 | +{ | ||
265 | + return do_mve_shl_rr(s, a, gen_helper_mve_sshrl); | ||
266 | +} | ||
267 | + | ||
268 | +static bool trans_UQRSHLL64_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
269 | +{ | ||
270 | + return do_mve_shl_rr(s, a, gen_helper_mve_uqrshll); | ||
271 | +} | ||
272 | + | ||
273 | +static bool trans_SQRSHRL64_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
274 | +{ | ||
275 | + return do_mve_shl_rr(s, a, gen_helper_mve_sqrshrl); | ||
276 | +} | ||
277 | + | ||
278 | +static bool trans_UQRSHLL48_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
279 | +{ | ||
280 | + return do_mve_shl_rr(s, a, gen_helper_mve_uqrshll48); | ||
281 | +} | ||
282 | + | ||
283 | +static bool trans_SQRSHRL48_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
284 | +{ | ||
285 | + return do_mve_shl_rr(s, a, gen_helper_mve_sqrshrl48); | ||
286 | +} | ||
287 | + | ||
288 | /* | ||
289 | * Multiply and multiply accumulate | ||
290 | */ | ||
291 | -- | 50 | -- |
292 | 2.20.1 | 51 | 2.20.1 |
293 | 52 | ||
294 | 53 | diff view generated by jsdifflib |
1 | From: Patrick Venture <venture@google.com> | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | 2 | ||
3 | Adds a line-item reference to the supported quanta-q71l-bmc aspeed | 3 | This converts uart_read() and uart_write() to memop_with_attrs() ops. |
4 | entry. | ||
5 | 4 | ||
6 | Signed-off-by: Patrick Venture <venture@google.com> | 5 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> |
7 | Reviewed-by: Cédric Le Goater <clg@kaod.org> | 6 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> |
8 | Message-id: 20210615192848.1065297-2-venture@google.com | 7 | Reviewed-by: Alistair Francis <alistair.francis@wdc.com> |
8 | Message-id: 20210901124521.30599-5-bmeng.cn@gmail.com | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | docs/system/arm/aspeed.rst | 1 + | 11 | hw/char/cadence_uart.c | 26 +++++++++++++++----------- |
12 | 1 file changed, 1 insertion(+) | 12 | 1 file changed, 15 insertions(+), 11 deletions(-) |
13 | 13 | ||
14 | diff --git a/docs/system/arm/aspeed.rst b/docs/system/arm/aspeed.rst | 14 | diff --git a/hw/char/cadence_uart.c b/hw/char/cadence_uart.c |
15 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/docs/system/arm/aspeed.rst | 16 | --- a/hw/char/cadence_uart.c |
17 | +++ b/docs/system/arm/aspeed.rst | 17 | +++ b/hw/char/cadence_uart.c |
18 | @@ -XXX,XX +XXX,XX @@ etc. | 18 | @@ -XXX,XX +XXX,XX @@ static void uart_read_rx_fifo(CadenceUARTState *s, uint32_t *c) |
19 | AST2400 SoC based machines : | 19 | uart_update_status(s); |
20 | 20 | } | |
21 | - ``palmetto-bmc`` OpenPOWER Palmetto POWER8 BMC | 21 | |
22 | +- ``quanta-q71l-bmc`` OpenBMC Quanta BMC | 22 | -static void uart_write(void *opaque, hwaddr offset, |
23 | 23 | - uint64_t value, unsigned size) | |
24 | AST2500 SoC based machines : | 24 | +static MemTxResult uart_write(void *opaque, hwaddr offset, |
25 | + uint64_t value, unsigned size, MemTxAttrs attrs) | ||
26 | { | ||
27 | CadenceUARTState *s = opaque; | ||
28 | |||
29 | DB_PRINT(" offset:%x data:%08x\n", (unsigned)offset, (unsigned)value); | ||
30 | offset >>= 2; | ||
31 | if (offset >= CADENCE_UART_R_MAX) { | ||
32 | - return; | ||
33 | + return MEMTX_DECODE_ERROR; | ||
34 | } | ||
35 | switch (offset) { | ||
36 | case R_IER: /* ier (wts imr) */ | ||
37 | @@ -XXX,XX +XXX,XX @@ static void uart_write(void *opaque, hwaddr offset, | ||
38 | break; | ||
39 | } | ||
40 | uart_update_status(s); | ||
41 | + | ||
42 | + return MEMTX_OK; | ||
43 | } | ||
44 | |||
45 | -static uint64_t uart_read(void *opaque, hwaddr offset, | ||
46 | - unsigned size) | ||
47 | +static MemTxResult uart_read(void *opaque, hwaddr offset, | ||
48 | + uint64_t *value, unsigned size, MemTxAttrs attrs) | ||
49 | { | ||
50 | CadenceUARTState *s = opaque; | ||
51 | uint32_t c = 0; | ||
52 | |||
53 | offset >>= 2; | ||
54 | if (offset >= CADENCE_UART_R_MAX) { | ||
55 | - c = 0; | ||
56 | - } else if (offset == R_TX_RX) { | ||
57 | + return MEMTX_DECODE_ERROR; | ||
58 | + } | ||
59 | + if (offset == R_TX_RX) { | ||
60 | uart_read_rx_fifo(s, &c); | ||
61 | } else { | ||
62 | - c = s->r[offset]; | ||
63 | + c = s->r[offset]; | ||
64 | } | ||
65 | |||
66 | DB_PRINT(" offset:%x data:%08x\n", (unsigned)(offset << 2), (unsigned)c); | ||
67 | - return c; | ||
68 | + *value = c; | ||
69 | + return MEMTX_OK; | ||
70 | } | ||
71 | |||
72 | static const MemoryRegionOps uart_ops = { | ||
73 | - .read = uart_read, | ||
74 | - .write = uart_write, | ||
75 | + .read_with_attrs = uart_read, | ||
76 | + .write_with_attrs = uart_write, | ||
77 | .endianness = DEVICE_NATIVE_ENDIAN, | ||
78 | }; | ||
25 | 79 | ||
26 | -- | 80 | -- |
27 | 2.20.1 | 81 | 2.20.1 |
28 | 82 | ||
29 | 83 | diff view generated by jsdifflib |
1 | Implement the MVE shift-right-and-narrow insn VSHRN and VRSHRN. | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | 2 | ||
3 | do_urshr() is borrowed from sve_helper.c. | 3 | Read or write to uart registers when unclocked or in reset should be |
4 | ignored. Add the check there, and as a result of this, the check in | ||
5 | uart_write_tx_fifo() is now unnecessary. | ||
4 | 6 | ||
7 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> | ||
8 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
9 | Reviewed-by: Alistair Francis <alistair.francis@wdc.com> | ||
10 | Message-id: 20210901124521.30599-6-bmeng.cn@gmail.com | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20210628135835.6690-12-peter.maydell@linaro.org | ||
8 | --- | 12 | --- |
9 | target/arm/helper-mve.h | 10 ++++++++++ | 13 | hw/char/cadence_uart.c | 15 ++++++++++----- |
10 | target/arm/mve.decode | 11 +++++++++++ | 14 | 1 file changed, 10 insertions(+), 5 deletions(-) |
11 | target/arm/mve_helper.c | 40 ++++++++++++++++++++++++++++++++++++++ | ||
12 | target/arm/translate-mve.c | 15 ++++++++++++++ | ||
13 | 4 files changed, 76 insertions(+) | ||
14 | 15 | ||
15 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 16 | diff --git a/hw/char/cadence_uart.c b/hw/char/cadence_uart.c |
16 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-mve.h | 18 | --- a/hw/char/cadence_uart.c |
18 | +++ b/target/arm/helper-mve.h | 19 | +++ b/hw/char/cadence_uart.c |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vsriw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 20 | @@ -XXX,XX +XXX,XX @@ static gboolean cadence_uart_xmit(void *do_not_use, GIOCondition cond, |
20 | DEF_HELPER_FLAGS_4(mve_vslib, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 21 | static void uart_write_tx_fifo(CadenceUARTState *s, const uint8_t *buf, |
21 | DEF_HELPER_FLAGS_4(mve_vslih, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 22 | int size) |
22 | DEF_HELPER_FLAGS_4(mve_vsliw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 23 | { |
23 | + | 24 | - /* ignore characters when unclocked or in reset */ |
24 | +DEF_HELPER_FLAGS_4(mve_vshrnbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 25 | - if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
25 | +DEF_HELPER_FLAGS_4(mve_vshrnbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 26 | - return; |
26 | +DEF_HELPER_FLAGS_4(mve_vshrntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 27 | - } |
27 | +DEF_HELPER_FLAGS_4(mve_vshrnth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 28 | - |
28 | + | 29 | if ((s->r[R_CR] & UART_CR_TX_DIS) || !(s->r[R_CR] & UART_CR_TX_EN)) { |
29 | +DEF_HELPER_FLAGS_4(mve_vrshrnbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 30 | return; |
30 | +DEF_HELPER_FLAGS_4(mve_vrshrnbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 31 | } |
31 | +DEF_HELPER_FLAGS_4(mve_vrshrntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | @@ -XXX,XX +XXX,XX @@ static MemTxResult uart_write(void *opaque, hwaddr offset, |
32 | +DEF_HELPER_FLAGS_4(mve_vrshrnth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 33 | { |
33 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | 34 | CadenceUARTState *s = opaque; |
34 | index XXXXXXX..XXXXXXX 100644 | 35 | |
35 | --- a/target/arm/mve.decode | 36 | + /* ignore access when unclocked or in reset */ |
36 | +++ b/target/arm/mve.decode | 37 | + if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
37 | @@ -XXX,XX +XXX,XX @@ VSRI 111 1 1111 1 . ... ... ... 0 0100 0 1 . 1 ... 0 @2_shr_w | 38 | + return MEMTX_ERROR; |
38 | VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_b | ||
39 | VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_h | ||
40 | VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_w | ||
41 | + | ||
42 | +# Narrowing shifts (which only support b and h sizes) | ||
43 | +VSHRNB 111 0 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_b | ||
44 | +VSHRNB 111 0 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_h | ||
45 | +VSHRNT 111 0 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_b | ||
46 | +VSHRNT 111 0 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_h | ||
47 | + | ||
48 | +VRSHRNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_b | ||
49 | +VRSHRNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_h | ||
50 | +VRSHRNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_b | ||
51 | +VRSHRNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_h | ||
52 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
53 | index XXXXXXX..XXXXXXX 100644 | ||
54 | --- a/target/arm/mve_helper.c | ||
55 | +++ b/target/arm/mve_helper.c | ||
56 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT_INSERT(vsliw, 4, DO_SHL, SHL_MASK) | ||
57 | |||
58 | DO_VSHLL_ALL(vshllb, false) | ||
59 | DO_VSHLL_ALL(vshllt, true) | ||
60 | + | ||
61 | +/* | ||
62 | + * Narrowing right shifts, taking a double sized input, shifting it | ||
63 | + * and putting the result in either the top or bottom half of the output. | ||
64 | + * ESIZE, TYPE are the output, and LESIZE, LTYPE the input. | ||
65 | + */ | ||
66 | +#define DO_VSHRN(OP, TOP, ESIZE, TYPE, LESIZE, LTYPE, FN) \ | ||
67 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
68 | + void *vm, uint32_t shift) \ | ||
69 | + { \ | ||
70 | + LTYPE *m = vm; \ | ||
71 | + TYPE *d = vd; \ | ||
72 | + uint16_t mask = mve_element_mask(env); \ | ||
73 | + unsigned le; \ | ||
74 | + for (le = 0; le < 16 / LESIZE; le++, mask >>= LESIZE) { \ | ||
75 | + TYPE r = FN(m[H##LESIZE(le)], shift); \ | ||
76 | + mergemask(&d[H##ESIZE(le * 2 + TOP)], r, mask); \ | ||
77 | + } \ | ||
78 | + mve_advance_vpt(env); \ | ||
79 | + } | 39 | + } |
80 | + | 40 | + |
81 | +#define DO_VSHRN_ALL(OP, FN) \ | 41 | DB_PRINT(" offset:%x data:%08x\n", (unsigned)offset, (unsigned)value); |
82 | + DO_VSHRN(OP##bb, false, 1, uint8_t, 2, uint16_t, FN) \ | 42 | offset >>= 2; |
83 | + DO_VSHRN(OP##bh, false, 2, uint16_t, 4, uint32_t, FN) \ | 43 | if (offset >= CADENCE_UART_R_MAX) { |
84 | + DO_VSHRN(OP##tb, true, 1, uint8_t, 2, uint16_t, FN) \ | 44 | @@ -XXX,XX +XXX,XX @@ static MemTxResult uart_read(void *opaque, hwaddr offset, |
85 | + DO_VSHRN(OP##th, true, 2, uint16_t, 4, uint32_t, FN) | 45 | CadenceUARTState *s = opaque; |
86 | + | 46 | uint32_t c = 0; |
87 | +static inline uint64_t do_urshr(uint64_t x, unsigned sh) | 47 | |
88 | +{ | 48 | + /* ignore access when unclocked or in reset */ |
89 | + if (likely(sh < 64)) { | 49 | + if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
90 | + return (x >> sh) + ((x >> (sh - 1)) & 1); | 50 | + return MEMTX_ERROR; |
91 | + } else if (sh == 64) { | ||
92 | + return x >> 63; | ||
93 | + } else { | ||
94 | + return 0; | ||
95 | + } | ||
96 | +} | ||
97 | + | ||
98 | +DO_VSHRN_ALL(vshrn, DO_SHR) | ||
99 | +DO_VSHRN_ALL(vrshrn, do_urshr) | ||
100 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
101 | index XXXXXXX..XXXXXXX 100644 | ||
102 | --- a/target/arm/translate-mve.c | ||
103 | +++ b/target/arm/translate-mve.c | ||
104 | @@ -XXX,XX +XXX,XX @@ DO_VSHLL(VSHLL_BS, vshllbs) | ||
105 | DO_VSHLL(VSHLL_BU, vshllbu) | ||
106 | DO_VSHLL(VSHLL_TS, vshllts) | ||
107 | DO_VSHLL(VSHLL_TU, vshlltu) | ||
108 | + | ||
109 | +#define DO_2SHIFT_N(INSN, FN) \ | ||
110 | + static bool trans_##INSN(DisasContext *s, arg_2shift *a) \ | ||
111 | + { \ | ||
112 | + static MVEGenTwoOpShiftFn * const fns[] = { \ | ||
113 | + gen_helper_mve_##FN##b, \ | ||
114 | + gen_helper_mve_##FN##h, \ | ||
115 | + }; \ | ||
116 | + return do_2shift(s, a, fns[a->size], false); \ | ||
117 | + } | 51 | + } |
118 | + | 52 | + |
119 | +DO_2SHIFT_N(VSHRNB, vshrnb) | 53 | offset >>= 2; |
120 | +DO_2SHIFT_N(VSHRNT, vshrnt) | 54 | if (offset >= CADENCE_UART_R_MAX) { |
121 | +DO_2SHIFT_N(VRSHRNB, vrshrnb) | 55 | return MEMTX_DECODE_ERROR; |
122 | +DO_2SHIFT_N(VRSHRNT, vrshrnt) | ||
123 | -- | 56 | -- |
124 | 2.20.1 | 57 | 2.20.1 |
125 | 58 | ||
126 | 59 | diff view generated by jsdifflib |
1 | The A64 AdvSIMD modified-immediate grouping uses almost the same | 1 | From: Bin Meng <bmeng.cn@gmail.com> |
---|---|---|---|
2 | constant encoding that A32 Neon does; reuse asimd_imm_const() (to | ||
3 | which we add the AArch64-specific case for cmode 15 op 1) instead of | ||
4 | reimplementing it all. | ||
5 | 2 | ||
3 | We've got SW that expects FSBL (Bootlooader) to setup clocks and | ||
4 | resets. It's quite common that users run that SW on QEMU without | ||
5 | FSBL (FSBL typically requires the Xilinx tools installed). That's | ||
6 | fine, since users can stil use -device loader to enable clocks etc. | ||
7 | |||
8 | To help folks understand what's going, a log (guest-error) message | ||
9 | would be helpful here. In particular with the serial port since | ||
10 | things will go very quiet if they get things wrong. | ||
11 | |||
12 | Suggested-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
13 | Signed-off-by: Bin Meng <bmeng.cn@gmail.com> | ||
14 | Reviewed-by: Edgar E. Iglesias <edgar.iglesias@xilinx.com> | ||
15 | Reviewed-by: Alistair Francis <alistair.francis@wdc.com> | ||
16 | Message-id: 20210901124521.30599-7-bmeng.cn@gmail.com | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 17 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20210628135835.6690-5-peter.maydell@linaro.org | ||
9 | --- | 18 | --- |
10 | target/arm/translate.h | 3 +- | 19 | hw/char/cadence_uart.c | 8 ++++++++ |
11 | target/arm/translate-a64.c | 86 ++++---------------------------------- | 20 | 1 file changed, 8 insertions(+) |
12 | target/arm/translate.c | 17 +++++++- | ||
13 | 3 files changed, 24 insertions(+), 82 deletions(-) | ||
14 | 21 | ||
15 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 22 | diff --git a/hw/char/cadence_uart.c b/hw/char/cadence_uart.c |
16 | index XXXXXXX..XXXXXXX 100644 | 23 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate.h | 24 | --- a/hw/char/cadence_uart.c |
18 | +++ b/target/arm/translate.h | 25 | +++ b/hw/char/cadence_uart.c |
19 | @@ -XXX,XX +XXX,XX @@ static inline MemOp finalize_memop(DisasContext *s, MemOp opc) | 26 | @@ -XXX,XX +XXX,XX @@ static int uart_can_receive(void *opaque) |
20 | * VMVN and VBIC (when cmode < 14 && op == 1). | 27 | |
21 | * | 28 | /* ignore characters when unclocked or in reset */ |
22 | * The combination cmode == 15 op == 1 is a reserved encoding for AArch32; | 29 | if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
23 | - * callers must catch this. | 30 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: uart is unclocked or in reset\n", |
24 | + * callers must catch this; we return the 64-bit constant value defined | 31 | + __func__); |
25 | + * for AArch64. | 32 | return 0; |
26 | * | 33 | } |
27 | * cmode = 2,3,4,5,6,7,10,11,12,13 imm=0 was UNPREDICTABLE in v7A but | 34 | |
28 | * is either not unpredictable or merely CONSTRAINED UNPREDICTABLE in v8A; | 35 | @@ -XXX,XX +XXX,XX @@ static void uart_event(void *opaque, QEMUChrEvent event) |
29 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 36 | |
30 | index XXXXXXX..XXXXXXX 100644 | 37 | /* ignore characters when unclocked or in reset */ |
31 | --- a/target/arm/translate-a64.c | 38 | if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
32 | +++ b/target/arm/translate-a64.c | 39 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: uart is unclocked or in reset\n", |
33 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | 40 | + __func__); |
34 | { | ||
35 | int rd = extract32(insn, 0, 5); | ||
36 | int cmode = extract32(insn, 12, 4); | ||
37 | - int cmode_3_1 = extract32(cmode, 1, 3); | ||
38 | - int cmode_0 = extract32(cmode, 0, 1); | ||
39 | int o2 = extract32(insn, 11, 1); | ||
40 | uint64_t abcdefgh = extract32(insn, 5, 5) | (extract32(insn, 16, 3) << 5); | ||
41 | bool is_neg = extract32(insn, 29, 1); | ||
42 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | ||
43 | return; | 41 | return; |
44 | } | 42 | } |
45 | 43 | ||
46 | - /* See AdvSIMDExpandImm() in ARM ARM */ | 44 | @@ -XXX,XX +XXX,XX @@ static MemTxResult uart_write(void *opaque, hwaddr offset, |
47 | - switch (cmode_3_1) { | 45 | |
48 | - case 0: /* Replicate(Zeros(24):imm8, 2) */ | 46 | /* ignore access when unclocked or in reset */ |
49 | - case 1: /* Replicate(Zeros(16):imm8:Zeros(8), 2) */ | 47 | if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
50 | - case 2: /* Replicate(Zeros(8):imm8:Zeros(16), 2) */ | 48 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: uart is unclocked or in reset\n", |
51 | - case 3: /* Replicate(imm8:Zeros(24), 2) */ | 49 | + __func__); |
52 | - { | 50 | return MEMTX_ERROR; |
53 | - int shift = cmode_3_1 * 8; | ||
54 | - imm = bitfield_replicate(abcdefgh << shift, 32); | ||
55 | - break; | ||
56 | - } | ||
57 | - case 4: /* Replicate(Zeros(8):imm8, 4) */ | ||
58 | - case 5: /* Replicate(imm8:Zeros(8), 4) */ | ||
59 | - { | ||
60 | - int shift = (cmode_3_1 & 0x1) * 8; | ||
61 | - imm = bitfield_replicate(abcdefgh << shift, 16); | ||
62 | - break; | ||
63 | - } | ||
64 | - case 6: | ||
65 | - if (cmode_0) { | ||
66 | - /* Replicate(Zeros(8):imm8:Ones(16), 2) */ | ||
67 | - imm = (abcdefgh << 16) | 0xffff; | ||
68 | - } else { | ||
69 | - /* Replicate(Zeros(16):imm8:Ones(8), 2) */ | ||
70 | - imm = (abcdefgh << 8) | 0xff; | ||
71 | - } | ||
72 | - imm = bitfield_replicate(imm, 32); | ||
73 | - break; | ||
74 | - case 7: | ||
75 | - if (!cmode_0 && !is_neg) { | ||
76 | - imm = bitfield_replicate(abcdefgh, 8); | ||
77 | - } else if (!cmode_0 && is_neg) { | ||
78 | - int i; | ||
79 | - imm = 0; | ||
80 | - for (i = 0; i < 8; i++) { | ||
81 | - if ((abcdefgh) & (1 << i)) { | ||
82 | - imm |= 0xffULL << (i * 8); | ||
83 | - } | ||
84 | - } | ||
85 | - } else if (cmode_0) { | ||
86 | - if (is_neg) { | ||
87 | - imm = (abcdefgh & 0x3f) << 48; | ||
88 | - if (abcdefgh & 0x80) { | ||
89 | - imm |= 0x8000000000000000ULL; | ||
90 | - } | ||
91 | - if (abcdefgh & 0x40) { | ||
92 | - imm |= 0x3fc0000000000000ULL; | ||
93 | - } else { | ||
94 | - imm |= 0x4000000000000000ULL; | ||
95 | - } | ||
96 | - } else { | ||
97 | - if (o2) { | ||
98 | - /* FMOV (vector, immediate) - half-precision */ | ||
99 | - imm = vfp_expand_imm(MO_16, abcdefgh); | ||
100 | - /* now duplicate across the lanes */ | ||
101 | - imm = bitfield_replicate(imm, 16); | ||
102 | - } else { | ||
103 | - imm = (abcdefgh & 0x3f) << 19; | ||
104 | - if (abcdefgh & 0x80) { | ||
105 | - imm |= 0x80000000; | ||
106 | - } | ||
107 | - if (abcdefgh & 0x40) { | ||
108 | - imm |= 0x3e000000; | ||
109 | - } else { | ||
110 | - imm |= 0x40000000; | ||
111 | - } | ||
112 | - imm |= (imm << 32); | ||
113 | - } | ||
114 | - } | ||
115 | - } | ||
116 | - break; | ||
117 | - default: | ||
118 | - g_assert_not_reached(); | ||
119 | - } | ||
120 | - | ||
121 | - if (cmode_3_1 != 7 && is_neg) { | ||
122 | - imm = ~imm; | ||
123 | + if (cmode == 15 && o2 && !is_neg) { | ||
124 | + /* FMOV (vector, immediate) - half-precision */ | ||
125 | + imm = vfp_expand_imm(MO_16, abcdefgh); | ||
126 | + /* now duplicate across the lanes */ | ||
127 | + imm = bitfield_replicate(imm, 16); | ||
128 | + } else { | ||
129 | + imm = asimd_imm_const(abcdefgh, cmode, is_neg); | ||
130 | } | 51 | } |
131 | 52 | ||
132 | if (!((cmode & 0x9) == 0x1 || (cmode & 0xd) == 0x9)) { | 53 | @@ -XXX,XX +XXX,XX @@ static MemTxResult uart_read(void *opaque, hwaddr offset, |
133 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 54 | |
134 | index XXXXXXX..XXXXXXX 100644 | 55 | /* ignore access when unclocked or in reset */ |
135 | --- a/target/arm/translate.c | 56 | if (!clock_is_enabled(s->refclk) || device_is_in_reset(DEVICE(s))) { |
136 | +++ b/target/arm/translate.c | 57 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: uart is unclocked or in reset\n", |
137 | @@ -XXX,XX +XXX,XX @@ uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) | 58 | + __func__); |
138 | case 14: | 59 | return MEMTX_ERROR; |
139 | if (op) { | 60 | } |
140 | /* | 61 | |
141 | - * This is the only case where the top and bottom 32 bits | ||
142 | - * of the encoded constant differ. | ||
143 | + * This and cmode == 15 op == 1 are the only cases where | ||
144 | + * the top and bottom 32 bits of the encoded constant differ. | ||
145 | */ | ||
146 | uint64_t imm64 = 0; | ||
147 | int n; | ||
148 | @@ -XXX,XX +XXX,XX @@ uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) | ||
149 | imm |= (imm << 8) | (imm << 16) | (imm << 24); | ||
150 | break; | ||
151 | case 15: | ||
152 | + if (op) { | ||
153 | + /* Reserved encoding for AArch32; valid for AArch64 */ | ||
154 | + uint64_t imm64 = (uint64_t)(imm & 0x3f) << 48; | ||
155 | + if (imm & 0x80) { | ||
156 | + imm64 |= 0x8000000000000000ULL; | ||
157 | + } | ||
158 | + if (imm & 0x40) { | ||
159 | + imm64 |= 0x3fc0000000000000ULL; | ||
160 | + } else { | ||
161 | + imm64 |= 0x4000000000000000ULL; | ||
162 | + } | ||
163 | + return imm64; | ||
164 | + } | ||
165 | imm = ((imm & 0x80) << 24) | ((imm & 0x3f) << 19) | ||
166 | | ((imm & 0x40) ? (0x1f << 25) : (1 << 30)); | ||
167 | break; | ||
168 | -- | 62 | -- |
169 | 2.20.1 | 63 | 2.20.1 |
170 | 64 | ||
171 | 65 | diff view generated by jsdifflib |
1 | Implement the MVE VSRI and VSLI insns, which perform a | 1 | From: Marc Zyngier <maz@kernel.org> |
---|---|---|---|
2 | shift-and-insert operation. | ||
3 | 2 | ||
3 | Although we probe for the IPA limits imposed by KVM (and the hardware) | ||
4 | when computing the memory map, we still use the old style '0' when | ||
5 | creating a scratch VM in kvm_arm_create_scratch_host_vcpu(). | ||
6 | |||
7 | On systems that are severely IPA challenged (such as the Apple M1), | ||
8 | this results in a failure as KVM cannot use the default 40bit that | ||
9 | '0' represents. | ||
10 | |||
11 | Instead, probe for the extension and use the reported IPA limit | ||
12 | if available. | ||
13 | |||
14 | Cc: Andrew Jones <drjones@redhat.com> | ||
15 | Cc: Eric Auger <eric.auger@redhat.com> | ||
16 | Cc: Peter Maydell <peter.maydell@linaro.org> | ||
17 | Signed-off-by: Marc Zyngier <maz@kernel.org> | ||
18 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
19 | Message-id: 20210822144441.1290891-2-maz@kernel.org | ||
4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 20 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
6 | Message-id: 20210628135835.6690-11-peter.maydell@linaro.org | ||
7 | --- | 21 | --- |
8 | target/arm/helper-mve.h | 8 ++++++++ | 22 | target/arm/kvm.c | 7 ++++++- |
9 | target/arm/mve.decode | 9 ++++++++ | 23 | 1 file changed, 6 insertions(+), 1 deletion(-) |
10 | target/arm/mve_helper.c | 42 ++++++++++++++++++++++++++++++++++++++ | ||
11 | target/arm/translate-mve.c | 3 +++ | ||
12 | 4 files changed, 62 insertions(+) | ||
13 | 24 | ||
14 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 25 | diff --git a/target/arm/kvm.c b/target/arm/kvm.c |
15 | index XXXXXXX..XXXXXXX 100644 | 26 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/helper-mve.h | 27 | --- a/target/arm/kvm.c |
17 | +++ b/target/arm/helper-mve.h | 28 | +++ b/target/arm/kvm.c |
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vshlltsb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 29 | @@ -XXX,XX +XXX,XX @@ bool kvm_arm_create_scratch_host_vcpu(const uint32_t *cpus_to_try, |
19 | DEF_HELPER_FLAGS_4(mve_vshlltsh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 30 | struct kvm_vcpu_init *init) |
20 | DEF_HELPER_FLAGS_4(mve_vshlltub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 31 | { |
21 | DEF_HELPER_FLAGS_4(mve_vshlltuh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | int ret = 0, kvmfd = -1, vmfd = -1, cpufd = -1; |
22 | + | 33 | + int max_vm_pa_size; |
23 | +DEF_HELPER_FLAGS_4(mve_vsrib, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 34 | |
24 | +DEF_HELPER_FLAGS_4(mve_vsrih, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 35 | kvmfd = qemu_open_old("/dev/kvm", O_RDWR); |
25 | +DEF_HELPER_FLAGS_4(mve_vsriw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 36 | if (kvmfd < 0) { |
26 | + | 37 | goto err; |
27 | +DEF_HELPER_FLAGS_4(mve_vslib, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 38 | } |
28 | +DEF_HELPER_FLAGS_4(mve_vslih, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 39 | - vmfd = ioctl(kvmfd, KVM_CREATE_VM, 0); |
29 | +DEF_HELPER_FLAGS_4(mve_vsliw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 40 | + max_vm_pa_size = ioctl(kvmfd, KVM_CHECK_EXTENSION, KVM_CAP_ARM_VM_IPA_SIZE); |
30 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | 41 | + if (max_vm_pa_size < 0) { |
31 | index XXXXXXX..XXXXXXX 100644 | 42 | + max_vm_pa_size = 0; |
32 | --- a/target/arm/mve.decode | ||
33 | +++ b/target/arm/mve.decode | ||
34 | @@ -XXX,XX +XXX,XX @@ VSHLL_TS 111 0 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_h | ||
35 | |||
36 | VSHLL_TU 111 1 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_b | ||
37 | VSHLL_TU 111 1 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_h | ||
38 | + | ||
39 | +# Shift-and-insert | ||
40 | +VSRI 111 1 1111 1 . ... ... ... 0 0100 0 1 . 1 ... 0 @2_shr_b | ||
41 | +VSRI 111 1 1111 1 . ... ... ... 0 0100 0 1 . 1 ... 0 @2_shr_h | ||
42 | +VSRI 111 1 1111 1 . ... ... ... 0 0100 0 1 . 1 ... 0 @2_shr_w | ||
43 | + | ||
44 | +VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_b | ||
45 | +VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_h | ||
46 | +VSLI 111 1 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_w | ||
47 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
48 | index XXXXXXX..XXXXXXX 100644 | ||
49 | --- a/target/arm/mve_helper.c | ||
50 | +++ b/target/arm/mve_helper.c | ||
51 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT_SAT_S(vqshlui_s, DO_SUQSHL_OP) | ||
52 | DO_2SHIFT_U(vrshli_u, DO_VRSHLU) | ||
53 | DO_2SHIFT_S(vrshli_s, DO_VRSHLS) | ||
54 | |||
55 | +/* Shift-and-insert; we always work with 64 bits at a time */ | ||
56 | +#define DO_2SHIFT_INSERT(OP, ESIZE, SHIFTFN, MASKFN) \ | ||
57 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
58 | + void *vm, uint32_t shift) \ | ||
59 | + { \ | ||
60 | + uint64_t *d = vd, *m = vm; \ | ||
61 | + uint16_t mask; \ | ||
62 | + uint64_t shiftmask; \ | ||
63 | + unsigned e; \ | ||
64 | + if (shift == 0 || shift == ESIZE * 8) { \ | ||
65 | + /* \ | ||
66 | + * Only VSLI can shift by 0; only VSRI can shift by <dt>. \ | ||
67 | + * The generic logic would give the right answer for 0 but \ | ||
68 | + * fails for <dt>. \ | ||
69 | + */ \ | ||
70 | + goto done; \ | ||
71 | + } \ | ||
72 | + assert(shift < ESIZE * 8); \ | ||
73 | + mask = mve_element_mask(env); \ | ||
74 | + /* ESIZE / 2 gives the MO_* value if ESIZE is in [1,2,4] */ \ | ||
75 | + shiftmask = dup_const(ESIZE / 2, MASKFN(ESIZE * 8, shift)); \ | ||
76 | + for (e = 0; e < 16 / 8; e++, mask >>= 8) { \ | ||
77 | + uint64_t r = (SHIFTFN(m[H8(e)], shift) & shiftmask) | \ | ||
78 | + (d[H8(e)] & ~shiftmask); \ | ||
79 | + mergemask(&d[H8(e)], r, mask); \ | ||
80 | + } \ | ||
81 | +done: \ | ||
82 | + mve_advance_vpt(env); \ | ||
83 | + } | 43 | + } |
84 | + | 44 | + vmfd = ioctl(kvmfd, KVM_CREATE_VM, max_vm_pa_size); |
85 | +#define DO_SHL(N, SHIFT) ((N) << (SHIFT)) | 45 | if (vmfd < 0) { |
86 | +#define DO_SHR(N, SHIFT) ((N) >> (SHIFT)) | 46 | goto err; |
87 | +#define SHL_MASK(EBITS, SHIFT) MAKE_64BIT_MASK((SHIFT), (EBITS) - (SHIFT)) | 47 | } |
88 | +#define SHR_MASK(EBITS, SHIFT) MAKE_64BIT_MASK(0, (EBITS) - (SHIFT)) | ||
89 | + | ||
90 | +DO_2SHIFT_INSERT(vsrib, 1, DO_SHR, SHR_MASK) | ||
91 | +DO_2SHIFT_INSERT(vsrih, 2, DO_SHR, SHR_MASK) | ||
92 | +DO_2SHIFT_INSERT(vsriw, 4, DO_SHR, SHR_MASK) | ||
93 | +DO_2SHIFT_INSERT(vslib, 1, DO_SHL, SHL_MASK) | ||
94 | +DO_2SHIFT_INSERT(vslih, 2, DO_SHL, SHL_MASK) | ||
95 | +DO_2SHIFT_INSERT(vsliw, 4, DO_SHL, SHL_MASK) | ||
96 | + | ||
97 | /* | ||
98 | * Long shifts taking half-sized inputs from top or bottom of the input | ||
99 | * vector and producing a double-width result. ESIZE, TYPE are for | ||
100 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
101 | index XXXXXXX..XXXXXXX 100644 | ||
102 | --- a/target/arm/translate-mve.c | ||
103 | +++ b/target/arm/translate-mve.c | ||
104 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT(VSHRI_U, vshli_u, true) | ||
105 | DO_2SHIFT(VRSHRI_S, vrshli_s, true) | ||
106 | DO_2SHIFT(VRSHRI_U, vrshli_u, true) | ||
107 | |||
108 | +DO_2SHIFT(VSRI, vsri, false) | ||
109 | +DO_2SHIFT(VSLI, vsli, false) | ||
110 | + | ||
111 | #define DO_VSHLL(INSN, FN) \ | ||
112 | static bool trans_##INSN(DisasContext *s, arg_2shift *a) \ | ||
113 | { \ | ||
114 | -- | 48 | -- |
115 | 2.20.1 | 49 | 2.20.1 |
116 | 50 | ||
117 | 51 | diff view generated by jsdifflib |
1 | From: Patrick Venture <venture@google.com> | 1 | From: Chris Rauer <crauer@google.com> |
---|---|---|---|
2 | 2 | ||
3 | Add line item reference to quanta-gbs-bmc machine. | 3 | kudo-bmc is a board supported by OpenBMC. |
4 | https://github.com/openbmc/openbmc/tree/master/meta-fii/meta-kudo | ||
4 | 5 | ||
5 | Signed-off-by: Patrick Venture <venture@google.com> | 6 | Since v1: |
6 | Reviewed-by: Cédric Le Goater <clg@kaod.org> | 7 | - hyphenated Cortex-A9 |
7 | Message-id: 20210615192848.1065297-3-venture@google.com | 8 | |
8 | [PMM: fixed underline Sphinx warning] | 9 | Tested: Booted kudo firmware. |
10 | Signed-off-by: Chris Rauer <crauer@google.com> | ||
11 | Reviewed-by: Patrick Venture <venture@google.com> | ||
12 | Message-id: 20210907223234.1165705-1-crauer@google.com | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 14 | --- |
11 | docs/system/arm/nuvoton.rst | 5 +++-- | 15 | docs/system/arm/nuvoton.rst | 1 + |
12 | 1 file changed, 3 insertions(+), 2 deletions(-) | 16 | hw/arm/npcm7xx_boards.c | 34 ++++++++++++++++++++++++++++++++++ |
17 | 2 files changed, 35 insertions(+) | ||
13 | 18 | ||
14 | diff --git a/docs/system/arm/nuvoton.rst b/docs/system/arm/nuvoton.rst | 19 | diff --git a/docs/system/arm/nuvoton.rst b/docs/system/arm/nuvoton.rst |
15 | index XXXXXXX..XXXXXXX 100644 | 20 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/docs/system/arm/nuvoton.rst | 21 | --- a/docs/system/arm/nuvoton.rst |
17 | +++ b/docs/system/arm/nuvoton.rst | 22 | +++ b/docs/system/arm/nuvoton.rst |
23 | @@ -XXX,XX +XXX,XX @@ Hyperscale applications. The following machines are based on this chip : | ||
24 | |||
25 | - ``quanta-gbs-bmc`` Quanta GBS server BMC | ||
26 | - ``quanta-gsj`` Quanta GSJ server BMC | ||
27 | +- ``kudo-bmc`` Fii USA Kudo server BMC | ||
28 | |||
29 | There are also two more SoCs, NPCM710 and NPCM705, which are single-core | ||
30 | variants of NPCM750 and NPCM730, respectively. These are currently not | ||
31 | diff --git a/hw/arm/npcm7xx_boards.c b/hw/arm/npcm7xx_boards.c | ||
32 | index XXXXXXX..XXXXXXX 100644 | ||
33 | --- a/hw/arm/npcm7xx_boards.c | ||
34 | +++ b/hw/arm/npcm7xx_boards.c | ||
18 | @@ -XXX,XX +XXX,XX @@ | 35 | @@ -XXX,XX +XXX,XX @@ |
19 | -Nuvoton iBMC boards (``npcm750-evb``, ``quanta-gsj``) | 36 | #define NPCM750_EVB_POWER_ON_STRAPS 0x00001ff7 |
20 | -===================================================== | 37 | #define QUANTA_GSJ_POWER_ON_STRAPS 0x00001fff |
21 | +Nuvoton iBMC boards (``*-bmc``, ``npcm750-evb``, ``quanta-gsj``) | 38 | #define QUANTA_GBS_POWER_ON_STRAPS 0x000017ff |
22 | +================================================================ | 39 | +#define KUDO_BMC_POWER_ON_STRAPS 0x00001fff |
23 | 40 | ||
24 | The `Nuvoton iBMC`_ chips (NPCM7xx) are a family of ARM-based SoCs that are | 41 | static const char npcm7xx_default_bootrom[] = "npcm7xx_bootrom.bin"; |
25 | designed to be used as Baseboard Management Controllers (BMCs) in various | 42 | |
26 | @@ -XXX,XX +XXX,XX @@ segment. The following machines are based on this chip : | 43 | @@ -XXX,XX +XXX,XX @@ static void quanta_gbs_init(MachineState *machine) |
27 | The NPCM730 SoC has two Cortex-A9 cores and is targeted for Data Center and | 44 | npcm7xx_load_kernel(machine, soc); |
28 | Hyperscale applications. The following machines are based on this chip : | 45 | } |
29 | 46 | ||
30 | +- ``quanta-gbs-bmc`` Quanta GBS server BMC | 47 | +static void kudo_bmc_init(MachineState *machine) |
31 | - ``quanta-gsj`` Quanta GSJ server BMC | 48 | +{ |
32 | 49 | + NPCM7xxState *soc; | |
33 | There are also two more SoCs, NPCM710 and NPCM705, which are single-core | 50 | + |
51 | + soc = npcm7xx_create_soc(machine, KUDO_BMC_POWER_ON_STRAPS); | ||
52 | + npcm7xx_connect_dram(soc, machine->ram); | ||
53 | + qdev_realize(DEVICE(soc), NULL, &error_fatal); | ||
54 | + | ||
55 | + npcm7xx_load_bootrom(machine, soc); | ||
56 | + npcm7xx_connect_flash(&soc->fiu[0], 0, "mx66u51235f", | ||
57 | + drive_get(IF_MTD, 0, 0)); | ||
58 | + npcm7xx_connect_flash(&soc->fiu[1], 0, "mx66u51235f", | ||
59 | + drive_get(IF_MTD, 3, 0)); | ||
60 | + | ||
61 | + npcm7xx_load_kernel(machine, soc); | ||
62 | +} | ||
63 | + | ||
64 | static void npcm7xx_set_soc_type(NPCM7xxMachineClass *nmc, const char *type) | ||
65 | { | ||
66 | NPCM7xxClass *sc = NPCM7XX_CLASS(object_class_by_name(type)); | ||
67 | @@ -XXX,XX +XXX,XX @@ static void gbs_bmc_machine_class_init(ObjectClass *oc, void *data) | ||
68 | mc->default_ram_size = 1 * GiB; | ||
69 | } | ||
70 | |||
71 | +static void kudo_bmc_machine_class_init(ObjectClass *oc, void *data) | ||
72 | +{ | ||
73 | + NPCM7xxMachineClass *nmc = NPCM7XX_MACHINE_CLASS(oc); | ||
74 | + MachineClass *mc = MACHINE_CLASS(oc); | ||
75 | + | ||
76 | + npcm7xx_set_soc_type(nmc, TYPE_NPCM730); | ||
77 | + | ||
78 | + mc->desc = "Kudo BMC (Cortex-A9)"; | ||
79 | + mc->init = kudo_bmc_init; | ||
80 | + mc->default_ram_size = 1 * GiB; | ||
81 | +}; | ||
82 | + | ||
83 | static const TypeInfo npcm7xx_machine_types[] = { | ||
84 | { | ||
85 | .name = TYPE_NPCM7XX_MACHINE, | ||
86 | @@ -XXX,XX +XXX,XX @@ static const TypeInfo npcm7xx_machine_types[] = { | ||
87 | .name = MACHINE_TYPE_NAME("quanta-gbs-bmc"), | ||
88 | .parent = TYPE_NPCM7XX_MACHINE, | ||
89 | .class_init = gbs_bmc_machine_class_init, | ||
90 | + }, { | ||
91 | + .name = MACHINE_TYPE_NAME("kudo-bmc"), | ||
92 | + .parent = TYPE_NPCM7XX_MACHINE, | ||
93 | + .class_init = kudo_bmc_machine_class_init, | ||
94 | }, | ||
95 | }; | ||
96 | |||
34 | -- | 97 | -- |
35 | 2.20.1 | 98 | 2.20.1 |
36 | 99 | ||
37 | 100 | diff view generated by jsdifflib |
1 | From: Nolan Leake <nolan@sigbus.net> | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This is just enough to make reboot and poweroff work. Works for | 3 | Added register definitions relevant to ITS,implemented overall |
4 | linux, u-boot, and the arm trusted firmware. Not tested, but should | 4 | ITS device framework with stubs for ITS control and translater |
5 | work for plan9, and bare-metal/hobby OSes, since they seem to generally | 5 | regions read/write,extended ITS common to handle mmio init between |
6 | do what linux does for reset. | 6 | existing kvm device and newer qemu device. |
7 | 7 | ||
8 | The watchdog timer functionality is not yet implemented. | 8 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> |
9 | 9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | |
10 | Resolves: https://gitlab.com/qemu-project/qemu/-/issues/64 | 10 | Reviewed-by: Eric Auger <eric.auger@redhat.com> |
11 | Signed-off-by: Nolan Leake <nolan@sigbus.net> | 11 | Tested-by: Neil Armstrong <narmstrong@baylibre.com> |
12 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | 12 | Message-id: 20210910143951.92242-2-shashi.mallela@linaro.org |
13 | Tested-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
14 | Message-id: 20210625210209.1870217-1-nolan@sigbus.net | ||
15 | [PMM: tweaked commit title; fixed region size to 0x200; | ||
16 | moved header file to include/] | ||
17 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
18 | --- | 14 | --- |
19 | include/hw/arm/bcm2835_peripherals.h | 3 +- | 15 | hw/intc/gicv3_internal.h | 96 +++++++++- |
20 | include/hw/misc/bcm2835_powermgt.h | 29 +++++ | 16 | include/hw/intc/arm_gicv3_its_common.h | 9 +- |
21 | hw/arm/bcm2835_peripherals.c | 13 ++- | 17 | hw/intc/arm_gicv3_its.c | 241 +++++++++++++++++++++++++ |
22 | hw/misc/bcm2835_powermgt.c | 160 +++++++++++++++++++++++++++ | 18 | hw/intc/arm_gicv3_its_common.c | 7 +- |
23 | hw/misc/meson.build | 1 + | 19 | hw/intc/arm_gicv3_its_kvm.c | 2 +- |
24 | 5 files changed, 204 insertions(+), 2 deletions(-) | 20 | hw/intc/meson.build | 1 + |
25 | create mode 100644 include/hw/misc/bcm2835_powermgt.h | 21 | 6 files changed, 342 insertions(+), 14 deletions(-) |
26 | create mode 100644 hw/misc/bcm2835_powermgt.c | 22 | create mode 100644 hw/intc/arm_gicv3_its.c |
27 | 23 | ||
28 | diff --git a/include/hw/arm/bcm2835_peripherals.h b/include/hw/arm/bcm2835_peripherals.h | 24 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
29 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
30 | --- a/include/hw/arm/bcm2835_peripherals.h | 26 | --- a/hw/intc/gicv3_internal.h |
31 | +++ b/include/hw/arm/bcm2835_peripherals.h | 27 | +++ b/hw/intc/gicv3_internal.h |
32 | @@ -XXX,XX +XXX,XX @@ | 28 | @@ -XXX,XX +XXX,XX @@ |
33 | #include "hw/misc/bcm2835_mphi.h" | 29 | #ifndef QEMU_ARM_GICV3_INTERNAL_H |
34 | #include "hw/misc/bcm2835_thermal.h" | 30 | #define QEMU_ARM_GICV3_INTERNAL_H |
35 | #include "hw/misc/bcm2835_cprman.h" | 31 | |
36 | +#include "hw/misc/bcm2835_powermgt.h" | 32 | +#include "hw/registerfields.h" |
37 | #include "hw/sd/sdhci.h" | 33 | #include "hw/intc/arm_gicv3_common.h" |
38 | #include "hw/sd/bcm2835_sdhost.h" | 34 | |
39 | #include "hw/gpio/bcm2835_gpio.h" | 35 | /* Distributor registers, as offsets from the distributor base address */ |
40 | @@ -XXX,XX +XXX,XX @@ struct BCM2835PeripheralState { | 36 | @@ -XXX,XX +XXX,XX @@ |
41 | BCM2835MphiState mphi; | 37 | #define GICD_CTLR_E1NWF (1U << 7) |
42 | UnimplementedDeviceState txp; | 38 | #define GICD_CTLR_RWP (1U << 31) |
43 | UnimplementedDeviceState armtmr; | 39 | |
44 | - UnimplementedDeviceState powermgt; | 40 | +/* 16 bits EventId */ |
45 | + BCM2835PowerMgtState powermgt; | 41 | +#define GICD_TYPER_IDBITS 0xf |
46 | BCM2835CprmanState cprman; | 42 | + |
47 | PL011State uart0; | 43 | /* |
48 | BCM2835AuxState aux; | 44 | * Redistributor frame offsets from RD_base |
49 | diff --git a/include/hw/misc/bcm2835_powermgt.h b/include/hw/misc/bcm2835_powermgt.h | 45 | */ |
46 | @@ -XXX,XX +XXX,XX @@ | ||
47 | #define GICR_WAKER_ProcessorSleep (1U << 1) | ||
48 | #define GICR_WAKER_ChildrenAsleep (1U << 2) | ||
49 | |||
50 | -#define GICR_PROPBASER_OUTER_CACHEABILITY_MASK (7ULL << 56) | ||
51 | -#define GICR_PROPBASER_ADDR_MASK (0xfffffffffULL << 12) | ||
52 | -#define GICR_PROPBASER_SHAREABILITY_MASK (3U << 10) | ||
53 | -#define GICR_PROPBASER_CACHEABILITY_MASK (7U << 7) | ||
54 | -#define GICR_PROPBASER_IDBITS_MASK (0x1f) | ||
55 | +FIELD(GICR_PROPBASER, IDBITS, 0, 5) | ||
56 | +FIELD(GICR_PROPBASER, INNERCACHE, 7, 3) | ||
57 | +FIELD(GICR_PROPBASER, SHAREABILITY, 10, 2) | ||
58 | +FIELD(GICR_PROPBASER, PHYADDR, 12, 40) | ||
59 | +FIELD(GICR_PROPBASER, OUTERCACHE, 56, 3) | ||
60 | |||
61 | -#define GICR_PENDBASER_PTZ (1ULL << 62) | ||
62 | -#define GICR_PENDBASER_OUTER_CACHEABILITY_MASK (7ULL << 56) | ||
63 | -#define GICR_PENDBASER_ADDR_MASK (0xffffffffULL << 16) | ||
64 | -#define GICR_PENDBASER_SHAREABILITY_MASK (3U << 10) | ||
65 | -#define GICR_PENDBASER_CACHEABILITY_MASK (7U << 7) | ||
66 | +FIELD(GICR_PENDBASER, INNERCACHE, 7, 3) | ||
67 | +FIELD(GICR_PENDBASER, SHAREABILITY, 10, 2) | ||
68 | +FIELD(GICR_PENDBASER, PHYADDR, 16, 36) | ||
69 | +FIELD(GICR_PENDBASER, OUTERCACHE, 56, 3) | ||
70 | +FIELD(GICR_PENDBASER, PTZ, 62, 1) | ||
71 | |||
72 | #define ICC_CTLR_EL1_CBPR (1U << 0) | ||
73 | #define ICC_CTLR_EL1_EOIMODE (1U << 1) | ||
74 | @@ -XXX,XX +XXX,XX @@ | ||
75 | #define ICH_VTR_EL2_PREBITS_SHIFT 26 | ||
76 | #define ICH_VTR_EL2_PRIBITS_SHIFT 29 | ||
77 | |||
78 | +/* ITS Registers */ | ||
79 | + | ||
80 | +FIELD(GITS_BASER, SIZE, 0, 8) | ||
81 | +FIELD(GITS_BASER, PAGESIZE, 8, 2) | ||
82 | +FIELD(GITS_BASER, SHAREABILITY, 10, 2) | ||
83 | +FIELD(GITS_BASER, PHYADDR, 12, 36) | ||
84 | +FIELD(GITS_BASER, PHYADDRL_64K, 16, 32) | ||
85 | +FIELD(GITS_BASER, PHYADDRH_64K, 12, 4) | ||
86 | +FIELD(GITS_BASER, ENTRYSIZE, 48, 5) | ||
87 | +FIELD(GITS_BASER, OUTERCACHE, 53, 3) | ||
88 | +FIELD(GITS_BASER, TYPE, 56, 3) | ||
89 | +FIELD(GITS_BASER, INNERCACHE, 59, 3) | ||
90 | +FIELD(GITS_BASER, INDIRECT, 62, 1) | ||
91 | +FIELD(GITS_BASER, VALID, 63, 1) | ||
92 | + | ||
93 | +FIELD(GITS_CTLR, QUIESCENT, 31, 1) | ||
94 | + | ||
95 | +FIELD(GITS_TYPER, PHYSICAL, 0, 1) | ||
96 | +FIELD(GITS_TYPER, ITT_ENTRY_SIZE, 4, 4) | ||
97 | +FIELD(GITS_TYPER, IDBITS, 8, 5) | ||
98 | +FIELD(GITS_TYPER, DEVBITS, 13, 5) | ||
99 | +FIELD(GITS_TYPER, SEIS, 18, 1) | ||
100 | +FIELD(GITS_TYPER, PTA, 19, 1) | ||
101 | +FIELD(GITS_TYPER, CIDBITS, 32, 4) | ||
102 | +FIELD(GITS_TYPER, CIL, 36, 1) | ||
103 | + | ||
104 | +#define GITS_BASER_PAGESIZE_4K 0 | ||
105 | +#define GITS_BASER_PAGESIZE_16K 1 | ||
106 | +#define GITS_BASER_PAGESIZE_64K 2 | ||
107 | + | ||
108 | +#define GITS_BASER_TYPE_DEVICE 1ULL | ||
109 | +#define GITS_BASER_TYPE_COLLECTION 4ULL | ||
110 | + | ||
111 | +/** | ||
112 | + * Default features advertised by this version of ITS | ||
113 | + */ | ||
114 | +/* Physical LPIs supported */ | ||
115 | +#define GITS_TYPE_PHYSICAL (1U << 0) | ||
116 | + | ||
117 | +/* | ||
118 | + * 12 bytes Interrupt translation Table Entry size | ||
119 | + * as per Table 5.3 in GICv3 spec | ||
120 | + * ITE Lower 8 Bytes | ||
121 | + * Bits: | 49 ... 26 | 25 ... 2 | 1 | 0 | | ||
122 | + * Values: | 1023 | IntNum | IntType | Valid | | ||
123 | + * ITE Higher 4 Bytes | ||
124 | + * Bits: | 31 ... 16 | 15 ...0 | | ||
125 | + * Values: | vPEID | ICID | | ||
126 | + */ | ||
127 | +#define ITS_ITT_ENTRY_SIZE 0xC | ||
128 | + | ||
129 | +/* 16 bits EventId */ | ||
130 | +#define ITS_IDBITS GICD_TYPER_IDBITS | ||
131 | + | ||
132 | +/* 16 bits DeviceId */ | ||
133 | +#define ITS_DEVBITS 0xF | ||
134 | + | ||
135 | +/* 16 bits CollectionId */ | ||
136 | +#define ITS_CIDBITS 0xF | ||
137 | + | ||
138 | +/* | ||
139 | + * 8 bytes Device Table Entry size | ||
140 | + * Valid = 1 bit,ITTAddr = 44 bits,Size = 5 bits | ||
141 | + */ | ||
142 | +#define GITS_DTE_SIZE (0x8ULL) | ||
143 | + | ||
144 | +/* | ||
145 | + * 8 bytes Collection Table Entry size | ||
146 | + * Valid = 1 bit,RDBase = 36 bits(considering max RDBASE) | ||
147 | + */ | ||
148 | +#define GITS_CTE_SIZE (0x8ULL) | ||
149 | + | ||
150 | /* Special interrupt IDs */ | ||
151 | #define INTID_SECURE 1020 | ||
152 | #define INTID_NONSECURE 1021 | ||
153 | diff --git a/include/hw/intc/arm_gicv3_its_common.h b/include/hw/intc/arm_gicv3_its_common.h | ||
154 | index XXXXXXX..XXXXXXX 100644 | ||
155 | --- a/include/hw/intc/arm_gicv3_its_common.h | ||
156 | +++ b/include/hw/intc/arm_gicv3_its_common.h | ||
157 | @@ -XXX,XX +XXX,XX @@ | ||
158 | #include "hw/intc/arm_gicv3_common.h" | ||
159 | #include "qom/object.h" | ||
160 | |||
161 | +#define TYPE_ARM_GICV3_ITS "arm-gicv3-its" | ||
162 | + | ||
163 | #define ITS_CONTROL_SIZE 0x10000 | ||
164 | #define ITS_TRANS_SIZE 0x10000 | ||
165 | #define ITS_SIZE (ITS_CONTROL_SIZE + ITS_TRANS_SIZE) | ||
166 | |||
167 | #define GITS_CTLR 0x0 | ||
168 | #define GITS_IIDR 0x4 | ||
169 | +#define GITS_TYPER 0x8 | ||
170 | #define GITS_CBASER 0x80 | ||
171 | #define GITS_CWRITER 0x88 | ||
172 | #define GITS_CREADR 0x90 | ||
173 | #define GITS_BASER 0x100 | ||
174 | |||
175 | +#define GITS_TRANSLATER 0x0040 | ||
176 | + | ||
177 | struct GICv3ITSState { | ||
178 | SysBusDevice parent_obj; | ||
179 | |||
180 | @@ -XXX,XX +XXX,XX @@ struct GICv3ITSState { | ||
181 | /* Registers */ | ||
182 | uint32_t ctlr; | ||
183 | uint32_t iidr; | ||
184 | + uint64_t typer; | ||
185 | uint64_t cbaser; | ||
186 | uint64_t cwriter; | ||
187 | uint64_t creadr; | ||
188 | @@ -XXX,XX +XXX,XX @@ struct GICv3ITSState { | ||
189 | |||
190 | typedef struct GICv3ITSState GICv3ITSState; | ||
191 | |||
192 | -void gicv3_its_init_mmio(GICv3ITSState *s, const MemoryRegionOps *ops); | ||
193 | +void gicv3_its_init_mmio(GICv3ITSState *s, const MemoryRegionOps *ops, | ||
194 | + const MemoryRegionOps *tops); | ||
195 | |||
196 | #define TYPE_ARM_GICV3_ITS_COMMON "arm-gicv3-its-common" | ||
197 | typedef struct GICv3ITSCommonClass GICv3ITSCommonClass; | ||
198 | diff --git a/hw/intc/arm_gicv3_its.c b/hw/intc/arm_gicv3_its.c | ||
50 | new file mode 100644 | 199 | new file mode 100644 |
51 | index XXXXXXX..XXXXXXX | 200 | index XXXXXXX..XXXXXXX |
52 | --- /dev/null | 201 | --- /dev/null |
53 | +++ b/include/hw/misc/bcm2835_powermgt.h | 202 | +++ b/hw/intc/arm_gicv3_its.c |
54 | @@ -XXX,XX +XXX,XX @@ | 203 | @@ -XXX,XX +XXX,XX @@ |
55 | +/* | 204 | +/* |
56 | + * BCM2835 Power Management emulation | 205 | + * ITS emulation for a GICv3-based system |
57 | + * | 206 | + * |
58 | + * Copyright (C) 2017 Marcin Chojnacki <marcinch7@gmail.com> | 207 | + * Copyright Linaro.org 2021 |
59 | + * Copyright (C) 2021 Nolan Leake <nolan@sigbus.net> | ||
60 | + * | 208 | + * |
61 | + * This work is licensed under the terms of the GNU GPL, version 2 or later. | 209 | + * Authors: |
62 | + * See the COPYING file in the top-level directory. | 210 | + * Shashi Mallela <shashi.mallela@linaro.org> |
63 | + */ | ||
64 | + | ||
65 | +#ifndef BCM2835_POWERMGT_H | ||
66 | +#define BCM2835_POWERMGT_H | ||
67 | + | ||
68 | +#include "hw/sysbus.h" | ||
69 | +#include "qom/object.h" | ||
70 | + | ||
71 | +#define TYPE_BCM2835_POWERMGT "bcm2835-powermgt" | ||
72 | +OBJECT_DECLARE_SIMPLE_TYPE(BCM2835PowerMgtState, BCM2835_POWERMGT) | ||
73 | + | ||
74 | +struct BCM2835PowerMgtState { | ||
75 | + SysBusDevice busdev; | ||
76 | + MemoryRegion iomem; | ||
77 | + | ||
78 | + uint32_t rstc; | ||
79 | + uint32_t rsts; | ||
80 | + uint32_t wdog; | ||
81 | +}; | ||
82 | + | ||
83 | +#endif | ||
84 | diff --git a/hw/arm/bcm2835_peripherals.c b/hw/arm/bcm2835_peripherals.c | ||
85 | index XXXXXXX..XXXXXXX 100644 | ||
86 | --- a/hw/arm/bcm2835_peripherals.c | ||
87 | +++ b/hw/arm/bcm2835_peripherals.c | ||
88 | @@ -XXX,XX +XXX,XX @@ static void bcm2835_peripherals_init(Object *obj) | ||
89 | |||
90 | object_property_add_const_link(OBJECT(&s->dwc2), "dma-mr", | ||
91 | OBJECT(&s->gpu_bus_mr)); | ||
92 | + | ||
93 | + /* Power Management */ | ||
94 | + object_initialize_child(obj, "powermgt", &s->powermgt, | ||
95 | + TYPE_BCM2835_POWERMGT); | ||
96 | } | ||
97 | |||
98 | static void bcm2835_peripherals_realize(DeviceState *dev, Error **errp) | ||
99 | @@ -XXX,XX +XXX,XX @@ static void bcm2835_peripherals_realize(DeviceState *dev, Error **errp) | ||
100 | qdev_get_gpio_in_named(DEVICE(&s->ic), BCM2835_IC_GPU_IRQ, | ||
101 | INTERRUPT_USB)); | ||
102 | |||
103 | + /* Power Management */ | ||
104 | + if (!sysbus_realize(SYS_BUS_DEVICE(&s->powermgt), errp)) { | ||
105 | + return; | ||
106 | + } | ||
107 | + | ||
108 | + memory_region_add_subregion(&s->peri_mr, PM_OFFSET, | ||
109 | + sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->powermgt), 0)); | ||
110 | + | ||
111 | create_unimp(s, &s->txp, "bcm2835-txp", TXP_OFFSET, 0x1000); | ||
112 | create_unimp(s, &s->armtmr, "bcm2835-sp804", ARMCTRL_TIMER0_1_OFFSET, 0x40); | ||
113 | - create_unimp(s, &s->powermgt, "bcm2835-powermgt", PM_OFFSET, 0x114); | ||
114 | create_unimp(s, &s->i2s, "bcm2835-i2s", I2S_OFFSET, 0x100); | ||
115 | create_unimp(s, &s->smi, "bcm2835-smi", SMI_OFFSET, 0x100); | ||
116 | create_unimp(s, &s->spi[0], "bcm2835-spi0", SPI0_OFFSET, 0x20); | ||
117 | diff --git a/hw/misc/bcm2835_powermgt.c b/hw/misc/bcm2835_powermgt.c | ||
118 | new file mode 100644 | ||
119 | index XXXXXXX..XXXXXXX | ||
120 | --- /dev/null | ||
121 | +++ b/hw/misc/bcm2835_powermgt.c | ||
122 | @@ -XXX,XX +XXX,XX @@ | ||
123 | +/* | ||
124 | + * BCM2835 Power Management emulation | ||
125 | + * | 211 | + * |
126 | + * Copyright (C) 2017 Marcin Chojnacki <marcinch7@gmail.com> | 212 | + * This work is licensed under the terms of the GNU GPL, version 2 or (at your |
127 | + * Copyright (C) 2021 Nolan Leake <nolan@sigbus.net> | 213 | + * option) any later version. See the COPYING file in the top-level directory. |
128 | + * | 214 | + * |
129 | + * This work is licensed under the terms of the GNU GPL, version 2 or later. | ||
130 | + * See the COPYING file in the top-level directory. | ||
131 | + */ | 215 | + */ |
132 | + | 216 | + |
133 | +#include "qemu/osdep.h" | 217 | +#include "qemu/osdep.h" |
134 | +#include "qemu/log.h" | 218 | +#include "qemu/log.h" |
135 | +#include "qemu/module.h" | 219 | +#include "hw/qdev-properties.h" |
136 | +#include "hw/misc/bcm2835_powermgt.h" | 220 | +#include "hw/intc/arm_gicv3_its_common.h" |
137 | +#include "migration/vmstate.h" | 221 | +#include "gicv3_internal.h" |
138 | +#include "sysemu/runstate.h" | 222 | +#include "qom/object.h" |
139 | + | 223 | +#include "qapi/error.h" |
140 | +#define PASSWORD 0x5a000000 | 224 | + |
141 | +#define PASSWORD_MASK 0xff000000 | 225 | +typedef struct GICv3ITSClass GICv3ITSClass; |
142 | + | 226 | +/* This is reusing the GICv3ITSState typedef from ARM_GICV3_ITS_COMMON */ |
143 | +#define R_RSTC 0x1c | 227 | +DECLARE_OBJ_CHECKERS(GICv3ITSState, GICv3ITSClass, |
144 | +#define V_RSTC_RESET 0x20 | 228 | + ARM_GICV3_ITS, TYPE_ARM_GICV3_ITS) |
145 | +#define R_RSTS 0x20 | 229 | + |
146 | +#define V_RSTS_POWEROFF 0x555 /* Linux uses partition 63 to indicate halt. */ | 230 | +struct GICv3ITSClass { |
147 | +#define R_WDOG 0x24 | 231 | + GICv3ITSCommonClass parent_class; |
148 | + | 232 | + void (*parent_reset)(DeviceState *dev); |
149 | +static uint64_t bcm2835_powermgt_read(void *opaque, hwaddr offset, | 233 | +}; |
150 | + unsigned size) | 234 | + |
151 | +{ | 235 | +static MemTxResult gicv3_its_translation_write(void *opaque, hwaddr offset, |
152 | + BCM2835PowerMgtState *s = (BCM2835PowerMgtState *)opaque; | 236 | + uint64_t data, unsigned size, |
153 | + uint32_t res = 0; | 237 | + MemTxAttrs attrs) |
154 | + | 238 | +{ |
155 | + switch (offset) { | 239 | + return MEMTX_OK; |
156 | + case R_RSTC: | 240 | +} |
157 | + res = s->rstc; | 241 | + |
242 | +static bool its_writel(GICv3ITSState *s, hwaddr offset, | ||
243 | + uint64_t value, MemTxAttrs attrs) | ||
244 | +{ | ||
245 | + bool result = true; | ||
246 | + | ||
247 | + return result; | ||
248 | +} | ||
249 | + | ||
250 | +static bool its_readl(GICv3ITSState *s, hwaddr offset, | ||
251 | + uint64_t *data, MemTxAttrs attrs) | ||
252 | +{ | ||
253 | + bool result = true; | ||
254 | + | ||
255 | + return result; | ||
256 | +} | ||
257 | + | ||
258 | +static bool its_writell(GICv3ITSState *s, hwaddr offset, | ||
259 | + uint64_t value, MemTxAttrs attrs) | ||
260 | +{ | ||
261 | + bool result = true; | ||
262 | + | ||
263 | + return result; | ||
264 | +} | ||
265 | + | ||
266 | +static bool its_readll(GICv3ITSState *s, hwaddr offset, | ||
267 | + uint64_t *data, MemTxAttrs attrs) | ||
268 | +{ | ||
269 | + bool result = true; | ||
270 | + | ||
271 | + return result; | ||
272 | +} | ||
273 | + | ||
274 | +static MemTxResult gicv3_its_read(void *opaque, hwaddr offset, uint64_t *data, | ||
275 | + unsigned size, MemTxAttrs attrs) | ||
276 | +{ | ||
277 | + GICv3ITSState *s = (GICv3ITSState *)opaque; | ||
278 | + bool result; | ||
279 | + | ||
280 | + switch (size) { | ||
281 | + case 4: | ||
282 | + result = its_readl(s, offset, data, attrs); | ||
158 | + break; | 283 | + break; |
159 | + case R_RSTS: | 284 | + case 8: |
160 | + res = s->rsts; | 285 | + result = its_readll(s, offset, data, attrs); |
161 | + break; | 286 | + break; |
162 | + case R_WDOG: | ||
163 | + res = s->wdog; | ||
164 | + break; | ||
165 | + | ||
166 | + default: | 287 | + default: |
167 | + qemu_log_mask(LOG_UNIMP, | 288 | + result = false; |
168 | + "bcm2835_powermgt_read: Unknown offset 0x%08"HWADDR_PRIx | ||
169 | + "\n", offset); | ||
170 | + res = 0; | ||
171 | + break; | 289 | + break; |
172 | + } | 290 | + } |
173 | + | 291 | + |
174 | + return res; | 292 | + if (!result) { |
175 | +} | ||
176 | + | ||
177 | +static void bcm2835_powermgt_write(void *opaque, hwaddr offset, | ||
178 | + uint64_t value, unsigned size) | ||
179 | +{ | ||
180 | + BCM2835PowerMgtState *s = (BCM2835PowerMgtState *)opaque; | ||
181 | + | ||
182 | + if ((value & PASSWORD_MASK) != PASSWORD) { | ||
183 | + qemu_log_mask(LOG_GUEST_ERROR, | 293 | + qemu_log_mask(LOG_GUEST_ERROR, |
184 | + "bcm2835_powermgt_write: Bad password 0x%"PRIx64 | 294 | + "%s: invalid guest read at offset " TARGET_FMT_plx |
185 | + " at offset 0x%08"HWADDR_PRIx"\n", | 295 | + "size %u\n", __func__, offset, size); |
186 | + value, offset); | 296 | + /* |
187 | + return; | 297 | + * The spec requires that reserved registers are RAZ/WI; |
298 | + * so use false returns from leaf functions as a way to | ||
299 | + * trigger the guest-error logging but don't return it to | ||
300 | + * the caller, or we'll cause a spurious guest data abort. | ||
301 | + */ | ||
302 | + *data = 0; | ||
188 | + } | 303 | + } |
189 | + | 304 | + return MEMTX_OK; |
190 | + value = value & ~PASSWORD_MASK; | 305 | +} |
191 | + | 306 | + |
192 | + switch (offset) { | 307 | +static MemTxResult gicv3_its_write(void *opaque, hwaddr offset, uint64_t data, |
193 | + case R_RSTC: | 308 | + unsigned size, MemTxAttrs attrs) |
194 | + s->rstc = value; | 309 | +{ |
195 | + if (value & V_RSTC_RESET) { | 310 | + GICv3ITSState *s = (GICv3ITSState *)opaque; |
196 | + if ((s->rsts & 0xfff) == V_RSTS_POWEROFF) { | 311 | + bool result; |
197 | + qemu_system_shutdown_request(SHUTDOWN_CAUSE_GUEST_SHUTDOWN); | 312 | + |
198 | + } else { | 313 | + switch (size) { |
199 | + qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_RESET); | 314 | + case 4: |
200 | + } | 315 | + result = its_writel(s, offset, data, attrs); |
201 | + } | ||
202 | + break; | 316 | + break; |
203 | + case R_RSTS: | 317 | + case 8: |
204 | + qemu_log_mask(LOG_UNIMP, | 318 | + result = its_writell(s, offset, data, attrs); |
205 | + "bcm2835_powermgt_write: RSTS\n"); | ||
206 | + s->rsts = value; | ||
207 | + break; | 319 | + break; |
208 | + case R_WDOG: | ||
209 | + qemu_log_mask(LOG_UNIMP, | ||
210 | + "bcm2835_powermgt_write: WDOG\n"); | ||
211 | + s->wdog = value; | ||
212 | + break; | ||
213 | + | ||
214 | + default: | 320 | + default: |
215 | + qemu_log_mask(LOG_UNIMP, | 321 | + result = false; |
216 | + "bcm2835_powermgt_write: Unknown offset 0x%08"HWADDR_PRIx | ||
217 | + "\n", offset); | ||
218 | + break; | 322 | + break; |
219 | + } | 323 | + } |
220 | +} | 324 | + |
221 | + | 325 | + if (!result) { |
222 | +static const MemoryRegionOps bcm2835_powermgt_ops = { | 326 | + qemu_log_mask(LOG_GUEST_ERROR, |
223 | + .read = bcm2835_powermgt_read, | 327 | + "%s: invalid guest write at offset " TARGET_FMT_plx |
224 | + .write = bcm2835_powermgt_write, | 328 | + "size %u\n", __func__, offset, size); |
329 | + /* | ||
330 | + * The spec requires that reserved registers are RAZ/WI; | ||
331 | + * so use false returns from leaf functions as a way to | ||
332 | + * trigger the guest-error logging but don't return it to | ||
333 | + * the caller, or we'll cause a spurious guest data abort. | ||
334 | + */ | ||
335 | + } | ||
336 | + return MEMTX_OK; | ||
337 | +} | ||
338 | + | ||
339 | +static const MemoryRegionOps gicv3_its_control_ops = { | ||
340 | + .read_with_attrs = gicv3_its_read, | ||
341 | + .write_with_attrs = gicv3_its_write, | ||
342 | + .valid.min_access_size = 4, | ||
343 | + .valid.max_access_size = 8, | ||
344 | + .impl.min_access_size = 4, | ||
345 | + .impl.max_access_size = 8, | ||
225 | + .endianness = DEVICE_NATIVE_ENDIAN, | 346 | + .endianness = DEVICE_NATIVE_ENDIAN, |
226 | + .impl.min_access_size = 4, | 347 | +}; |
348 | + | ||
349 | +static const MemoryRegionOps gicv3_its_translation_ops = { | ||
350 | + .write_with_attrs = gicv3_its_translation_write, | ||
351 | + .valid.min_access_size = 2, | ||
352 | + .valid.max_access_size = 4, | ||
353 | + .impl.min_access_size = 2, | ||
227 | + .impl.max_access_size = 4, | 354 | + .impl.max_access_size = 4, |
355 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
228 | +}; | 356 | +}; |
229 | + | 357 | + |
230 | +static const VMStateDescription vmstate_bcm2835_powermgt = { | 358 | +static void gicv3_arm_its_realize(DeviceState *dev, Error **errp) |
231 | + .name = TYPE_BCM2835_POWERMGT, | 359 | +{ |
360 | + GICv3ITSState *s = ARM_GICV3_ITS_COMMON(dev); | ||
361 | + int i; | ||
362 | + | ||
363 | + for (i = 0; i < s->gicv3->num_cpu; i++) { | ||
364 | + if (!(s->gicv3->cpu[i].gicr_typer & GICR_TYPER_PLPIS)) { | ||
365 | + error_setg(errp, "Physical LPI not supported by CPU %d", i); | ||
366 | + return; | ||
367 | + } | ||
368 | + } | ||
369 | + | ||
370 | + gicv3_its_init_mmio(s, &gicv3_its_control_ops, &gicv3_its_translation_ops); | ||
371 | + | ||
372 | + /* set the ITS default features supported */ | ||
373 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, PHYSICAL, | ||
374 | + GITS_TYPE_PHYSICAL); | ||
375 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, ITT_ENTRY_SIZE, | ||
376 | + ITS_ITT_ENTRY_SIZE - 1); | ||
377 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, IDBITS, ITS_IDBITS); | ||
378 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, DEVBITS, ITS_DEVBITS); | ||
379 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, CIL, 1); | ||
380 | + s->typer = FIELD_DP64(s->typer, GITS_TYPER, CIDBITS, ITS_CIDBITS); | ||
381 | +} | ||
382 | + | ||
383 | +static void gicv3_its_reset(DeviceState *dev) | ||
384 | +{ | ||
385 | + GICv3ITSState *s = ARM_GICV3_ITS_COMMON(dev); | ||
386 | + GICv3ITSClass *c = ARM_GICV3_ITS_GET_CLASS(s); | ||
387 | + | ||
388 | + c->parent_reset(dev); | ||
389 | + | ||
390 | + /* Quiescent bit reset to 1 */ | ||
391 | + s->ctlr = FIELD_DP32(s->ctlr, GITS_CTLR, QUIESCENT, 1); | ||
392 | + | ||
393 | + /* | ||
394 | + * setting GITS_BASER0.Type = 0b001 (Device) | ||
395 | + * GITS_BASER1.Type = 0b100 (Collection Table) | ||
396 | + * GITS_BASER<n>.Type,where n = 3 to 7 are 0b00 (Unimplemented) | ||
397 | + * GITS_BASER<0,1>.Page_Size = 64KB | ||
398 | + * and default translation table entry size to 16 bytes | ||
399 | + */ | ||
400 | + s->baser[0] = FIELD_DP64(s->baser[0], GITS_BASER, TYPE, | ||
401 | + GITS_BASER_TYPE_DEVICE); | ||
402 | + s->baser[0] = FIELD_DP64(s->baser[0], GITS_BASER, PAGESIZE, | ||
403 | + GITS_BASER_PAGESIZE_64K); | ||
404 | + s->baser[0] = FIELD_DP64(s->baser[0], GITS_BASER, ENTRYSIZE, | ||
405 | + GITS_DTE_SIZE - 1); | ||
406 | + | ||
407 | + s->baser[1] = FIELD_DP64(s->baser[1], GITS_BASER, TYPE, | ||
408 | + GITS_BASER_TYPE_COLLECTION); | ||
409 | + s->baser[1] = FIELD_DP64(s->baser[1], GITS_BASER, PAGESIZE, | ||
410 | + GITS_BASER_PAGESIZE_64K); | ||
411 | + s->baser[1] = FIELD_DP64(s->baser[1], GITS_BASER, ENTRYSIZE, | ||
412 | + GITS_CTE_SIZE - 1); | ||
413 | +} | ||
414 | + | ||
415 | +static Property gicv3_its_props[] = { | ||
416 | + DEFINE_PROP_LINK("parent-gicv3", GICv3ITSState, gicv3, "arm-gicv3", | ||
417 | + GICv3State *), | ||
418 | + DEFINE_PROP_END_OF_LIST(), | ||
419 | +}; | ||
420 | + | ||
421 | +static void gicv3_its_class_init(ObjectClass *klass, void *data) | ||
422 | +{ | ||
423 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
424 | + GICv3ITSClass *ic = ARM_GICV3_ITS_CLASS(klass); | ||
425 | + | ||
426 | + dc->realize = gicv3_arm_its_realize; | ||
427 | + device_class_set_props(dc, gicv3_its_props); | ||
428 | + device_class_set_parent_reset(dc, gicv3_its_reset, &ic->parent_reset); | ||
429 | +} | ||
430 | + | ||
431 | +static const TypeInfo gicv3_its_info = { | ||
432 | + .name = TYPE_ARM_GICV3_ITS, | ||
433 | + .parent = TYPE_ARM_GICV3_ITS_COMMON, | ||
434 | + .instance_size = sizeof(GICv3ITSState), | ||
435 | + .class_init = gicv3_its_class_init, | ||
436 | + .class_size = sizeof(GICv3ITSClass), | ||
437 | +}; | ||
438 | + | ||
439 | +static void gicv3_its_register_types(void) | ||
440 | +{ | ||
441 | + type_register_static(&gicv3_its_info); | ||
442 | +} | ||
443 | + | ||
444 | +type_init(gicv3_its_register_types) | ||
445 | diff --git a/hw/intc/arm_gicv3_its_common.c b/hw/intc/arm_gicv3_its_common.c | ||
446 | index XXXXXXX..XXXXXXX 100644 | ||
447 | --- a/hw/intc/arm_gicv3_its_common.c | ||
448 | +++ b/hw/intc/arm_gicv3_its_common.c | ||
449 | @@ -XXX,XX +XXX,XX @@ static int gicv3_its_post_load(void *opaque, int version_id) | ||
450 | |||
451 | static const VMStateDescription vmstate_its = { | ||
452 | .name = "arm_gicv3_its", | ||
232 | + .version_id = 1, | 453 | + .version_id = 1, |
233 | + .minimum_version_id = 1, | 454 | + .minimum_version_id = 1, |
234 | + .fields = (VMStateField[]) { | 455 | .pre_save = gicv3_its_pre_save, |
235 | + VMSTATE_UINT32(rstc, BCM2835PowerMgtState), | 456 | .post_load = gicv3_its_post_load, |
236 | + VMSTATE_UINT32(rsts, BCM2835PowerMgtState), | 457 | .priority = MIG_PRI_GICV3_ITS, |
237 | + VMSTATE_UINT32(wdog, BCM2835PowerMgtState), | 458 | @@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps gicv3_its_trans_ops = { |
238 | + VMSTATE_END_OF_LIST() | 459 | .endianness = DEVICE_NATIVE_ENDIAN, |
239 | + } | 460 | }; |
240 | +}; | 461 | |
241 | + | 462 | -void gicv3_its_init_mmio(GICv3ITSState *s, const MemoryRegionOps *ops) |
242 | +static void bcm2835_powermgt_init(Object *obj) | 463 | +void gicv3_its_init_mmio(GICv3ITSState *s, const MemoryRegionOps *ops, |
243 | +{ | 464 | + const MemoryRegionOps *tops) |
244 | + BCM2835PowerMgtState *s = BCM2835_POWERMGT(obj); | 465 | { |
245 | + | 466 | SysBusDevice *sbd = SYS_BUS_DEVICE(s); |
246 | + memory_region_init_io(&s->iomem, obj, &bcm2835_powermgt_ops, s, | 467 | |
247 | + TYPE_BCM2835_POWERMGT, 0x200); | 468 | memory_region_init_io(&s->iomem_its_cntrl, OBJECT(s), ops, s, |
248 | + sysbus_init_mmio(SYS_BUS_DEVICE(s), &s->iomem); | 469 | "control", ITS_CONTROL_SIZE); |
249 | +} | 470 | memory_region_init_io(&s->iomem_its_translation, OBJECT(s), |
250 | + | 471 | - &gicv3_its_trans_ops, s, |
251 | +static void bcm2835_powermgt_reset(DeviceState *dev) | 472 | + tops ? tops : &gicv3_its_trans_ops, s, |
252 | +{ | 473 | "translation", ITS_TRANS_SIZE); |
253 | + BCM2835PowerMgtState *s = BCM2835_POWERMGT(dev); | 474 | |
254 | + | 475 | /* Our two regions are always adjacent, therefore we now combine them |
255 | + /* https://elinux.org/BCM2835_registers#PM */ | 476 | diff --git a/hw/intc/arm_gicv3_its_kvm.c b/hw/intc/arm_gicv3_its_kvm.c |
256 | + s->rstc = 0x00000102; | ||
257 | + s->rsts = 0x00001000; | ||
258 | + s->wdog = 0x00000000; | ||
259 | +} | ||
260 | + | ||
261 | +static void bcm2835_powermgt_class_init(ObjectClass *klass, void *data) | ||
262 | +{ | ||
263 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
264 | + | ||
265 | + dc->reset = bcm2835_powermgt_reset; | ||
266 | + dc->vmsd = &vmstate_bcm2835_powermgt; | ||
267 | +} | ||
268 | + | ||
269 | +static TypeInfo bcm2835_powermgt_info = { | ||
270 | + .name = TYPE_BCM2835_POWERMGT, | ||
271 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
272 | + .instance_size = sizeof(BCM2835PowerMgtState), | ||
273 | + .class_init = bcm2835_powermgt_class_init, | ||
274 | + .instance_init = bcm2835_powermgt_init, | ||
275 | +}; | ||
276 | + | ||
277 | +static void bcm2835_powermgt_register_types(void) | ||
278 | +{ | ||
279 | + type_register_static(&bcm2835_powermgt_info); | ||
280 | +} | ||
281 | + | ||
282 | +type_init(bcm2835_powermgt_register_types) | ||
283 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build | ||
284 | index XXXXXXX..XXXXXXX 100644 | 477 | index XXXXXXX..XXXXXXX 100644 |
285 | --- a/hw/misc/meson.build | 478 | --- a/hw/intc/arm_gicv3_its_kvm.c |
286 | +++ b/hw/misc/meson.build | 479 | +++ b/hw/intc/arm_gicv3_its_kvm.c |
287 | @@ -XXX,XX +XXX,XX @@ softmmu_ss.add(when: 'CONFIG_RASPI', if_true: files( | 480 | @@ -XXX,XX +XXX,XX @@ static void kvm_arm_its_realize(DeviceState *dev, Error **errp) |
288 | 'bcm2835_rng.c', | 481 | kvm_arm_register_device(&s->iomem_its_cntrl, -1, KVM_DEV_ARM_VGIC_GRP_ADDR, |
289 | 'bcm2835_thermal.c', | 482 | KVM_VGIC_ITS_ADDR_TYPE, s->dev_fd, 0); |
290 | 'bcm2835_cprman.c', | 483 | |
291 | + 'bcm2835_powermgt.c', | 484 | - gicv3_its_init_mmio(s, NULL); |
485 | + gicv3_its_init_mmio(s, NULL, NULL); | ||
486 | |||
487 | if (!kvm_device_check_attr(s->dev_fd, KVM_DEV_ARM_VGIC_GRP_ITS_REGS, | ||
488 | GITS_CTLR)) { | ||
489 | diff --git a/hw/intc/meson.build b/hw/intc/meson.build | ||
490 | index XXXXXXX..XXXXXXX 100644 | ||
491 | --- a/hw/intc/meson.build | ||
492 | +++ b/hw/intc/meson.build | ||
493 | @@ -XXX,XX +XXX,XX @@ softmmu_ss.add(when: 'CONFIG_ARM_GIC', if_true: files( | ||
494 | 'arm_gicv3_dist.c', | ||
495 | 'arm_gicv3_its_common.c', | ||
496 | 'arm_gicv3_redist.c', | ||
497 | + 'arm_gicv3_its.c', | ||
292 | )) | 498 | )) |
293 | softmmu_ss.add(when: 'CONFIG_SLAVIO', if_true: files('slavio_misc.c')) | 499 | softmmu_ss.add(when: 'CONFIG_ETRAXFS', if_true: files('etraxfs_pic.c')) |
294 | softmmu_ss.add(when: 'CONFIG_ZYNQ', if_true: files('zynq_slcr.c', 'zynq-xadc.c')) | 500 | softmmu_ss.add(when: 'CONFIG_HEATHROW_PIC', if_true: files('heathrow_pic.c')) |
295 | -- | 501 | -- |
296 | 2.20.1 | 502 | 2.20.1 |
297 | 503 | ||
298 | 504 | diff view generated by jsdifflib |
1 | Implement the MVE VHLL (vector shift left long) insn. This has two | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | encodings: the T1 encoding is the usual shift-by-immediate format, | ||
3 | and the T2 encoding is a special case where the shift count is always | ||
4 | equal to the element size. | ||
5 | 2 | ||
3 | Defined descriptors for ITS device table,collection table and ITS | ||
4 | command queue entities.Implemented register read/write functions, | ||
5 | extract ITS table parameters and command queue parameters,extended | ||
6 | gicv3 common to capture qemu address space(which host the ITS table | ||
7 | platform memories required for subsequent ITS processing) and | ||
8 | initialize the same in ITS device. | ||
9 | |||
10 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
11 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
12 | Reviewed-by: Eric Auger <eric.auger@redhat.com> | ||
13 | Tested-by: Neil Armstrong <narmstrong@baylibre.com> | ||
14 | Message-id: 20210910143951.92242-3-shashi.mallela@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 15 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20210628135835.6690-10-peter.maydell@linaro.org | ||
9 | --- | 16 | --- |
10 | target/arm/helper-mve.h | 9 +++++++ | 17 | hw/intc/gicv3_internal.h | 29 ++ |
11 | target/arm/mve.decode | 53 +++++++++++++++++++++++++++++++++++--- | 18 | include/hw/intc/arm_gicv3_common.h | 3 + |
12 | target/arm/mve_helper.c | 32 +++++++++++++++++++++++ | 19 | include/hw/intc/arm_gicv3_its_common.h | 23 ++ |
13 | target/arm/translate-mve.c | 15 +++++++++++ | 20 | hw/intc/arm_gicv3_its.c | 376 +++++++++++++++++++++++++ |
14 | 4 files changed, 105 insertions(+), 4 deletions(-) | 21 | 4 files changed, 431 insertions(+) |
15 | 22 | ||
16 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 23 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
17 | index XXXXXXX..XXXXXXX 100644 | 24 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-mve.h | 25 | --- a/hw/intc/gicv3_internal.h |
19 | +++ b/target/arm/helper-mve.h | 26 | +++ b/hw/intc/gicv3_internal.h |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vrshli_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 27 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_BASER, INNERCACHE, 59, 3) |
21 | DEF_HELPER_FLAGS_4(mve_vrshli_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 28 | FIELD(GITS_BASER, INDIRECT, 62, 1) |
22 | DEF_HELPER_FLAGS_4(mve_vrshli_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 29 | FIELD(GITS_BASER, VALID, 63, 1) |
23 | DEF_HELPER_FLAGS_4(mve_vrshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 30 | |
24 | + | 31 | +FIELD(GITS_CBASER, SIZE, 0, 8) |
25 | +DEF_HELPER_FLAGS_4(mve_vshllbsb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | +FIELD(GITS_CBASER, SHAREABILITY, 10, 2) |
26 | +DEF_HELPER_FLAGS_4(mve_vshllbsh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 33 | +FIELD(GITS_CBASER, PHYADDR, 12, 40) |
27 | +DEF_HELPER_FLAGS_4(mve_vshllbub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 34 | +FIELD(GITS_CBASER, OUTERCACHE, 53, 3) |
28 | +DEF_HELPER_FLAGS_4(mve_vshllbuh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 35 | +FIELD(GITS_CBASER, INNERCACHE, 59, 3) |
29 | +DEF_HELPER_FLAGS_4(mve_vshlltsb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 36 | +FIELD(GITS_CBASER, VALID, 63, 1) |
30 | +DEF_HELPER_FLAGS_4(mve_vshlltsh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 37 | + |
31 | +DEF_HELPER_FLAGS_4(mve_vshlltub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 38 | +FIELD(GITS_CREADR, STALLED, 0, 1) |
32 | +DEF_HELPER_FLAGS_4(mve_vshlltuh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 39 | +FIELD(GITS_CREADR, OFFSET, 5, 15) |
33 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | 40 | + |
41 | +FIELD(GITS_CWRITER, RETRY, 0, 1) | ||
42 | +FIELD(GITS_CWRITER, OFFSET, 5, 15) | ||
43 | + | ||
44 | +FIELD(GITS_CTLR, ENABLED, 0, 1) | ||
45 | FIELD(GITS_CTLR, QUIESCENT, 31, 1) | ||
46 | |||
47 | FIELD(GITS_TYPER, PHYSICAL, 0, 1) | ||
48 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_TYPER, PTA, 19, 1) | ||
49 | FIELD(GITS_TYPER, CIDBITS, 32, 4) | ||
50 | FIELD(GITS_TYPER, CIL, 36, 1) | ||
51 | |||
52 | +#define GITS_IDREGS 0xFFD0 | ||
53 | + | ||
54 | +#define ITS_CTLR_ENABLED (1U) /* ITS Enabled */ | ||
55 | + | ||
56 | +#define GITS_BASER_RO_MASK (R_GITS_BASER_ENTRYSIZE_MASK | \ | ||
57 | + R_GITS_BASER_TYPE_MASK) | ||
58 | + | ||
59 | #define GITS_BASER_PAGESIZE_4K 0 | ||
60 | #define GITS_BASER_PAGESIZE_16K 1 | ||
61 | #define GITS_BASER_PAGESIZE_64K 2 | ||
62 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_TYPER, CIL, 36, 1) | ||
63 | #define GITS_BASER_TYPE_DEVICE 1ULL | ||
64 | #define GITS_BASER_TYPE_COLLECTION 4ULL | ||
65 | |||
66 | +#define GITS_PAGE_SIZE_4K 0x1000 | ||
67 | +#define GITS_PAGE_SIZE_16K 0x4000 | ||
68 | +#define GITS_PAGE_SIZE_64K 0x10000 | ||
69 | + | ||
70 | +#define L1TABLE_ENTRY_SIZE 8 | ||
71 | + | ||
72 | +#define GITS_CMDQ_ENTRY_SIZE 32 | ||
73 | + | ||
74 | /** | ||
75 | * Default features advertised by this version of ITS | ||
76 | */ | ||
77 | diff --git a/include/hw/intc/arm_gicv3_common.h b/include/hw/intc/arm_gicv3_common.h | ||
34 | index XXXXXXX..XXXXXXX 100644 | 78 | index XXXXXXX..XXXXXXX 100644 |
35 | --- a/target/arm/mve.decode | 79 | --- a/include/hw/intc/arm_gicv3_common.h |
36 | +++ b/target/arm/mve.decode | 80 | +++ b/include/hw/intc/arm_gicv3_common.h |
81 | @@ -XXX,XX +XXX,XX @@ struct GICv3State { | ||
82 | int dev_fd; /* kvm device fd if backed by kvm vgic support */ | ||
83 | Error *migration_blocker; | ||
84 | |||
85 | + MemoryRegion *dma; | ||
86 | + AddressSpace dma_as; | ||
87 | + | ||
88 | /* Distributor */ | ||
89 | |||
90 | /* for a GIC with the security extensions the NS banked version of this | ||
91 | diff --git a/include/hw/intc/arm_gicv3_its_common.h b/include/hw/intc/arm_gicv3_its_common.h | ||
92 | index XXXXXXX..XXXXXXX 100644 | ||
93 | --- a/include/hw/intc/arm_gicv3_its_common.h | ||
94 | +++ b/include/hw/intc/arm_gicv3_its_common.h | ||
37 | @@ -XXX,XX +XXX,XX @@ | 95 | @@ -XXX,XX +XXX,XX @@ |
38 | @2_shl_h .... .... .. 01 shift:4 .... .... .... .... &2shift qd=%qd qm=%qm size=1 | 96 | |
39 | @2_shl_w .... .... .. 1 shift:5 .... .... .... .... &2shift qd=%qd qm=%qm size=2 | 97 | #define GITS_TRANSLATER 0x0040 |
40 | 98 | ||
41 | +@2_shll_b .... .... ... 01 shift:3 .... .... .... .... &2shift qd=%qd qm=%qm size=0 | 99 | +typedef struct { |
42 | +@2_shll_h .... .... ... 1 shift:4 .... .... .... .... &2shift qd=%qd qm=%qm size=1 | 100 | + bool valid; |
43 | +# VSHLL encoding T2 where shift == esize | 101 | + bool indirect; |
44 | +@2_shll_esize_b .... .... .... 00 .. .... .... .... .... &2shift \ | 102 | + uint16_t entry_sz; |
45 | + qd=%qd qm=%qm size=0 shift=8 | 103 | + uint32_t page_sz; |
46 | +@2_shll_esize_h .... .... .... 01 .. .... .... .... .... &2shift \ | 104 | + uint32_t max_entries; |
47 | + qd=%qd qm=%qm size=1 shift=16 | 105 | + union { |
48 | + | 106 | + uint32_t max_devids; |
49 | # Right shifts are encoded as N - shift, where N is the element size in bits. | 107 | + uint32_t max_collids; |
50 | %rshift_i5 16:5 !function=rsub_32 | 108 | + } maxids; |
51 | %rshift_i4 16:4 !function=rsub_16 | 109 | + uint64_t base_addr; |
52 | @@ -XXX,XX +XXX,XX @@ VADD 1110 1111 0 . .. ... 0 ... 0 1000 . 1 . 0 ... 0 @2op | 110 | +} TableDesc; |
53 | VSUB 1111 1111 0 . .. ... 0 ... 0 1000 . 1 . 0 ... 0 @2op | 111 | + |
54 | VMUL 1110 1111 0 . .. ... 0 ... 0 1001 . 1 . 1 ... 0 @2op | 112 | +typedef struct { |
55 | 113 | + bool valid; | |
56 | -VMULH_S 111 0 1110 0 . .. ...1 ... 0 1110 . 0 . 0 ... 1 @2op | 114 | + uint32_t max_entries; |
57 | -VMULH_U 111 1 1110 0 . .. ...1 ... 0 1110 . 0 . 0 ... 1 @2op | 115 | + uint64_t base_addr; |
58 | +# The VSHLL T2 encoding is not a @2op pattern, but is here because it | 116 | +} CmdQDesc; |
59 | +# overlaps what would be size=0b11 VMULH/VRMULH | 117 | + |
118 | struct GICv3ITSState { | ||
119 | SysBusDevice parent_obj; | ||
120 | |||
121 | @@ -XXX,XX +XXX,XX @@ struct GICv3ITSState { | ||
122 | uint64_t creadr; | ||
123 | uint64_t baser[8]; | ||
124 | |||
125 | + TableDesc dt; | ||
126 | + TableDesc ct; | ||
127 | + CmdQDesc cq; | ||
128 | + | ||
129 | Error *migration_blocker; | ||
130 | }; | ||
131 | |||
132 | diff --git a/hw/intc/arm_gicv3_its.c b/hw/intc/arm_gicv3_its.c | ||
133 | index XXXXXXX..XXXXXXX 100644 | ||
134 | --- a/hw/intc/arm_gicv3_its.c | ||
135 | +++ b/hw/intc/arm_gicv3_its.c | ||
136 | @@ -XXX,XX +XXX,XX @@ struct GICv3ITSClass { | ||
137 | void (*parent_reset)(DeviceState *dev); | ||
138 | }; | ||
139 | |||
140 | +static uint64_t baser_base_addr(uint64_t value, uint32_t page_sz) | ||
60 | +{ | 141 | +{ |
61 | + VSHLL_BS 111 0 1110 0 . 11 .. 01 ... 0 1110 0 0 . 0 ... 1 @2_shll_esize_b | 142 | + uint64_t result = 0; |
62 | + VSHLL_BS 111 0 1110 0 . 11 .. 01 ... 0 1110 0 0 . 0 ... 1 @2_shll_esize_h | 143 | + |
63 | 144 | + switch (page_sz) { | |
64 | -VRMULH_S 111 0 1110 0 . .. ...1 ... 1 1110 . 0 . 0 ... 1 @2op | 145 | + case GITS_PAGE_SIZE_4K: |
65 | -VRMULH_U 111 1 1110 0 . .. ...1 ... 1 1110 . 0 . 0 ... 1 @2op | 146 | + case GITS_PAGE_SIZE_16K: |
66 | + VMULH_S 111 0 1110 0 . .. ...1 ... 0 1110 . 0 . 0 ... 1 @2op | 147 | + result = FIELD_EX64(value, GITS_BASER, PHYADDR) << 12; |
148 | + break; | ||
149 | + | ||
150 | + case GITS_PAGE_SIZE_64K: | ||
151 | + result = FIELD_EX64(value, GITS_BASER, PHYADDRL_64K) << 16; | ||
152 | + result |= FIELD_EX64(value, GITS_BASER, PHYADDRH_64K) << 48; | ||
153 | + break; | ||
154 | + | ||
155 | + default: | ||
156 | + break; | ||
157 | + } | ||
158 | + return result; | ||
67 | +} | 159 | +} |
68 | + | 160 | + |
161 | +/* | ||
162 | + * This function extracts the ITS Device and Collection table specific | ||
163 | + * parameters (like base_addr, size etc) from GITS_BASER register. | ||
164 | + * It is called during ITS enable and also during post_load migration | ||
165 | + */ | ||
166 | +static void extract_table_params(GICv3ITSState *s) | ||
69 | +{ | 167 | +{ |
70 | + VSHLL_BU 111 1 1110 0 . 11 .. 01 ... 0 1110 0 0 . 0 ... 1 @2_shll_esize_b | 168 | + uint16_t num_pages = 0; |
71 | + VSHLL_BU 111 1 1110 0 . 11 .. 01 ... 0 1110 0 0 . 0 ... 1 @2_shll_esize_h | 169 | + uint8_t page_sz_type; |
72 | + | 170 | + uint8_t type; |
73 | + VMULH_U 111 1 1110 0 . .. ...1 ... 0 1110 . 0 . 0 ... 1 @2op | 171 | + uint32_t page_sz = 0; |
172 | + uint64_t value; | ||
173 | + | ||
174 | + for (int i = 0; i < 8; i++) { | ||
175 | + value = s->baser[i]; | ||
176 | + | ||
177 | + if (!value) { | ||
178 | + continue; | ||
179 | + } | ||
180 | + | ||
181 | + page_sz_type = FIELD_EX64(value, GITS_BASER, PAGESIZE); | ||
182 | + | ||
183 | + switch (page_sz_type) { | ||
184 | + case 0: | ||
185 | + page_sz = GITS_PAGE_SIZE_4K; | ||
186 | + break; | ||
187 | + | ||
188 | + case 1: | ||
189 | + page_sz = GITS_PAGE_SIZE_16K; | ||
190 | + break; | ||
191 | + | ||
192 | + case 2: | ||
193 | + case 3: | ||
194 | + page_sz = GITS_PAGE_SIZE_64K; | ||
195 | + break; | ||
196 | + | ||
197 | + default: | ||
198 | + g_assert_not_reached(); | ||
199 | + } | ||
200 | + | ||
201 | + num_pages = FIELD_EX64(value, GITS_BASER, SIZE) + 1; | ||
202 | + | ||
203 | + type = FIELD_EX64(value, GITS_BASER, TYPE); | ||
204 | + | ||
205 | + switch (type) { | ||
206 | + | ||
207 | + case GITS_BASER_TYPE_DEVICE: | ||
208 | + memset(&s->dt, 0 , sizeof(s->dt)); | ||
209 | + s->dt.valid = FIELD_EX64(value, GITS_BASER, VALID); | ||
210 | + | ||
211 | + if (!s->dt.valid) { | ||
212 | + return; | ||
213 | + } | ||
214 | + | ||
215 | + s->dt.page_sz = page_sz; | ||
216 | + s->dt.indirect = FIELD_EX64(value, GITS_BASER, INDIRECT); | ||
217 | + s->dt.entry_sz = FIELD_EX64(value, GITS_BASER, ENTRYSIZE); | ||
218 | + | ||
219 | + if (!s->dt.indirect) { | ||
220 | + s->dt.max_entries = (num_pages * page_sz) / s->dt.entry_sz; | ||
221 | + } else { | ||
222 | + s->dt.max_entries = (((num_pages * page_sz) / | ||
223 | + L1TABLE_ENTRY_SIZE) * | ||
224 | + (page_sz / s->dt.entry_sz)); | ||
225 | + } | ||
226 | + | ||
227 | + s->dt.maxids.max_devids = (1UL << (FIELD_EX64(s->typer, GITS_TYPER, | ||
228 | + DEVBITS) + 1)); | ||
229 | + | ||
230 | + s->dt.base_addr = baser_base_addr(value, page_sz); | ||
231 | + | ||
232 | + break; | ||
233 | + | ||
234 | + case GITS_BASER_TYPE_COLLECTION: | ||
235 | + memset(&s->ct, 0 , sizeof(s->ct)); | ||
236 | + s->ct.valid = FIELD_EX64(value, GITS_BASER, VALID); | ||
237 | + | ||
238 | + /* | ||
239 | + * GITS_TYPER.HCC is 0 for this implementation | ||
240 | + * hence writes are discarded if ct.valid is 0 | ||
241 | + */ | ||
242 | + if (!s->ct.valid) { | ||
243 | + return; | ||
244 | + } | ||
245 | + | ||
246 | + s->ct.page_sz = page_sz; | ||
247 | + s->ct.indirect = FIELD_EX64(value, GITS_BASER, INDIRECT); | ||
248 | + s->ct.entry_sz = FIELD_EX64(value, GITS_BASER, ENTRYSIZE); | ||
249 | + | ||
250 | + if (!s->ct.indirect) { | ||
251 | + s->ct.max_entries = (num_pages * page_sz) / s->ct.entry_sz; | ||
252 | + } else { | ||
253 | + s->ct.max_entries = (((num_pages * page_sz) / | ||
254 | + L1TABLE_ENTRY_SIZE) * | ||
255 | + (page_sz / s->ct.entry_sz)); | ||
256 | + } | ||
257 | + | ||
258 | + if (FIELD_EX64(s->typer, GITS_TYPER, CIL)) { | ||
259 | + s->ct.maxids.max_collids = (1UL << (FIELD_EX64(s->typer, | ||
260 | + GITS_TYPER, CIDBITS) + 1)); | ||
261 | + } else { | ||
262 | + /* 16-bit CollectionId supported when CIL == 0 */ | ||
263 | + s->ct.maxids.max_collids = (1UL << 16); | ||
264 | + } | ||
265 | + | ||
266 | + s->ct.base_addr = baser_base_addr(value, page_sz); | ||
267 | + | ||
268 | + break; | ||
269 | + | ||
270 | + default: | ||
271 | + break; | ||
272 | + } | ||
273 | + } | ||
74 | +} | 274 | +} |
75 | + | 275 | + |
276 | +static void extract_cmdq_params(GICv3ITSState *s) | ||
76 | +{ | 277 | +{ |
77 | + VSHLL_TS 111 0 1110 0 . 11 .. 01 ... 1 1110 0 0 . 0 ... 1 @2_shll_esize_b | 278 | + uint16_t num_pages = 0; |
78 | + VSHLL_TS 111 0 1110 0 . 11 .. 01 ... 1 1110 0 0 . 0 ... 1 @2_shll_esize_h | 279 | + uint64_t value = s->cbaser; |
79 | + | 280 | + |
80 | + VRMULH_S 111 0 1110 0 . .. ...1 ... 1 1110 . 0 . 0 ... 1 @2op | 281 | + num_pages = FIELD_EX64(value, GITS_CBASER, SIZE) + 1; |
282 | + | ||
283 | + memset(&s->cq, 0 , sizeof(s->cq)); | ||
284 | + s->cq.valid = FIELD_EX64(value, GITS_CBASER, VALID); | ||
285 | + | ||
286 | + if (s->cq.valid) { | ||
287 | + s->cq.max_entries = (num_pages * GITS_PAGE_SIZE_4K) / | ||
288 | + GITS_CMDQ_ENTRY_SIZE; | ||
289 | + s->cq.base_addr = FIELD_EX64(value, GITS_CBASER, PHYADDR); | ||
290 | + s->cq.base_addr <<= R_GITS_CBASER_PHYADDR_SHIFT; | ||
291 | + } | ||
81 | +} | 292 | +} |
82 | + | 293 | + |
294 | static MemTxResult gicv3_its_translation_write(void *opaque, hwaddr offset, | ||
295 | uint64_t data, unsigned size, | ||
296 | MemTxAttrs attrs) | ||
297 | @@ -XXX,XX +XXX,XX @@ static bool its_writel(GICv3ITSState *s, hwaddr offset, | ||
298 | uint64_t value, MemTxAttrs attrs) | ||
299 | { | ||
300 | bool result = true; | ||
301 | + int index; | ||
302 | |||
303 | + switch (offset) { | ||
304 | + case GITS_CTLR: | ||
305 | + s->ctlr |= (value & ~(s->ctlr)); | ||
306 | + | ||
307 | + if (s->ctlr & ITS_CTLR_ENABLED) { | ||
308 | + extract_table_params(s); | ||
309 | + extract_cmdq_params(s); | ||
310 | + s->creadr = 0; | ||
311 | + } | ||
312 | + break; | ||
313 | + case GITS_CBASER: | ||
314 | + /* | ||
315 | + * IMPDEF choice:- GITS_CBASER register becomes RO if ITS is | ||
316 | + * already enabled | ||
317 | + */ | ||
318 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
319 | + s->cbaser = deposit64(s->cbaser, 0, 32, value); | ||
320 | + s->creadr = 0; | ||
321 | + s->cwriter = s->creadr; | ||
322 | + } | ||
323 | + break; | ||
324 | + case GITS_CBASER + 4: | ||
325 | + /* | ||
326 | + * IMPDEF choice:- GITS_CBASER register becomes RO if ITS is | ||
327 | + * already enabled | ||
328 | + */ | ||
329 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
330 | + s->cbaser = deposit64(s->cbaser, 32, 32, value); | ||
331 | + s->creadr = 0; | ||
332 | + s->cwriter = s->creadr; | ||
333 | + } | ||
334 | + break; | ||
335 | + case GITS_CWRITER: | ||
336 | + s->cwriter = deposit64(s->cwriter, 0, 32, | ||
337 | + (value & ~R_GITS_CWRITER_RETRY_MASK)); | ||
338 | + break; | ||
339 | + case GITS_CWRITER + 4: | ||
340 | + s->cwriter = deposit64(s->cwriter, 32, 32, value); | ||
341 | + break; | ||
342 | + case GITS_CREADR: | ||
343 | + if (s->gicv3->gicd_ctlr & GICD_CTLR_DS) { | ||
344 | + s->creadr = deposit64(s->creadr, 0, 32, | ||
345 | + (value & ~R_GITS_CREADR_STALLED_MASK)); | ||
346 | + } else { | ||
347 | + /* RO register, ignore the write */ | ||
348 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
349 | + "%s: invalid guest write to RO register at offset " | ||
350 | + TARGET_FMT_plx "\n", __func__, offset); | ||
351 | + } | ||
352 | + break; | ||
353 | + case GITS_CREADR + 4: | ||
354 | + if (s->gicv3->gicd_ctlr & GICD_CTLR_DS) { | ||
355 | + s->creadr = deposit64(s->creadr, 32, 32, value); | ||
356 | + } else { | ||
357 | + /* RO register, ignore the write */ | ||
358 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
359 | + "%s: invalid guest write to RO register at offset " | ||
360 | + TARGET_FMT_plx "\n", __func__, offset); | ||
361 | + } | ||
362 | + break; | ||
363 | + case GITS_BASER ... GITS_BASER + 0x3f: | ||
364 | + /* | ||
365 | + * IMPDEF choice:- GITS_BASERn register becomes RO if ITS is | ||
366 | + * already enabled | ||
367 | + */ | ||
368 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
369 | + index = (offset - GITS_BASER) / 8; | ||
370 | + | ||
371 | + if (offset & 7) { | ||
372 | + value <<= 32; | ||
373 | + value &= ~GITS_BASER_RO_MASK; | ||
374 | + s->baser[index] &= GITS_BASER_RO_MASK | MAKE_64BIT_MASK(0, 32); | ||
375 | + s->baser[index] |= value; | ||
376 | + } else { | ||
377 | + value &= ~GITS_BASER_RO_MASK; | ||
378 | + s->baser[index] &= GITS_BASER_RO_MASK | MAKE_64BIT_MASK(32, 32); | ||
379 | + s->baser[index] |= value; | ||
380 | + } | ||
381 | + } | ||
382 | + break; | ||
383 | + case GITS_IIDR: | ||
384 | + case GITS_IDREGS ... GITS_IDREGS + 0x2f: | ||
385 | + /* RO registers, ignore the write */ | ||
386 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
387 | + "%s: invalid guest write to RO register at offset " | ||
388 | + TARGET_FMT_plx "\n", __func__, offset); | ||
389 | + break; | ||
390 | + default: | ||
391 | + result = false; | ||
392 | + break; | ||
393 | + } | ||
394 | return result; | ||
395 | } | ||
396 | |||
397 | @@ -XXX,XX +XXX,XX @@ static bool its_readl(GICv3ITSState *s, hwaddr offset, | ||
398 | uint64_t *data, MemTxAttrs attrs) | ||
399 | { | ||
400 | bool result = true; | ||
401 | + int index; | ||
402 | |||
403 | + switch (offset) { | ||
404 | + case GITS_CTLR: | ||
405 | + *data = s->ctlr; | ||
406 | + break; | ||
407 | + case GITS_IIDR: | ||
408 | + *data = gicv3_iidr(); | ||
409 | + break; | ||
410 | + case GITS_IDREGS ... GITS_IDREGS + 0x2f: | ||
411 | + /* ID registers */ | ||
412 | + *data = gicv3_idreg(offset - GITS_IDREGS); | ||
413 | + break; | ||
414 | + case GITS_TYPER: | ||
415 | + *data = extract64(s->typer, 0, 32); | ||
416 | + break; | ||
417 | + case GITS_TYPER + 4: | ||
418 | + *data = extract64(s->typer, 32, 32); | ||
419 | + break; | ||
420 | + case GITS_CBASER: | ||
421 | + *data = extract64(s->cbaser, 0, 32); | ||
422 | + break; | ||
423 | + case GITS_CBASER + 4: | ||
424 | + *data = extract64(s->cbaser, 32, 32); | ||
425 | + break; | ||
426 | + case GITS_CREADR: | ||
427 | + *data = extract64(s->creadr, 0, 32); | ||
428 | + break; | ||
429 | + case GITS_CREADR + 4: | ||
430 | + *data = extract64(s->creadr, 32, 32); | ||
431 | + break; | ||
432 | + case GITS_CWRITER: | ||
433 | + *data = extract64(s->cwriter, 0, 32); | ||
434 | + break; | ||
435 | + case GITS_CWRITER + 4: | ||
436 | + *data = extract64(s->cwriter, 32, 32); | ||
437 | + break; | ||
438 | + case GITS_BASER ... GITS_BASER + 0x3f: | ||
439 | + index = (offset - GITS_BASER) / 8; | ||
440 | + if (offset & 7) { | ||
441 | + *data = extract64(s->baser[index], 32, 32); | ||
442 | + } else { | ||
443 | + *data = extract64(s->baser[index], 0, 32); | ||
444 | + } | ||
445 | + break; | ||
446 | + default: | ||
447 | + result = false; | ||
448 | + break; | ||
449 | + } | ||
450 | return result; | ||
451 | } | ||
452 | |||
453 | @@ -XXX,XX +XXX,XX @@ static bool its_writell(GICv3ITSState *s, hwaddr offset, | ||
454 | uint64_t value, MemTxAttrs attrs) | ||
455 | { | ||
456 | bool result = true; | ||
457 | + int index; | ||
458 | |||
459 | + switch (offset) { | ||
460 | + case GITS_BASER ... GITS_BASER + 0x3f: | ||
461 | + /* | ||
462 | + * IMPDEF choice:- GITS_BASERn register becomes RO if ITS is | ||
463 | + * already enabled | ||
464 | + */ | ||
465 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
466 | + index = (offset - GITS_BASER) / 8; | ||
467 | + s->baser[index] &= GITS_BASER_RO_MASK; | ||
468 | + s->baser[index] |= (value & ~GITS_BASER_RO_MASK); | ||
469 | + } | ||
470 | + break; | ||
471 | + case GITS_CBASER: | ||
472 | + /* | ||
473 | + * IMPDEF choice:- GITS_CBASER register becomes RO if ITS is | ||
474 | + * already enabled | ||
475 | + */ | ||
476 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
477 | + s->cbaser = value; | ||
478 | + s->creadr = 0; | ||
479 | + s->cwriter = s->creadr; | ||
480 | + } | ||
481 | + break; | ||
482 | + case GITS_CWRITER: | ||
483 | + s->cwriter = value & ~R_GITS_CWRITER_RETRY_MASK; | ||
484 | + break; | ||
485 | + case GITS_CREADR: | ||
486 | + if (s->gicv3->gicd_ctlr & GICD_CTLR_DS) { | ||
487 | + s->creadr = value & ~R_GITS_CREADR_STALLED_MASK; | ||
488 | + } else { | ||
489 | + /* RO register, ignore the write */ | ||
490 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
491 | + "%s: invalid guest write to RO register at offset " | ||
492 | + TARGET_FMT_plx "\n", __func__, offset); | ||
493 | + } | ||
494 | + break; | ||
495 | + case GITS_TYPER: | ||
496 | + /* RO registers, ignore the write */ | ||
497 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
498 | + "%s: invalid guest write to RO register at offset " | ||
499 | + TARGET_FMT_plx "\n", __func__, offset); | ||
500 | + break; | ||
501 | + default: | ||
502 | + result = false; | ||
503 | + break; | ||
504 | + } | ||
505 | return result; | ||
506 | } | ||
507 | |||
508 | @@ -XXX,XX +XXX,XX @@ static bool its_readll(GICv3ITSState *s, hwaddr offset, | ||
509 | uint64_t *data, MemTxAttrs attrs) | ||
510 | { | ||
511 | bool result = true; | ||
512 | + int index; | ||
513 | |||
514 | + switch (offset) { | ||
515 | + case GITS_TYPER: | ||
516 | + *data = s->typer; | ||
517 | + break; | ||
518 | + case GITS_BASER ... GITS_BASER + 0x3f: | ||
519 | + index = (offset - GITS_BASER) / 8; | ||
520 | + *data = s->baser[index]; | ||
521 | + break; | ||
522 | + case GITS_CBASER: | ||
523 | + *data = s->cbaser; | ||
524 | + break; | ||
525 | + case GITS_CREADR: | ||
526 | + *data = s->creadr; | ||
527 | + break; | ||
528 | + case GITS_CWRITER: | ||
529 | + *data = s->cwriter; | ||
530 | + break; | ||
531 | + default: | ||
532 | + result = false; | ||
533 | + break; | ||
534 | + } | ||
535 | return result; | ||
536 | } | ||
537 | |||
538 | @@ -XXX,XX +XXX,XX @@ static void gicv3_arm_its_realize(DeviceState *dev, Error **errp) | ||
539 | |||
540 | gicv3_its_init_mmio(s, &gicv3_its_control_ops, &gicv3_its_translation_ops); | ||
541 | |||
542 | + address_space_init(&s->gicv3->dma_as, s->gicv3->dma, | ||
543 | + "gicv3-its-sysmem"); | ||
544 | + | ||
545 | /* set the ITS default features supported */ | ||
546 | s->typer = FIELD_DP64(s->typer, GITS_TYPER, PHYSICAL, | ||
547 | GITS_TYPE_PHYSICAL); | ||
548 | @@ -XXX,XX +XXX,XX @@ static void gicv3_its_reset(DeviceState *dev) | ||
549 | GITS_CTE_SIZE - 1); | ||
550 | } | ||
551 | |||
552 | +static void gicv3_its_post_load(GICv3ITSState *s) | ||
83 | +{ | 553 | +{ |
84 | + VSHLL_TU 111 1 1110 0 . 11 .. 01 ... 1 1110 0 0 . 0 ... 1 @2_shll_esize_b | 554 | + if (s->ctlr & ITS_CTLR_ENABLED) { |
85 | + VSHLL_TU 111 1 1110 0 . 11 .. 01 ... 1 1110 0 0 . 0 ... 1 @2_shll_esize_h | 555 | + extract_table_params(s); |
86 | + | 556 | + extract_cmdq_params(s); |
87 | + VRMULH_U 111 1 1110 0 . .. ...1 ... 1 1110 . 0 . 0 ... 1 @2op | 557 | + } |
88 | +} | 558 | +} |
89 | 559 | + | |
90 | VMAX_S 111 0 1111 0 . .. ... 0 ... 0 0110 . 1 . 0 ... 0 @2op | 560 | static Property gicv3_its_props[] = { |
91 | VMAX_U 111 1 1111 0 . .. ... 0 ... 0 0110 . 1 . 0 ... 0 @2op | 561 | DEFINE_PROP_LINK("parent-gicv3", GICv3ITSState, gicv3, "arm-gicv3", |
92 | @@ -XXX,XX +XXX,XX @@ VRSHRI_S 111 0 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_w | 562 | GICv3State *), |
93 | VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_b | 563 | @@ -XXX,XX +XXX,XX @@ static void gicv3_its_class_init(ObjectClass *klass, void *data) |
94 | VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_h | 564 | { |
95 | VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_w | 565 | DeviceClass *dc = DEVICE_CLASS(klass); |
96 | + | 566 | GICv3ITSClass *ic = ARM_GICV3_ITS_CLASS(klass); |
97 | +# VSHLL T1 encoding; the T2 VSHLL encoding is elsewhere in this file | 567 | + GICv3ITSCommonClass *icc = ARM_GICV3_ITS_COMMON_CLASS(klass); |
98 | +VSHLL_BS 111 0 1110 1 . 1 .. ... ... 0 1111 0 1 . 0 ... 0 @2_shll_b | 568 | |
99 | +VSHLL_BS 111 0 1110 1 . 1 .. ... ... 0 1111 0 1 . 0 ... 0 @2_shll_h | 569 | dc->realize = gicv3_arm_its_realize; |
100 | + | 570 | device_class_set_props(dc, gicv3_its_props); |
101 | +VSHLL_BU 111 1 1110 1 . 1 .. ... ... 0 1111 0 1 . 0 ... 0 @2_shll_b | 571 | device_class_set_parent_reset(dc, gicv3_its_reset, &ic->parent_reset); |
102 | +VSHLL_BU 111 1 1110 1 . 1 .. ... ... 0 1111 0 1 . 0 ... 0 @2_shll_h | 572 | + icc->post_load = gicv3_its_post_load; |
103 | + | 573 | } |
104 | +VSHLL_TS 111 0 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_b | 574 | |
105 | +VSHLL_TS 111 0 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_h | 575 | static const TypeInfo gicv3_its_info = { |
106 | + | ||
107 | +VSHLL_TU 111 1 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_b | ||
108 | +VSHLL_TU 111 1 1110 1 . 1 .. ... ... 1 1111 0 1 . 0 ... 0 @2_shll_h | ||
109 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
110 | index XXXXXXX..XXXXXXX 100644 | ||
111 | --- a/target/arm/mve_helper.c | ||
112 | +++ b/target/arm/mve_helper.c | ||
113 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT_SAT_S(vqshli_s, DO_SQSHL_OP) | ||
114 | DO_2SHIFT_SAT_S(vqshlui_s, DO_SUQSHL_OP) | ||
115 | DO_2SHIFT_U(vrshli_u, DO_VRSHLU) | ||
116 | DO_2SHIFT_S(vrshli_s, DO_VRSHLS) | ||
117 | + | ||
118 | +/* | ||
119 | + * Long shifts taking half-sized inputs from top or bottom of the input | ||
120 | + * vector and producing a double-width result. ESIZE, TYPE are for | ||
121 | + * the input, and LESIZE, LTYPE for the output. | ||
122 | + * Unlike the normal shift helpers, we do not handle negative shift counts, | ||
123 | + * because the long shift is strictly left-only. | ||
124 | + */ | ||
125 | +#define DO_VSHLL(OP, TOP, ESIZE, TYPE, LESIZE, LTYPE) \ | ||
126 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
127 | + void *vm, uint32_t shift) \ | ||
128 | + { \ | ||
129 | + LTYPE *d = vd; \ | ||
130 | + TYPE *m = vm; \ | ||
131 | + uint16_t mask = mve_element_mask(env); \ | ||
132 | + unsigned le; \ | ||
133 | + assert(shift <= 16); \ | ||
134 | + for (le = 0; le < 16 / LESIZE; le++, mask >>= LESIZE) { \ | ||
135 | + LTYPE r = (LTYPE)m[H##ESIZE(le * 2 + TOP)] << shift; \ | ||
136 | + mergemask(&d[H##LESIZE(le)], r, mask); \ | ||
137 | + } \ | ||
138 | + mve_advance_vpt(env); \ | ||
139 | + } | ||
140 | + | ||
141 | +#define DO_VSHLL_ALL(OP, TOP) \ | ||
142 | + DO_VSHLL(OP##sb, TOP, 1, int8_t, 2, int16_t) \ | ||
143 | + DO_VSHLL(OP##ub, TOP, 1, uint8_t, 2, uint16_t) \ | ||
144 | + DO_VSHLL(OP##sh, TOP, 2, int16_t, 4, int32_t) \ | ||
145 | + DO_VSHLL(OP##uh, TOP, 2, uint16_t, 4, uint32_t) \ | ||
146 | + | ||
147 | +DO_VSHLL_ALL(vshllb, false) | ||
148 | +DO_VSHLL_ALL(vshllt, true) | ||
149 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
150 | index XXXXXXX..XXXXXXX 100644 | ||
151 | --- a/target/arm/translate-mve.c | ||
152 | +++ b/target/arm/translate-mve.c | ||
153 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT(VSHRI_S, vshli_s, true) | ||
154 | DO_2SHIFT(VSHRI_U, vshli_u, true) | ||
155 | DO_2SHIFT(VRSHRI_S, vrshli_s, true) | ||
156 | DO_2SHIFT(VRSHRI_U, vrshli_u, true) | ||
157 | + | ||
158 | +#define DO_VSHLL(INSN, FN) \ | ||
159 | + static bool trans_##INSN(DisasContext *s, arg_2shift *a) \ | ||
160 | + { \ | ||
161 | + static MVEGenTwoOpShiftFn * const fns[] = { \ | ||
162 | + gen_helper_mve_##FN##b, \ | ||
163 | + gen_helper_mve_##FN##h, \ | ||
164 | + }; \ | ||
165 | + return do_2shift(s, a, fns[a->size], false); \ | ||
166 | + } | ||
167 | + | ||
168 | +DO_VSHLL(VSHLL_BS, vshllbs) | ||
169 | +DO_VSHLL(VSHLL_BU, vshllbu) | ||
170 | +DO_VSHLL(VSHLL_TS, vshllts) | ||
171 | +DO_VSHLL(VSHLL_TU, vshlltu) | ||
172 | -- | 576 | -- |
173 | 2.20.1 | 577 | 2.20.1 |
174 | 578 | ||
175 | 579 | diff view generated by jsdifflib |
1 | Implement the MVE shifts by register, which perform | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | shifts on a single general-purpose register. | ||
3 | 2 | ||
3 | Added functionality to trigger ITS command queue processing on | ||
4 | write to CWRITE register and process each command queue entry to | ||
5 | identify the command type and handle commands like MAPD,MAPC,SYNC. | ||
6 | |||
7 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | Reviewed-by: Eric Auger <eric.auger@redhat.com> | ||
10 | Tested-by: Neil Armstrong <narmstrong@baylibre.com> | ||
11 | Message-id: 20210910143951.92242-4-shashi.mallela@linaro.org | ||
4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
6 | Message-id: 20210628135835.6690-19-peter.maydell@linaro.org | ||
7 | --- | 13 | --- |
8 | target/arm/helper-mve.h | 2 ++ | 14 | hw/intc/gicv3_internal.h | 40 +++++ |
9 | target/arm/translate.h | 1 + | 15 | hw/intc/arm_gicv3_its.c | 319 +++++++++++++++++++++++++++++++++++++++ |
10 | target/arm/t32.decode | 18 ++++++++++++++---- | 16 | 2 files changed, 359 insertions(+) |
11 | target/arm/mve_helper.c | 10 ++++++++++ | ||
12 | target/arm/translate.c | 30 ++++++++++++++++++++++++++++++ | ||
13 | 5 files changed, 57 insertions(+), 4 deletions(-) | ||
14 | 17 | ||
15 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 18 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
16 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-mve.h | 20 | --- a/hw/intc/gicv3_internal.h |
18 | +++ b/target/arm/helper-mve.h | 21 | +++ b/hw/intc/gicv3_internal.h |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_uqrshll48, TCG_CALL_NO_RWG, i64, env, i64, i32) | 22 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_TYPER, CIL, 36, 1) |
20 | 23 | #define L1TABLE_ENTRY_SIZE 8 | |
21 | DEF_HELPER_FLAGS_3(mve_uqshl, TCG_CALL_NO_RWG, i32, env, i32, i32) | 24 | |
22 | DEF_HELPER_FLAGS_3(mve_sqshl, TCG_CALL_NO_RWG, i32, env, i32, i32) | 25 | #define GITS_CMDQ_ENTRY_SIZE 32 |
23 | +DEF_HELPER_FLAGS_3(mve_uqrshl, TCG_CALL_NO_RWG, i32, env, i32, i32) | 26 | +#define NUM_BYTES_IN_DW 8 |
24 | +DEF_HELPER_FLAGS_3(mve_sqrshr, TCG_CALL_NO_RWG, i32, env, i32, i32) | 27 | + |
25 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 28 | +#define CMD_MASK 0xff |
29 | + | ||
30 | +/* ITS Commands */ | ||
31 | +#define GITS_CMD_CLEAR 0x04 | ||
32 | +#define GITS_CMD_DISCARD 0x0F | ||
33 | +#define GITS_CMD_INT 0x03 | ||
34 | +#define GITS_CMD_MAPC 0x09 | ||
35 | +#define GITS_CMD_MAPD 0x08 | ||
36 | +#define GITS_CMD_MAPI 0x0B | ||
37 | +#define GITS_CMD_MAPTI 0x0A | ||
38 | +#define GITS_CMD_INV 0x0C | ||
39 | +#define GITS_CMD_INVALL 0x0D | ||
40 | +#define GITS_CMD_SYNC 0x05 | ||
41 | + | ||
42 | +/* MAPC command fields */ | ||
43 | +#define ICID_LENGTH 16 | ||
44 | +#define ICID_MASK ((1U << ICID_LENGTH) - 1) | ||
45 | +FIELD(MAPC, RDBASE, 16, 32) | ||
46 | + | ||
47 | +#define RDBASE_PROCNUM_LENGTH 16 | ||
48 | +#define RDBASE_PROCNUM_MASK ((1ULL << RDBASE_PROCNUM_LENGTH) - 1) | ||
49 | + | ||
50 | +/* MAPD command fields */ | ||
51 | +#define ITTADDR_LENGTH 44 | ||
52 | +#define ITTADDR_SHIFT 8 | ||
53 | +#define ITTADDR_MASK MAKE_64BIT_MASK(ITTADDR_SHIFT, ITTADDR_LENGTH) | ||
54 | +#define SIZE_MASK 0x1f | ||
55 | + | ||
56 | +#define DEVID_SHIFT 32 | ||
57 | +#define DEVID_MASK MAKE_64BIT_MASK(32, 32) | ||
58 | + | ||
59 | +#define VALID_SHIFT 63 | ||
60 | +#define CMD_FIELD_VALID_MASK (1ULL << VALID_SHIFT) | ||
61 | +#define L2_TABLE_VALID_MASK CMD_FIELD_VALID_MASK | ||
62 | +#define TABLE_ENTRY_VALID_MASK (1ULL << 0) | ||
63 | |||
64 | /** | ||
65 | * Default features advertised by this version of ITS | ||
66 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_TYPER, CIL, 36, 1) | ||
67 | * Valid = 1 bit,ITTAddr = 44 bits,Size = 5 bits | ||
68 | */ | ||
69 | #define GITS_DTE_SIZE (0x8ULL) | ||
70 | +#define GITS_DTE_ITTADDR_SHIFT 6 | ||
71 | +#define GITS_DTE_ITTADDR_MASK MAKE_64BIT_MASK(GITS_DTE_ITTADDR_SHIFT, \ | ||
72 | + ITTADDR_LENGTH) | ||
73 | |||
74 | /* | ||
75 | * 8 bytes Collection Table Entry size | ||
76 | diff --git a/hw/intc/arm_gicv3_its.c b/hw/intc/arm_gicv3_its.c | ||
26 | index XXXXXXX..XXXXXXX 100644 | 77 | index XXXXXXX..XXXXXXX 100644 |
27 | --- a/target/arm/translate.h | 78 | --- a/hw/intc/arm_gicv3_its.c |
28 | +++ b/target/arm/translate.h | 79 | +++ b/hw/intc/arm_gicv3_its.c |
29 | @@ -XXX,XX +XXX,XX @@ typedef void AtomicThreeOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGArg, MemOp); | 80 | @@ -XXX,XX +XXX,XX @@ static uint64_t baser_base_addr(uint64_t value, uint32_t page_sz) |
30 | typedef void WideShiftImmFn(TCGv_i64, TCGv_i64, int64_t shift); | 81 | return result; |
31 | typedef void WideShiftFn(TCGv_i64, TCGv_ptr, TCGv_i64, TCGv_i32); | ||
32 | typedef void ShiftImmFn(TCGv_i32, TCGv_i32, int32_t shift); | ||
33 | +typedef void ShiftFn(TCGv_i32, TCGv_ptr, TCGv_i32, TCGv_i32); | ||
34 | |||
35 | /** | ||
36 | * arm_tbflags_from_tb: | ||
37 | diff --git a/target/arm/t32.decode b/target/arm/t32.decode | ||
38 | index XXXXXXX..XXXXXXX 100644 | ||
39 | --- a/target/arm/t32.decode | ||
40 | +++ b/target/arm/t32.decode | ||
41 | @@ -XXX,XX +XXX,XX @@ | ||
42 | &mve_shl_ri rdalo rdahi shim | ||
43 | &mve_shl_rr rdalo rdahi rm | ||
44 | &mve_sh_ri rda shim | ||
45 | +&mve_sh_rr rda rm | ||
46 | |||
47 | # rdahi: bits [3:1] from insn, bit 0 is 1 | ||
48 | # rdalo: bits [3:1] from insn, bit 0 is 0 | ||
49 | @@ -XXX,XX +XXX,XX @@ | ||
50 | &mve_shl_rr rdalo=%rdalo_17 rdahi=%rdahi_9 | ||
51 | @mve_sh_ri ....... .... . rda:4 . ... ... . .. .. .... \ | ||
52 | &mve_sh_ri shim=%imm5_12_6 | ||
53 | +@mve_sh_rr ....... .... . rda:4 rm:4 .... .... .... &mve_sh_rr | ||
54 | |||
55 | { | ||
56 | TST_xrri 1110101 0000 1 .... 0 ... 1111 .... .... @S_xrr_shi | ||
57 | @@ -XXX,XX +XXX,XX @@ BIC_rrri 1110101 0001 . .... 0 ... .... .... .... @s_rrr_shi | ||
58 | SQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 11 1111 @mve_shl_ri | ||
59 | } | ||
60 | |||
61 | - LSLL_rr 1110101 0010 1 ... 0 .... ... 1 0000 1101 @mve_shl_rr | ||
62 | - ASRL_rr 1110101 0010 1 ... 0 .... ... 1 0010 1101 @mve_shl_rr | ||
63 | - UQRSHLL64_rr 1110101 0010 1 ... 1 .... ... 1 0000 1101 @mve_shl_rr | ||
64 | - SQRSHRL64_rr 1110101 0010 1 ... 1 .... ... 1 0010 1101 @mve_shl_rr | ||
65 | + { | ||
66 | + UQRSHL_rr 1110101 0010 1 .... .... 1111 0000 1101 @mve_sh_rr | ||
67 | + LSLL_rr 1110101 0010 1 ... 0 .... ... 1 0000 1101 @mve_shl_rr | ||
68 | + UQRSHLL64_rr 1110101 0010 1 ... 1 .... ... 1 0000 1101 @mve_shl_rr | ||
69 | + } | ||
70 | + | ||
71 | + { | ||
72 | + SQRSHR_rr 1110101 0010 1 .... .... 1111 0010 1101 @mve_sh_rr | ||
73 | + ASRL_rr 1110101 0010 1 ... 0 .... ... 1 0010 1101 @mve_shl_rr | ||
74 | + SQRSHRL64_rr 1110101 0010 1 ... 1 .... ... 1 0010 1101 @mve_shl_rr | ||
75 | + } | ||
76 | + | ||
77 | UQRSHLL48_rr 1110101 0010 1 ... 1 .... ... 1 1000 1101 @mve_shl_rr | ||
78 | SQRSHRL48_rr 1110101 0010 1 ... 1 .... ... 1 1010 1101 @mve_shl_rr | ||
79 | ] | ||
80 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
81 | index XXXXXXX..XXXXXXX 100644 | ||
82 | --- a/target/arm/mve_helper.c | ||
83 | +++ b/target/arm/mve_helper.c | ||
84 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(mve_sqshl)(CPUARMState *env, uint32_t n, uint32_t shift) | ||
85 | { | ||
86 | return do_sqrshl_bhs(n, (int8_t)shift, 32, false, &env->QF); | ||
87 | } | 82 | } |
88 | + | 83 | |
89 | +uint32_t HELPER(mve_uqrshl)(CPUARMState *env, uint32_t n, uint32_t shift) | 84 | +static bool update_cte(GICv3ITSState *s, uint16_t icid, bool valid, |
85 | + uint64_t rdbase) | ||
90 | +{ | 86 | +{ |
91 | + return do_uqrshl_bhs(n, (int8_t)shift, 32, true, &env->QF); | 87 | + AddressSpace *as = &s->gicv3->dma_as; |
88 | + uint64_t value; | ||
89 | + uint64_t l2t_addr; | ||
90 | + bool valid_l2t; | ||
91 | + uint32_t l2t_id; | ||
92 | + uint32_t max_l2_entries; | ||
93 | + uint64_t cte = 0; | ||
94 | + MemTxResult res = MEMTX_OK; | ||
95 | + | ||
96 | + if (!s->ct.valid) { | ||
97 | + return true; | ||
98 | + } | ||
99 | + | ||
100 | + if (valid) { | ||
101 | + /* add mapping entry to collection table */ | ||
102 | + cte = (valid & TABLE_ENTRY_VALID_MASK) | (rdbase << 1ULL); | ||
103 | + } | ||
104 | + | ||
105 | + /* | ||
106 | + * The specification defines the format of level 1 entries of a | ||
107 | + * 2-level table, but the format of level 2 entries and the format | ||
108 | + * of flat-mapped tables is IMPDEF. | ||
109 | + */ | ||
110 | + if (s->ct.indirect) { | ||
111 | + l2t_id = icid / (s->ct.page_sz / L1TABLE_ENTRY_SIZE); | ||
112 | + | ||
113 | + value = address_space_ldq_le(as, | ||
114 | + s->ct.base_addr + | ||
115 | + (l2t_id * L1TABLE_ENTRY_SIZE), | ||
116 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
117 | + | ||
118 | + if (res != MEMTX_OK) { | ||
119 | + return false; | ||
120 | + } | ||
121 | + | ||
122 | + valid_l2t = (value & L2_TABLE_VALID_MASK) != 0; | ||
123 | + | ||
124 | + if (valid_l2t) { | ||
125 | + max_l2_entries = s->ct.page_sz / s->ct.entry_sz; | ||
126 | + | ||
127 | + l2t_addr = value & ((1ULL << 51) - 1); | ||
128 | + | ||
129 | + address_space_stq_le(as, l2t_addr + | ||
130 | + ((icid % max_l2_entries) * GITS_CTE_SIZE), | ||
131 | + cte, MEMTXATTRS_UNSPECIFIED, &res); | ||
132 | + } | ||
133 | + } else { | ||
134 | + /* Flat level table */ | ||
135 | + address_space_stq_le(as, s->ct.base_addr + (icid * GITS_CTE_SIZE), | ||
136 | + cte, MEMTXATTRS_UNSPECIFIED, &res); | ||
137 | + } | ||
138 | + if (res != MEMTX_OK) { | ||
139 | + return false; | ||
140 | + } else { | ||
141 | + return true; | ||
142 | + } | ||
92 | +} | 143 | +} |
93 | + | 144 | + |
94 | +uint32_t HELPER(mve_sqrshr)(CPUARMState *env, uint32_t n, uint32_t shift) | 145 | +static bool process_mapc(GICv3ITSState *s, uint32_t offset) |
95 | +{ | 146 | +{ |
96 | + return do_sqrshl_bhs(n, -(int8_t)shift, 32, true, &env->QF); | 147 | + AddressSpace *as = &s->gicv3->dma_as; |
148 | + uint16_t icid; | ||
149 | + uint64_t rdbase; | ||
150 | + bool valid; | ||
151 | + MemTxResult res = MEMTX_OK; | ||
152 | + bool result = false; | ||
153 | + uint64_t value; | ||
154 | + | ||
155 | + offset += NUM_BYTES_IN_DW; | ||
156 | + offset += NUM_BYTES_IN_DW; | ||
157 | + | ||
158 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
159 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
160 | + | ||
161 | + if (res != MEMTX_OK) { | ||
162 | + return result; | ||
163 | + } | ||
164 | + | ||
165 | + icid = value & ICID_MASK; | ||
166 | + | ||
167 | + rdbase = (value & R_MAPC_RDBASE_MASK) >> R_MAPC_RDBASE_SHIFT; | ||
168 | + rdbase &= RDBASE_PROCNUM_MASK; | ||
169 | + | ||
170 | + valid = (value & CMD_FIELD_VALID_MASK); | ||
171 | + | ||
172 | + if ((icid > s->ct.maxids.max_collids) || (rdbase > s->gicv3->num_cpu)) { | ||
173 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
174 | + "ITS MAPC: invalid collection table attributes " | ||
175 | + "icid %d rdbase %lu\n", icid, rdbase); | ||
176 | + /* | ||
177 | + * in this implementation, in case of error | ||
178 | + * we ignore this command and move onto the next | ||
179 | + * command in the queue | ||
180 | + */ | ||
181 | + } else { | ||
182 | + result = update_cte(s, icid, valid, rdbase); | ||
183 | + } | ||
184 | + | ||
185 | + return result; | ||
97 | +} | 186 | +} |
98 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 187 | + |
99 | index XXXXXXX..XXXXXXX 100644 | 188 | +static bool update_dte(GICv3ITSState *s, uint32_t devid, bool valid, |
100 | --- a/target/arm/translate.c | 189 | + uint8_t size, uint64_t itt_addr) |
101 | +++ b/target/arm/translate.c | ||
102 | @@ -XXX,XX +XXX,XX @@ static bool trans_UQSHL_ri(DisasContext *s, arg_mve_sh_ri *a) | ||
103 | return do_mve_sh_ri(s, a, gen_mve_uqshl); | ||
104 | } | ||
105 | |||
106 | +static bool do_mve_sh_rr(DisasContext *s, arg_mve_sh_rr *a, ShiftFn *fn) | ||
107 | +{ | 190 | +{ |
108 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_1M)) { | 191 | + AddressSpace *as = &s->gicv3->dma_as; |
109 | + /* Decode falls through to ORR/MOV UNPREDICTABLE handling */ | 192 | + uint64_t value; |
193 | + uint64_t l2t_addr; | ||
194 | + bool valid_l2t; | ||
195 | + uint32_t l2t_id; | ||
196 | + uint32_t max_l2_entries; | ||
197 | + uint64_t dte = 0; | ||
198 | + MemTxResult res = MEMTX_OK; | ||
199 | + | ||
200 | + if (s->dt.valid) { | ||
201 | + if (valid) { | ||
202 | + /* add mapping entry to device table */ | ||
203 | + dte = (valid & TABLE_ENTRY_VALID_MASK) | | ||
204 | + ((size & SIZE_MASK) << 1U) | | ||
205 | + (itt_addr << GITS_DTE_ITTADDR_SHIFT); | ||
206 | + } | ||
207 | + } else { | ||
208 | + return true; | ||
209 | + } | ||
210 | + | ||
211 | + /* | ||
212 | + * The specification defines the format of level 1 entries of a | ||
213 | + * 2-level table, but the format of level 2 entries and the format | ||
214 | + * of flat-mapped tables is IMPDEF. | ||
215 | + */ | ||
216 | + if (s->dt.indirect) { | ||
217 | + l2t_id = devid / (s->dt.page_sz / L1TABLE_ENTRY_SIZE); | ||
218 | + | ||
219 | + value = address_space_ldq_le(as, | ||
220 | + s->dt.base_addr + | ||
221 | + (l2t_id * L1TABLE_ENTRY_SIZE), | ||
222 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
223 | + | ||
224 | + if (res != MEMTX_OK) { | ||
225 | + return false; | ||
226 | + } | ||
227 | + | ||
228 | + valid_l2t = (value & L2_TABLE_VALID_MASK) != 0; | ||
229 | + | ||
230 | + if (valid_l2t) { | ||
231 | + max_l2_entries = s->dt.page_sz / s->dt.entry_sz; | ||
232 | + | ||
233 | + l2t_addr = value & ((1ULL << 51) - 1); | ||
234 | + | ||
235 | + address_space_stq_le(as, l2t_addr + | ||
236 | + ((devid % max_l2_entries) * GITS_DTE_SIZE), | ||
237 | + dte, MEMTXATTRS_UNSPECIFIED, &res); | ||
238 | + } | ||
239 | + } else { | ||
240 | + /* Flat level table */ | ||
241 | + address_space_stq_le(as, s->dt.base_addr + (devid * GITS_DTE_SIZE), | ||
242 | + dte, MEMTXATTRS_UNSPECIFIED, &res); | ||
243 | + } | ||
244 | + if (res != MEMTX_OK) { | ||
110 | + return false; | 245 | + return false; |
111 | + } | 246 | + } else { |
112 | + if (!dc_isar_feature(aa32_mve, s) || | ||
113 | + !arm_dc_feature(s, ARM_FEATURE_M_MAIN) || | ||
114 | + a->rda == 13 || a->rda == 15 || a->rm == 13 || a->rm == 15 || | ||
115 | + a->rm == a->rda) { | ||
116 | + /* These rda/rm cases are UNPREDICTABLE; we choose to UNDEF */ | ||
117 | + unallocated_encoding(s); | ||
118 | + return true; | 247 | + return true; |
119 | + } | 248 | + } |
120 | + | ||
121 | + /* The helper takes care of the sign-extension of the low 8 bits of Rm */ | ||
122 | + fn(cpu_R[a->rda], cpu_env, cpu_R[a->rda], cpu_R[a->rm]); | ||
123 | + return true; | ||
124 | +} | 249 | +} |
125 | + | 250 | + |
126 | +static bool trans_SQRSHR_rr(DisasContext *s, arg_mve_sh_rr *a) | 251 | +static bool process_mapd(GICv3ITSState *s, uint64_t value, uint32_t offset) |
127 | +{ | 252 | +{ |
128 | + return do_mve_sh_rr(s, a, gen_helper_mve_sqrshr); | 253 | + AddressSpace *as = &s->gicv3->dma_as; |
254 | + uint32_t devid; | ||
255 | + uint8_t size; | ||
256 | + uint64_t itt_addr; | ||
257 | + bool valid; | ||
258 | + MemTxResult res = MEMTX_OK; | ||
259 | + bool result = false; | ||
260 | + | ||
261 | + devid = ((value & DEVID_MASK) >> DEVID_SHIFT); | ||
262 | + | ||
263 | + offset += NUM_BYTES_IN_DW; | ||
264 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
265 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
266 | + | ||
267 | + if (res != MEMTX_OK) { | ||
268 | + return result; | ||
269 | + } | ||
270 | + | ||
271 | + size = (value & SIZE_MASK); | ||
272 | + | ||
273 | + offset += NUM_BYTES_IN_DW; | ||
274 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
275 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
276 | + | ||
277 | + if (res != MEMTX_OK) { | ||
278 | + return result; | ||
279 | + } | ||
280 | + | ||
281 | + itt_addr = (value & ITTADDR_MASK) >> ITTADDR_SHIFT; | ||
282 | + | ||
283 | + valid = (value & CMD_FIELD_VALID_MASK); | ||
284 | + | ||
285 | + if ((devid > s->dt.maxids.max_devids) || | ||
286 | + (size > FIELD_EX64(s->typer, GITS_TYPER, IDBITS))) { | ||
287 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
288 | + "ITS MAPD: invalid device table attributes " | ||
289 | + "devid %d or size %d\n", devid, size); | ||
290 | + /* | ||
291 | + * in this implementation, in case of error | ||
292 | + * we ignore this command and move onto the next | ||
293 | + * command in the queue | ||
294 | + */ | ||
295 | + } else { | ||
296 | + result = update_dte(s, devid, valid, size, itt_addr); | ||
297 | + } | ||
298 | + | ||
299 | + return result; | ||
129 | +} | 300 | +} |
130 | + | 301 | + |
131 | +static bool trans_UQRSHL_rr(DisasContext *s, arg_mve_sh_rr *a) | 302 | +/* |
303 | + * Current implementation blocks until all | ||
304 | + * commands are processed | ||
305 | + */ | ||
306 | +static void process_cmdq(GICv3ITSState *s) | ||
132 | +{ | 307 | +{ |
133 | + return do_mve_sh_rr(s, a, gen_helper_mve_uqrshl); | 308 | + uint32_t wr_offset = 0; |
309 | + uint32_t rd_offset = 0; | ||
310 | + uint32_t cq_offset = 0; | ||
311 | + uint64_t data; | ||
312 | + AddressSpace *as = &s->gicv3->dma_as; | ||
313 | + MemTxResult res = MEMTX_OK; | ||
314 | + bool result = true; | ||
315 | + uint8_t cmd; | ||
316 | + | ||
317 | + if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
318 | + return; | ||
319 | + } | ||
320 | + | ||
321 | + wr_offset = FIELD_EX64(s->cwriter, GITS_CWRITER, OFFSET); | ||
322 | + | ||
323 | + if (wr_offset > s->cq.max_entries) { | ||
324 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
325 | + "%s: invalid write offset " | ||
326 | + "%d\n", __func__, wr_offset); | ||
327 | + return; | ||
328 | + } | ||
329 | + | ||
330 | + rd_offset = FIELD_EX64(s->creadr, GITS_CREADR, OFFSET); | ||
331 | + | ||
332 | + if (rd_offset > s->cq.max_entries) { | ||
333 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
334 | + "%s: invalid read offset " | ||
335 | + "%d\n", __func__, rd_offset); | ||
336 | + return; | ||
337 | + } | ||
338 | + | ||
339 | + while (wr_offset != rd_offset) { | ||
340 | + cq_offset = (rd_offset * GITS_CMDQ_ENTRY_SIZE); | ||
341 | + data = address_space_ldq_le(as, s->cq.base_addr + cq_offset, | ||
342 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
343 | + if (res != MEMTX_OK) { | ||
344 | + result = false; | ||
345 | + } | ||
346 | + cmd = (data & CMD_MASK); | ||
347 | + | ||
348 | + switch (cmd) { | ||
349 | + case GITS_CMD_INT: | ||
350 | + break; | ||
351 | + case GITS_CMD_CLEAR: | ||
352 | + break; | ||
353 | + case GITS_CMD_SYNC: | ||
354 | + /* | ||
355 | + * Current implementation makes a blocking synchronous call | ||
356 | + * for every command issued earlier, hence the internal state | ||
357 | + * is already consistent by the time SYNC command is executed. | ||
358 | + * Hence no further processing is required for SYNC command. | ||
359 | + */ | ||
360 | + break; | ||
361 | + case GITS_CMD_MAPD: | ||
362 | + result = process_mapd(s, data, cq_offset); | ||
363 | + break; | ||
364 | + case GITS_CMD_MAPC: | ||
365 | + result = process_mapc(s, cq_offset); | ||
366 | + break; | ||
367 | + case GITS_CMD_MAPTI: | ||
368 | + break; | ||
369 | + case GITS_CMD_MAPI: | ||
370 | + break; | ||
371 | + case GITS_CMD_DISCARD: | ||
372 | + break; | ||
373 | + case GITS_CMD_INV: | ||
374 | + case GITS_CMD_INVALL: | ||
375 | + break; | ||
376 | + default: | ||
377 | + break; | ||
378 | + } | ||
379 | + if (result) { | ||
380 | + rd_offset++; | ||
381 | + rd_offset %= s->cq.max_entries; | ||
382 | + s->creadr = FIELD_DP64(s->creadr, GITS_CREADR, OFFSET, rd_offset); | ||
383 | + } else { | ||
384 | + /* | ||
385 | + * in this implementation, in case of dma read/write error | ||
386 | + * we stall the command processing | ||
387 | + */ | ||
388 | + s->creadr = FIELD_DP64(s->creadr, GITS_CREADR, STALLED, 1); | ||
389 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
390 | + "%s: %x cmd processing failed\n", __func__, cmd); | ||
391 | + break; | ||
392 | + } | ||
393 | + } | ||
134 | +} | 394 | +} |
135 | + | 395 | + |
136 | /* | 396 | /* |
137 | * Multiply and multiply accumulate | 397 | * This function extracts the ITS Device and Collection table specific |
138 | */ | 398 | * parameters (like base_addr, size etc) from GITS_BASER register. |
399 | @@ -XXX,XX +XXX,XX @@ static bool its_writel(GICv3ITSState *s, hwaddr offset, | ||
400 | extract_table_params(s); | ||
401 | extract_cmdq_params(s); | ||
402 | s->creadr = 0; | ||
403 | + process_cmdq(s); | ||
404 | } | ||
405 | break; | ||
406 | case GITS_CBASER: | ||
407 | @@ -XXX,XX +XXX,XX @@ static bool its_writel(GICv3ITSState *s, hwaddr offset, | ||
408 | case GITS_CWRITER: | ||
409 | s->cwriter = deposit64(s->cwriter, 0, 32, | ||
410 | (value & ~R_GITS_CWRITER_RETRY_MASK)); | ||
411 | + if (s->cwriter != s->creadr) { | ||
412 | + process_cmdq(s); | ||
413 | + } | ||
414 | break; | ||
415 | case GITS_CWRITER + 4: | ||
416 | s->cwriter = deposit64(s->cwriter, 32, 32, value); | ||
417 | @@ -XXX,XX +XXX,XX @@ static bool its_writell(GICv3ITSState *s, hwaddr offset, | ||
418 | break; | ||
419 | case GITS_CWRITER: | ||
420 | s->cwriter = value & ~R_GITS_CWRITER_RETRY_MASK; | ||
421 | + if (s->cwriter != s->creadr) { | ||
422 | + process_cmdq(s); | ||
423 | + } | ||
424 | break; | ||
425 | case GITS_CREADR: | ||
426 | if (s->gicv3->gicd_ctlr & GICD_CTLR_DS) { | ||
139 | -- | 427 | -- |
140 | 2.20.1 | 428 | 2.20.1 |
141 | 429 | ||
142 | 430 | diff view generated by jsdifflib |
1 | Implement the MVE logical-immediate insns (VMOV, VMVN, | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | VORR and VBIC). These have essentially the same encoding | ||
3 | as their Neon equivalents, and we implement the decode | ||
4 | in the same way. | ||
5 | 2 | ||
3 | Added ITS command queue handling for MAPTI,MAPI commands,handled ITS | ||
4 | translation which triggers an LPI via INT command as well as write | ||
5 | to GITS_TRANSLATER register,defined enum to differentiate between ITS | ||
6 | command interrupt trigger and GITS_TRANSLATER based interrupt trigger. | ||
7 | Each of these commands make use of other functionalities implemented to | ||
8 | get device table entry,collection table entry or interrupt translation | ||
9 | table entry required for their processing. | ||
10 | |||
11 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | Message-id: 20210910143951.92242-5-shashi.mallela@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20210628135835.6690-7-peter.maydell@linaro.org | ||
9 | --- | 15 | --- |
10 | target/arm/helper-mve.h | 4 +++ | 16 | hw/intc/gicv3_internal.h | 12 + |
11 | target/arm/mve.decode | 17 +++++++++++++ | 17 | include/hw/intc/arm_gicv3_common.h | 2 + |
12 | target/arm/mve_helper.c | 24 ++++++++++++++++++ | 18 | hw/intc/arm_gicv3_its.c | 365 ++++++++++++++++++++++++++++- |
13 | target/arm/translate-mve.c | 50 ++++++++++++++++++++++++++++++++++++++ | 19 | 3 files changed, 378 insertions(+), 1 deletion(-) |
14 | 4 files changed, 95 insertions(+) | ||
15 | 20 | ||
16 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 21 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
17 | index XXXXXXX..XXXXXXX 100644 | 22 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-mve.h | 23 | --- a/hw/intc/gicv3_internal.h |
19 | +++ b/target/arm/helper-mve.h | 24 | +++ b/hw/intc/gicv3_internal.h |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_vaddvsh, TCG_CALL_NO_WG, i32, env, ptr, i32) | 25 | @@ -XXX,XX +XXX,XX @@ FIELD(MAPC, RDBASE, 16, 32) |
21 | DEF_HELPER_FLAGS_3(mve_vaddvuh, TCG_CALL_NO_WG, i32, env, ptr, i32) | 26 | #define ITTADDR_MASK MAKE_64BIT_MASK(ITTADDR_SHIFT, ITTADDR_LENGTH) |
22 | DEF_HELPER_FLAGS_3(mve_vaddvsw, TCG_CALL_NO_WG, i32, env, ptr, i32) | 27 | #define SIZE_MASK 0x1f |
23 | DEF_HELPER_FLAGS_3(mve_vaddvuw, TCG_CALL_NO_WG, i32, env, ptr, i32) | 28 | |
24 | + | 29 | +/* MAPI command fields */ |
25 | +DEF_HELPER_FLAGS_3(mve_vmovi, TCG_CALL_NO_WG, void, env, ptr, i64) | 30 | +#define EVENTID_MASK ((1ULL << 32) - 1) |
26 | +DEF_HELPER_FLAGS_3(mve_vandi, TCG_CALL_NO_WG, void, env, ptr, i64) | 31 | + |
27 | +DEF_HELPER_FLAGS_3(mve_vorri, TCG_CALL_NO_WG, void, env, ptr, i64) | 32 | +/* MAPTI command fields */ |
28 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | 33 | +#define pINTID_SHIFT 32 |
34 | +#define pINTID_MASK MAKE_64BIT_MASK(32, 32) | ||
35 | + | ||
36 | #define DEVID_SHIFT 32 | ||
37 | #define DEVID_MASK MAKE_64BIT_MASK(32, 32) | ||
38 | |||
39 | @@ -XXX,XX +XXX,XX @@ FIELD(MAPC, RDBASE, 16, 32) | ||
40 | * Values: | vPEID | ICID | | ||
41 | */ | ||
42 | #define ITS_ITT_ENTRY_SIZE 0xC | ||
43 | +#define ITE_ENTRY_INTTYPE_SHIFT 1 | ||
44 | +#define ITE_ENTRY_INTID_SHIFT 2 | ||
45 | +#define ITE_ENTRY_INTID_MASK MAKE_64BIT_MASK(2, 24) | ||
46 | +#define ITE_ENTRY_INTSP_SHIFT 26 | ||
47 | +#define ITE_ENTRY_ICID_MASK MAKE_64BIT_MASK(0, 16) | ||
48 | |||
49 | /* 16 bits EventId */ | ||
50 | #define ITS_IDBITS GICD_TYPER_IDBITS | ||
51 | diff --git a/include/hw/intc/arm_gicv3_common.h b/include/hw/intc/arm_gicv3_common.h | ||
29 | index XXXXXXX..XXXXXXX 100644 | 52 | index XXXXXXX..XXXXXXX 100644 |
30 | --- a/target/arm/mve.decode | 53 | --- a/include/hw/intc/arm_gicv3_common.h |
31 | +++ b/target/arm/mve.decode | 54 | +++ b/include/hw/intc/arm_gicv3_common.h |
32 | @@ -XXX,XX +XXX,XX @@ | 55 | @@ -XXX,XX +XXX,XX @@ |
33 | # VQDMULL has size in bit 28: 0 for 16 bit, 1 for 32 bit | 56 | #define GICV3_MAXIRQ 1020 |
34 | %size_28 28:1 !function=plus_1 | 57 | #define GICV3_MAXSPI (GICV3_MAXIRQ - GIC_INTERNAL) |
35 | 58 | ||
36 | +# 1imm format immediate | 59 | +#define GICV3_LPI_INTID_START 8192 |
37 | +%imm_28_16_0 28:1 16:3 0:4 | 60 | + |
38 | + | 61 | #define GICV3_REDIST_SIZE 0x20000 |
39 | &vldr_vstr rn qd imm p a w size l u | 62 | |
40 | &1op qd qm size | 63 | /* Number of SGI target-list bits */ |
41 | &2op qd qm qn size | 64 | diff --git a/hw/intc/arm_gicv3_its.c b/hw/intc/arm_gicv3_its.c |
42 | &2scalar qd qn rm size | ||
43 | +&1imm qd imm cmode op | ||
44 | |||
45 | @vldr_vstr ....... . . . . l:1 rn:4 ... ...... imm:7 &vldr_vstr qd=%qd u=0 | ||
46 | # Note that both Rn and Qd are 3 bits only (no D bit) | ||
47 | @@ -XXX,XX +XXX,XX @@ | ||
48 | @2op_nosz .... .... .... .... .... .... .... .... &2op qd=%qd qm=%qm qn=%qn size=0 | ||
49 | @2op_sz28 .... .... .... .... .... .... .... .... &2op qd=%qd qm=%qm qn=%qn \ | ||
50 | size=%size_28 | ||
51 | +@1imm .... .... .... .... .... cmode:4 .. op:1 . .... &1imm qd=%qd imm=%imm_28_16_0 | ||
52 | |||
53 | # The _rev suffix indicates that Vn and Vm are reversed. This is | ||
54 | # the case for shifts. In the Arm ARM these insns are documented | ||
55 | @@ -XXX,XX +XXX,XX @@ VADDV 111 u:1 1110 1111 size:2 01 ... 0 1111 0 0 a:1 0 qm:3 0 rda=%rd | ||
56 | # Predicate operations | ||
57 | %mask_22_13 22:1 13:3 | ||
58 | VPST 1111 1110 0 . 11 000 1 ... 0 1111 0100 1101 mask=%mask_22_13 | ||
59 | + | ||
60 | +# Logical immediate operations (1 reg and modified-immediate) | ||
61 | + | ||
62 | +# The cmode/op bits here decode VORR/VBIC/VMOV/VMVN, but | ||
63 | +# not in a way we can conveniently represent in decodetree without | ||
64 | +# a lot of repetition: | ||
65 | +# VORR: op=0, (cmode & 1) && cmode < 12 | ||
66 | +# VBIC: op=1, (cmode & 1) && cmode < 12 | ||
67 | +# VMOV: everything else | ||
68 | +# So we have a single decode line and check the cmode/op in the | ||
69 | +# trans function. | ||
70 | +Vimm_1r 111 . 1111 1 . 00 0 ... ... 0 .... 0 1 . 1 .... @1imm | ||
71 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
72 | index XXXXXXX..XXXXXXX 100644 | 65 | index XXXXXXX..XXXXXXX 100644 |
73 | --- a/target/arm/mve_helper.c | 66 | --- a/hw/intc/arm_gicv3_its.c |
74 | +++ b/target/arm/mve_helper.c | 67 | +++ b/hw/intc/arm_gicv3_its.c |
75 | @@ -XXX,XX +XXX,XX @@ DO_1OP(vnegw, 4, int32_t, DO_NEG) | 68 | @@ -XXX,XX +XXX,XX @@ struct GICv3ITSClass { |
76 | DO_1OP(vfnegh, 8, uint64_t, DO_FNEGH) | 69 | void (*parent_reset)(DeviceState *dev); |
77 | DO_1OP(vfnegs, 8, uint64_t, DO_FNEGS) | 70 | }; |
78 | 71 | ||
79 | +/* | 72 | +/* |
80 | + * 1 operand immediates: Vda is destination and possibly also one source. | 73 | + * This is an internal enum used to distinguish between LPI triggered |
81 | + * All these insns work at 64-bit widths. | 74 | + * via command queue and LPI triggered via gits_translater write. |
82 | + */ | 75 | + */ |
83 | +#define DO_1OP_IMM(OP, FN) \ | 76 | +typedef enum ItsCmdType { |
84 | + void HELPER(mve_##OP)(CPUARMState *env, void *vda, uint64_t imm) \ | 77 | + NONE = 0, /* internal indication for GITS_TRANSLATER write */ |
85 | + { \ | 78 | + CLEAR = 1, |
86 | + uint64_t *da = vda; \ | 79 | + DISCARD = 2, |
87 | + uint16_t mask = mve_element_mask(env); \ | 80 | + INT = 3, |
88 | + unsigned e; \ | 81 | +} ItsCmdType; |
89 | + for (e = 0; e < 16 / 8; e++, mask >>= 8) { \ | 82 | + |
90 | + mergemask(&da[H8(e)], FN(da[H8(e)], imm), mask); \ | 83 | +typedef struct { |
91 | + } \ | 84 | + uint32_t iteh; |
92 | + mve_advance_vpt(env); \ | 85 | + uint64_t itel; |
93 | + } | 86 | +} IteEntry; |
94 | + | 87 | + |
95 | +#define DO_MOVI(N, I) (I) | 88 | static uint64_t baser_base_addr(uint64_t value, uint32_t page_sz) |
96 | +#define DO_ANDI(N, I) ((N) & (I)) | 89 | { |
97 | +#define DO_ORRI(N, I) ((N) | (I)) | 90 | uint64_t result = 0; |
98 | + | 91 | @@ -XXX,XX +XXX,XX @@ static uint64_t baser_base_addr(uint64_t value, uint32_t page_sz) |
99 | +DO_1OP_IMM(vmovi, DO_MOVI) | 92 | return result; |
100 | +DO_1OP_IMM(vandi, DO_ANDI) | ||
101 | +DO_1OP_IMM(vorri, DO_ORRI) | ||
102 | + | ||
103 | #define DO_2OP(OP, ESIZE, TYPE, FN) \ | ||
104 | void HELPER(glue(mve_, OP))(CPUARMState *env, \ | ||
105 | void *vd, void *vn, void *vm) \ | ||
106 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
107 | index XXXXXXX..XXXXXXX 100644 | ||
108 | --- a/target/arm/translate-mve.c | ||
109 | +++ b/target/arm/translate-mve.c | ||
110 | @@ -XXX,XX +XXX,XX @@ typedef void MVEGenTwoOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr); | ||
111 | typedef void MVEGenTwoOpScalarFn(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
112 | typedef void MVEGenDualAccOpFn(TCGv_i64, TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i64); | ||
113 | typedef void MVEGenVADDVFn(TCGv_i32, TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
114 | +typedef void MVEGenOneOpImmFn(TCGv_ptr, TCGv_ptr, TCGv_i64); | ||
115 | |||
116 | /* Return the offset of a Qn register (same semantics as aa32_vfp_qreg()) */ | ||
117 | static inline long mve_qreg_offset(unsigned reg) | ||
118 | @@ -XXX,XX +XXX,XX @@ static bool trans_VADDV(DisasContext *s, arg_VADDV *a) | ||
119 | mve_update_eci(s); | ||
120 | return true; | ||
121 | } | 93 | } |
122 | + | 94 | |
123 | +static bool do_1imm(DisasContext *s, arg_1imm *a, MVEGenOneOpImmFn *fn) | 95 | +static bool get_cte(GICv3ITSState *s, uint16_t icid, uint64_t *cte, |
124 | +{ | 96 | + MemTxResult *res) |
125 | + TCGv_ptr qd; | 97 | +{ |
126 | + uint64_t imm; | 98 | + AddressSpace *as = &s->gicv3->dma_as; |
127 | + | 99 | + uint64_t l2t_addr; |
128 | + if (!dc_isar_feature(aa32_mve, s) || | 100 | + uint64_t value; |
129 | + !mve_check_qreg_bank(s, a->qd) || | 101 | + bool valid_l2t; |
130 | + !fn) { | 102 | + uint32_t l2t_id; |
103 | + uint32_t max_l2_entries; | ||
104 | + | ||
105 | + if (s->ct.indirect) { | ||
106 | + l2t_id = icid / (s->ct.page_sz / L1TABLE_ENTRY_SIZE); | ||
107 | + | ||
108 | + value = address_space_ldq_le(as, | ||
109 | + s->ct.base_addr + | ||
110 | + (l2t_id * L1TABLE_ENTRY_SIZE), | ||
111 | + MEMTXATTRS_UNSPECIFIED, res); | ||
112 | + | ||
113 | + if (*res == MEMTX_OK) { | ||
114 | + valid_l2t = (value & L2_TABLE_VALID_MASK) != 0; | ||
115 | + | ||
116 | + if (valid_l2t) { | ||
117 | + max_l2_entries = s->ct.page_sz / s->ct.entry_sz; | ||
118 | + | ||
119 | + l2t_addr = value & ((1ULL << 51) - 1); | ||
120 | + | ||
121 | + *cte = address_space_ldq_le(as, l2t_addr + | ||
122 | + ((icid % max_l2_entries) * GITS_CTE_SIZE), | ||
123 | + MEMTXATTRS_UNSPECIFIED, res); | ||
124 | + } | ||
125 | + } | ||
126 | + } else { | ||
127 | + /* Flat level table */ | ||
128 | + *cte = address_space_ldq_le(as, s->ct.base_addr + | ||
129 | + (icid * GITS_CTE_SIZE), | ||
130 | + MEMTXATTRS_UNSPECIFIED, res); | ||
131 | + } | ||
132 | + | ||
133 | + return (*cte & TABLE_ENTRY_VALID_MASK) != 0; | ||
134 | +} | ||
135 | + | ||
136 | +static bool update_ite(GICv3ITSState *s, uint32_t eventid, uint64_t dte, | ||
137 | + IteEntry ite) | ||
138 | +{ | ||
139 | + AddressSpace *as = &s->gicv3->dma_as; | ||
140 | + uint64_t itt_addr; | ||
141 | + MemTxResult res = MEMTX_OK; | ||
142 | + | ||
143 | + itt_addr = (dte & GITS_DTE_ITTADDR_MASK) >> GITS_DTE_ITTADDR_SHIFT; | ||
144 | + itt_addr <<= ITTADDR_SHIFT; /* 256 byte aligned */ | ||
145 | + | ||
146 | + address_space_stq_le(as, itt_addr + (eventid * (sizeof(uint64_t) + | ||
147 | + sizeof(uint32_t))), ite.itel, MEMTXATTRS_UNSPECIFIED, | ||
148 | + &res); | ||
149 | + | ||
150 | + if (res == MEMTX_OK) { | ||
151 | + address_space_stl_le(as, itt_addr + (eventid * (sizeof(uint64_t) + | ||
152 | + sizeof(uint32_t))) + sizeof(uint32_t), ite.iteh, | ||
153 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
154 | + } | ||
155 | + if (res != MEMTX_OK) { | ||
131 | + return false; | 156 | + return false; |
132 | + } | 157 | + } else { |
133 | + if (!mve_eci_check(s) || !vfp_access_check(s)) { | ||
134 | + return true; | 158 | + return true; |
135 | + } | 159 | + } |
136 | + | 160 | +} |
137 | + imm = asimd_imm_const(a->imm, a->cmode, a->op); | 161 | + |
138 | + | 162 | +static bool get_ite(GICv3ITSState *s, uint32_t eventid, uint64_t dte, |
139 | + qd = mve_qreg_ptr(a->qd); | 163 | + uint16_t *icid, uint32_t *pIntid, MemTxResult *res) |
140 | + fn(cpu_env, qd, tcg_constant_i64(imm)); | 164 | +{ |
141 | + tcg_temp_free_ptr(qd); | 165 | + AddressSpace *as = &s->gicv3->dma_as; |
142 | + mve_update_eci(s); | 166 | + uint64_t itt_addr; |
143 | + return true; | 167 | + bool status = false; |
144 | +} | 168 | + IteEntry ite = {}; |
145 | + | 169 | + |
146 | +static bool trans_Vimm_1r(DisasContext *s, arg_1imm *a) | 170 | + itt_addr = (dte & GITS_DTE_ITTADDR_MASK) >> GITS_DTE_ITTADDR_SHIFT; |
147 | +{ | 171 | + itt_addr <<= ITTADDR_SHIFT; /* 256 byte aligned */ |
148 | + /* Handle decode of cmode/op here between VORR/VBIC/VMOV */ | 172 | + |
149 | + MVEGenOneOpImmFn *fn; | 173 | + ite.itel = address_space_ldq_le(as, itt_addr + |
150 | + | 174 | + (eventid * (sizeof(uint64_t) + |
151 | + if ((a->cmode & 1) && a->cmode < 12) { | 175 | + sizeof(uint32_t))), MEMTXATTRS_UNSPECIFIED, |
152 | + if (a->op) { | 176 | + res); |
153 | + /* | 177 | + |
154 | + * For op=1, the immediate will be inverted by asimd_imm_const(), | 178 | + if (*res == MEMTX_OK) { |
155 | + * so the VBIC becomes a logical AND operation. | 179 | + ite.iteh = address_space_ldl_le(as, itt_addr + |
156 | + */ | 180 | + (eventid * (sizeof(uint64_t) + |
157 | + fn = gen_helper_mve_vandi; | 181 | + sizeof(uint32_t))) + sizeof(uint32_t), |
182 | + MEMTXATTRS_UNSPECIFIED, res); | ||
183 | + | ||
184 | + if (*res == MEMTX_OK) { | ||
185 | + if (ite.itel & TABLE_ENTRY_VALID_MASK) { | ||
186 | + if ((ite.itel >> ITE_ENTRY_INTTYPE_SHIFT) & | ||
187 | + GITS_TYPE_PHYSICAL) { | ||
188 | + *pIntid = (ite.itel & ITE_ENTRY_INTID_MASK) >> | ||
189 | + ITE_ENTRY_INTID_SHIFT; | ||
190 | + *icid = ite.iteh & ITE_ENTRY_ICID_MASK; | ||
191 | + status = true; | ||
192 | + } | ||
193 | + } | ||
194 | + } | ||
195 | + } | ||
196 | + return status; | ||
197 | +} | ||
198 | + | ||
199 | +static uint64_t get_dte(GICv3ITSState *s, uint32_t devid, MemTxResult *res) | ||
200 | +{ | ||
201 | + AddressSpace *as = &s->gicv3->dma_as; | ||
202 | + uint64_t l2t_addr; | ||
203 | + uint64_t value; | ||
204 | + bool valid_l2t; | ||
205 | + uint32_t l2t_id; | ||
206 | + uint32_t max_l2_entries; | ||
207 | + | ||
208 | + if (s->dt.indirect) { | ||
209 | + l2t_id = devid / (s->dt.page_sz / L1TABLE_ENTRY_SIZE); | ||
210 | + | ||
211 | + value = address_space_ldq_le(as, | ||
212 | + s->dt.base_addr + | ||
213 | + (l2t_id * L1TABLE_ENTRY_SIZE), | ||
214 | + MEMTXATTRS_UNSPECIFIED, res); | ||
215 | + | ||
216 | + if (*res == MEMTX_OK) { | ||
217 | + valid_l2t = (value & L2_TABLE_VALID_MASK) != 0; | ||
218 | + | ||
219 | + if (valid_l2t) { | ||
220 | + max_l2_entries = s->dt.page_sz / s->dt.entry_sz; | ||
221 | + | ||
222 | + l2t_addr = value & ((1ULL << 51) - 1); | ||
223 | + | ||
224 | + value = address_space_ldq_le(as, l2t_addr + | ||
225 | + ((devid % max_l2_entries) * GITS_DTE_SIZE), | ||
226 | + MEMTXATTRS_UNSPECIFIED, res); | ||
227 | + } | ||
228 | + } | ||
229 | + } else { | ||
230 | + /* Flat level table */ | ||
231 | + value = address_space_ldq_le(as, s->dt.base_addr + | ||
232 | + (devid * GITS_DTE_SIZE), | ||
233 | + MEMTXATTRS_UNSPECIFIED, res); | ||
234 | + } | ||
235 | + | ||
236 | + return value; | ||
237 | +} | ||
238 | + | ||
239 | +/* | ||
240 | + * This function handles the processing of following commands based on | ||
241 | + * the ItsCmdType parameter passed:- | ||
242 | + * 1. triggering of lpi interrupt translation via ITS INT command | ||
243 | + * 2. triggering of lpi interrupt translation via gits_translater register | ||
244 | + * 3. handling of ITS CLEAR command | ||
245 | + * 4. handling of ITS DISCARD command | ||
246 | + */ | ||
247 | +static bool process_its_cmd(GICv3ITSState *s, uint64_t value, uint32_t offset, | ||
248 | + ItsCmdType cmd) | ||
249 | +{ | ||
250 | + AddressSpace *as = &s->gicv3->dma_as; | ||
251 | + uint32_t devid, eventid; | ||
252 | + MemTxResult res = MEMTX_OK; | ||
253 | + bool dte_valid; | ||
254 | + uint64_t dte = 0; | ||
255 | + uint32_t max_eventid; | ||
256 | + uint16_t icid = 0; | ||
257 | + uint32_t pIntid = 0; | ||
258 | + bool ite_valid = false; | ||
259 | + uint64_t cte = 0; | ||
260 | + bool cte_valid = false; | ||
261 | + bool result = false; | ||
262 | + | ||
263 | + if (cmd == NONE) { | ||
264 | + devid = offset; | ||
265 | + } else { | ||
266 | + devid = ((value & DEVID_MASK) >> DEVID_SHIFT); | ||
267 | + | ||
268 | + offset += NUM_BYTES_IN_DW; | ||
269 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
270 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
271 | + } | ||
272 | + | ||
273 | + if (res != MEMTX_OK) { | ||
274 | + return result; | ||
275 | + } | ||
276 | + | ||
277 | + eventid = (value & EVENTID_MASK); | ||
278 | + | ||
279 | + dte = get_dte(s, devid, &res); | ||
280 | + | ||
281 | + if (res != MEMTX_OK) { | ||
282 | + return result; | ||
283 | + } | ||
284 | + dte_valid = dte & TABLE_ENTRY_VALID_MASK; | ||
285 | + | ||
286 | + if (dte_valid) { | ||
287 | + max_eventid = (1UL << (((dte >> 1U) & SIZE_MASK) + 1)); | ||
288 | + | ||
289 | + ite_valid = get_ite(s, eventid, dte, &icid, &pIntid, &res); | ||
290 | + | ||
291 | + if (res != MEMTX_OK) { | ||
292 | + return result; | ||
293 | + } | ||
294 | + | ||
295 | + if (ite_valid) { | ||
296 | + cte_valid = get_cte(s, icid, &cte, &res); | ||
297 | + } | ||
298 | + | ||
299 | + if (res != MEMTX_OK) { | ||
300 | + return result; | ||
301 | + } | ||
302 | + } | ||
303 | + | ||
304 | + if ((devid > s->dt.maxids.max_devids) || !dte_valid || !ite_valid || | ||
305 | + !cte_valid || (eventid > max_eventid)) { | ||
306 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
307 | + "%s: invalid command attributes " | ||
308 | + "devid %d or eventid %d or invalid dte %d or" | ||
309 | + "invalid cte %d or invalid ite %d\n", | ||
310 | + __func__, devid, eventid, dte_valid, cte_valid, | ||
311 | + ite_valid); | ||
312 | + /* | ||
313 | + * in this implementation, in case of error | ||
314 | + * we ignore this command and move onto the next | ||
315 | + * command in the queue | ||
316 | + */ | ||
317 | + } else { | ||
318 | + /* | ||
319 | + * Current implementation only supports rdbase == procnum | ||
320 | + * Hence rdbase physical address is ignored | ||
321 | + */ | ||
322 | + if (cmd == DISCARD) { | ||
323 | + IteEntry ite = {}; | ||
324 | + /* remove mapping from interrupt translation table */ | ||
325 | + result = update_ite(s, eventid, dte, ite); | ||
326 | + } | ||
327 | + } | ||
328 | + | ||
329 | + return result; | ||
330 | +} | ||
331 | + | ||
332 | +static bool process_mapti(GICv3ITSState *s, uint64_t value, uint32_t offset, | ||
333 | + bool ignore_pInt) | ||
334 | +{ | ||
335 | + AddressSpace *as = &s->gicv3->dma_as; | ||
336 | + uint32_t devid, eventid; | ||
337 | + uint32_t pIntid = 0; | ||
338 | + uint32_t max_eventid, max_Intid; | ||
339 | + bool dte_valid; | ||
340 | + MemTxResult res = MEMTX_OK; | ||
341 | + uint16_t icid = 0; | ||
342 | + uint64_t dte = 0; | ||
343 | + IteEntry ite; | ||
344 | + uint32_t int_spurious = INTID_SPURIOUS; | ||
345 | + bool result = false; | ||
346 | + | ||
347 | + devid = ((value & DEVID_MASK) >> DEVID_SHIFT); | ||
348 | + offset += NUM_BYTES_IN_DW; | ||
349 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
350 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
351 | + | ||
352 | + if (res != MEMTX_OK) { | ||
353 | + return result; | ||
354 | + } | ||
355 | + | ||
356 | + eventid = (value & EVENTID_MASK); | ||
357 | + | ||
358 | + if (!ignore_pInt) { | ||
359 | + pIntid = ((value & pINTID_MASK) >> pINTID_SHIFT); | ||
360 | + } | ||
361 | + | ||
362 | + offset += NUM_BYTES_IN_DW; | ||
363 | + value = address_space_ldq_le(as, s->cq.base_addr + offset, | ||
364 | + MEMTXATTRS_UNSPECIFIED, &res); | ||
365 | + | ||
366 | + if (res != MEMTX_OK) { | ||
367 | + return result; | ||
368 | + } | ||
369 | + | ||
370 | + icid = value & ICID_MASK; | ||
371 | + | ||
372 | + dte = get_dte(s, devid, &res); | ||
373 | + | ||
374 | + if (res != MEMTX_OK) { | ||
375 | + return result; | ||
376 | + } | ||
377 | + dte_valid = dte & TABLE_ENTRY_VALID_MASK; | ||
378 | + | ||
379 | + max_eventid = (1UL << (((dte >> 1U) & SIZE_MASK) + 1)); | ||
380 | + | ||
381 | + if (!ignore_pInt) { | ||
382 | + max_Intid = (1ULL << (GICD_TYPER_IDBITS + 1)) - 1; | ||
383 | + } | ||
384 | + | ||
385 | + if ((devid > s->dt.maxids.max_devids) || (icid > s->ct.maxids.max_collids) | ||
386 | + || !dte_valid || (eventid > max_eventid) || | ||
387 | + (!ignore_pInt && (((pIntid < GICV3_LPI_INTID_START) || | ||
388 | + (pIntid > max_Intid)) && (pIntid != INTID_SPURIOUS)))) { | ||
389 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
390 | + "%s: invalid command attributes " | ||
391 | + "devid %d or icid %d or eventid %d or pIntid %d or" | ||
392 | + "unmapped dte %d\n", __func__, devid, icid, eventid, | ||
393 | + pIntid, dte_valid); | ||
394 | + /* | ||
395 | + * in this implementation, in case of error | ||
396 | + * we ignore this command and move onto the next | ||
397 | + * command in the queue | ||
398 | + */ | ||
399 | + } else { | ||
400 | + /* add ite entry to interrupt translation table */ | ||
401 | + ite.itel = (dte_valid & TABLE_ENTRY_VALID_MASK) | | ||
402 | + (GITS_TYPE_PHYSICAL << ITE_ENTRY_INTTYPE_SHIFT); | ||
403 | + | ||
404 | + if (ignore_pInt) { | ||
405 | + ite.itel |= (eventid << ITE_ENTRY_INTID_SHIFT); | ||
158 | + } else { | 406 | + } else { |
159 | + fn = gen_helper_mve_vorri; | 407 | + ite.itel |= (pIntid << ITE_ENTRY_INTID_SHIFT); |
160 | + } | 408 | + } |
161 | + } else { | 409 | + ite.itel |= (int_spurious << ITE_ENTRY_INTSP_SHIFT); |
162 | + /* There is one unallocated cmode/op combination in this space */ | 410 | + ite.iteh = icid; |
163 | + if (a->cmode == 15 && a->op == 1) { | 411 | + |
164 | + return false; | 412 | + result = update_ite(s, eventid, dte, ite); |
165 | + } | 413 | + } |
166 | + /* asimd_imm_const() sorts out VMVNI vs VMOVI for us */ | 414 | + |
167 | + fn = gen_helper_mve_vmovi; | 415 | + return result; |
168 | + } | 416 | +} |
169 | + return do_1imm(s, a, fn); | 417 | + |
170 | +} | 418 | static bool update_cte(GICv3ITSState *s, uint16_t icid, bool valid, |
419 | uint64_t rdbase) | ||
420 | { | ||
421 | @@ -XXX,XX +XXX,XX @@ static void process_cmdq(GICv3ITSState *s) | ||
422 | |||
423 | switch (cmd) { | ||
424 | case GITS_CMD_INT: | ||
425 | + res = process_its_cmd(s, data, cq_offset, INT); | ||
426 | break; | ||
427 | case GITS_CMD_CLEAR: | ||
428 | + res = process_its_cmd(s, data, cq_offset, CLEAR); | ||
429 | break; | ||
430 | case GITS_CMD_SYNC: | ||
431 | /* | ||
432 | @@ -XXX,XX +XXX,XX @@ static void process_cmdq(GICv3ITSState *s) | ||
433 | result = process_mapc(s, cq_offset); | ||
434 | break; | ||
435 | case GITS_CMD_MAPTI: | ||
436 | + result = process_mapti(s, data, cq_offset, false); | ||
437 | break; | ||
438 | case GITS_CMD_MAPI: | ||
439 | + result = process_mapti(s, data, cq_offset, true); | ||
440 | break; | ||
441 | case GITS_CMD_DISCARD: | ||
442 | + result = process_its_cmd(s, data, cq_offset, DISCARD); | ||
443 | break; | ||
444 | case GITS_CMD_INV: | ||
445 | case GITS_CMD_INVALL: | ||
446 | @@ -XXX,XX +XXX,XX @@ static MemTxResult gicv3_its_translation_write(void *opaque, hwaddr offset, | ||
447 | uint64_t data, unsigned size, | ||
448 | MemTxAttrs attrs) | ||
449 | { | ||
450 | - return MEMTX_OK; | ||
451 | + GICv3ITSState *s = (GICv3ITSState *)opaque; | ||
452 | + bool result = true; | ||
453 | + uint32_t devid = 0; | ||
454 | + | ||
455 | + switch (offset) { | ||
456 | + case GITS_TRANSLATER: | ||
457 | + if (s->ctlr & ITS_CTLR_ENABLED) { | ||
458 | + devid = attrs.requester_id; | ||
459 | + result = process_its_cmd(s, data, devid, NONE); | ||
460 | + } | ||
461 | + break; | ||
462 | + default: | ||
463 | + break; | ||
464 | + } | ||
465 | + | ||
466 | + if (result) { | ||
467 | + return MEMTX_OK; | ||
468 | + } else { | ||
469 | + return MEMTX_ERROR; | ||
470 | + } | ||
471 | } | ||
472 | |||
473 | static bool its_writel(GICv3ITSState *s, hwaddr offset, | ||
171 | -- | 474 | -- |
172 | 2.20.1 | 475 | 2.20.1 |
173 | 476 | ||
174 | 477 | diff view generated by jsdifflib |
1 | From: Maxim Uvarov <maxim.uvarov@linaro.org> | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | qemu has 2 type of functions: shutdown and reboot. Shutdown | 3 | Added properties to enable ITS feature and define qemu system |
4 | function has to be used for machine shutdown. Otherwise we cause | 4 | address space memory in gicv3 common,setup distributor and |
5 | a reset with a bogus "cause" value, when we intended a shutdown. | 5 | redistributor registers to indicate LPI support. |
6 | 6 | ||
7 | Signed-off-by: Maxim Uvarov <maxim.uvarov@linaro.org> | 7 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> |
8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Message-id: 20210625111842.3790-3-maxim.uvarov@linaro.org | 9 | Tested-by: Neil Armstrong <narmstrong@baylibre.com> |
10 | [PMM: tweaked commit message] | 10 | Message-id: 20210910143951.92242-6-shashi.mallela@linaro.org |
11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
12 | --- | 12 | --- |
13 | hw/gpio/gpio_pwr.c | 2 +- | 13 | hw/intc/gicv3_internal.h | 2 ++ |
14 | 1 file changed, 1 insertion(+), 1 deletion(-) | 14 | include/hw/intc/arm_gicv3_common.h | 1 + |
15 | hw/intc/arm_gicv3_common.c | 12 ++++++++++++ | ||
16 | hw/intc/arm_gicv3_dist.c | 5 ++++- | ||
17 | hw/intc/arm_gicv3_redist.c | 12 +++++++++--- | ||
18 | 5 files changed, 28 insertions(+), 4 deletions(-) | ||
15 | 19 | ||
16 | diff --git a/hw/gpio/gpio_pwr.c b/hw/gpio/gpio_pwr.c | 20 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
17 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/hw/gpio/gpio_pwr.c | 22 | --- a/hw/intc/gicv3_internal.h |
19 | +++ b/hw/gpio/gpio_pwr.c | 23 | +++ b/hw/intc/gicv3_internal.h |
20 | @@ -XXX,XX +XXX,XX @@ static void gpio_pwr_reset(void *opaque, int n, int level) | 24 | @@ -XXX,XX +XXX,XX @@ |
21 | static void gpio_pwr_shutdown(void *opaque, int n, int level) | 25 | #define GICD_CTLR_E1NWF (1U << 7) |
22 | { | 26 | #define GICD_CTLR_RWP (1U << 31) |
23 | if (level) { | 27 | |
24 | - qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_SHUTDOWN); | 28 | +#define GICD_TYPER_LPIS_SHIFT 17 |
25 | + qemu_system_shutdown_request(SHUTDOWN_CAUSE_GUEST_SHUTDOWN); | 29 | + |
30 | /* 16 bits EventId */ | ||
31 | #define GICD_TYPER_IDBITS 0xf | ||
32 | |||
33 | diff --git a/include/hw/intc/arm_gicv3_common.h b/include/hw/intc/arm_gicv3_common.h | ||
34 | index XXXXXXX..XXXXXXX 100644 | ||
35 | --- a/include/hw/intc/arm_gicv3_common.h | ||
36 | +++ b/include/hw/intc/arm_gicv3_common.h | ||
37 | @@ -XXX,XX +XXX,XX @@ struct GICv3State { | ||
38 | uint32_t num_cpu; | ||
39 | uint32_t num_irq; | ||
40 | uint32_t revision; | ||
41 | + bool lpi_enable; | ||
42 | bool security_extn; | ||
43 | bool irq_reset_nonsecure; | ||
44 | bool gicd_no_migration_shift_bug; | ||
45 | diff --git a/hw/intc/arm_gicv3_common.c b/hw/intc/arm_gicv3_common.c | ||
46 | index XXXXXXX..XXXXXXX 100644 | ||
47 | --- a/hw/intc/arm_gicv3_common.c | ||
48 | +++ b/hw/intc/arm_gicv3_common.c | ||
49 | @@ -XXX,XX +XXX,XX @@ static void arm_gicv3_common_realize(DeviceState *dev, Error **errp) | ||
50 | return; | ||
51 | } | ||
52 | |||
53 | + if (s->lpi_enable && !s->dma) { | ||
54 | + error_setg(errp, "Redist-ITS: Guest 'sysmem' reference link not set"); | ||
55 | + return; | ||
56 | + } | ||
57 | + | ||
58 | s->cpu = g_new0(GICv3CPUState, s->num_cpu); | ||
59 | |||
60 | for (i = 0; i < s->num_cpu; i++) { | ||
61 | @@ -XXX,XX +XXX,XX @@ static void arm_gicv3_common_realize(DeviceState *dev, Error **errp) | ||
62 | (1 << 24) | | ||
63 | (i << 8) | | ||
64 | (last << 4); | ||
65 | + | ||
66 | + if (s->lpi_enable) { | ||
67 | + s->cpu[i].gicr_typer |= GICR_TYPER_PLPIS; | ||
68 | + } | ||
26 | } | 69 | } |
27 | } | 70 | } |
28 | 71 | ||
72 | @@ -XXX,XX +XXX,XX @@ static Property arm_gicv3_common_properties[] = { | ||
73 | DEFINE_PROP_UINT32("num-cpu", GICv3State, num_cpu, 1), | ||
74 | DEFINE_PROP_UINT32("num-irq", GICv3State, num_irq, 32), | ||
75 | DEFINE_PROP_UINT32("revision", GICv3State, revision, 3), | ||
76 | + DEFINE_PROP_BOOL("has-lpi", GICv3State, lpi_enable, 0), | ||
77 | DEFINE_PROP_BOOL("has-security-extensions", GICv3State, security_extn, 0), | ||
78 | DEFINE_PROP_ARRAY("redist-region-count", GICv3State, nb_redist_regions, | ||
79 | redist_region_count, qdev_prop_uint32, uint32_t), | ||
80 | + DEFINE_PROP_LINK("sysmem", GICv3State, dma, TYPE_MEMORY_REGION, | ||
81 | + MemoryRegion *), | ||
82 | DEFINE_PROP_END_OF_LIST(), | ||
83 | }; | ||
84 | |||
85 | diff --git a/hw/intc/arm_gicv3_dist.c b/hw/intc/arm_gicv3_dist.c | ||
86 | index XXXXXXX..XXXXXXX 100644 | ||
87 | --- a/hw/intc/arm_gicv3_dist.c | ||
88 | +++ b/hw/intc/arm_gicv3_dist.c | ||
89 | @@ -XXX,XX +XXX,XX @@ static bool gicd_readl(GICv3State *s, hwaddr offset, | ||
90 | * A3V == 1 (non-zero values of Affinity level 3 supported) | ||
91 | * IDbits == 0xf (we support 16-bit interrupt identifiers) | ||
92 | * DVIS == 0 (Direct virtual LPI injection not supported) | ||
93 | - * LPIS == 0 (LPIs not supported) | ||
94 | + * LPIS == 1 (LPIs are supported if affinity routing is enabled) | ||
95 | + * num_LPIs == 0b00000 (bits [15:11],Number of LPIs as indicated | ||
96 | + * by GICD_TYPER.IDbits) | ||
97 | * MBIS == 0 (message-based SPIs not supported) | ||
98 | * SecurityExtn == 1 if security extns supported | ||
99 | * CPUNumber == 0 since for us ARE is always 1 | ||
100 | @@ -XXX,XX +XXX,XX @@ static bool gicd_readl(GICv3State *s, hwaddr offset, | ||
101 | bool sec_extn = !(s->gicd_ctlr & GICD_CTLR_DS); | ||
102 | |||
103 | *data = (1 << 25) | (1 << 24) | (sec_extn << 10) | | ||
104 | + (s->lpi_enable << GICD_TYPER_LPIS_SHIFT) | | ||
105 | (0xf << 19) | itlinesnumber; | ||
106 | return true; | ||
107 | } | ||
108 | diff --git a/hw/intc/arm_gicv3_redist.c b/hw/intc/arm_gicv3_redist.c | ||
109 | index XXXXXXX..XXXXXXX 100644 | ||
110 | --- a/hw/intc/arm_gicv3_redist.c | ||
111 | +++ b/hw/intc/arm_gicv3_redist.c | ||
112 | @@ -XXX,XX +XXX,XX @@ static MemTxResult gicr_writel(GICv3CPUState *cs, hwaddr offset, | ||
113 | case GICR_CTLR: | ||
114 | /* For our implementation, GICR_TYPER.DPGS is 0 and so all | ||
115 | * the DPG bits are RAZ/WI. We don't do anything asynchronously, | ||
116 | - * so UWP and RWP are RAZ/WI. And GICR_TYPER.LPIS is 0 (we don't | ||
117 | - * implement LPIs) so Enable_LPIs is RES0. So there are no writable | ||
118 | - * bits for us. | ||
119 | + * so UWP and RWP are RAZ/WI. GICR_TYPER.LPIS is 1 (we | ||
120 | + * implement LPIs) so Enable_LPIs is programmable. | ||
121 | */ | ||
122 | + if (cs->gicr_typer & GICR_TYPER_PLPIS) { | ||
123 | + if (value & GICR_CTLR_ENABLE_LPIS) { | ||
124 | + cs->gicr_ctlr |= GICR_CTLR_ENABLE_LPIS; | ||
125 | + } else { | ||
126 | + cs->gicr_ctlr &= ~GICR_CTLR_ENABLE_LPIS; | ||
127 | + } | ||
128 | + } | ||
129 | return MEMTX_OK; | ||
130 | case GICR_STATUSR: | ||
131 | /* RAZ/WI for our implementation */ | ||
29 | -- | 132 | -- |
30 | 2.20.1 | 133 | 2.20.1 |
31 | 134 | ||
32 | 135 | diff view generated by jsdifflib |
1 | Implement the MVE vector shift right by immediate insns VSHRI and | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | VRSHRI. As with Neon, we implement these by using helper functions | 2 | |
3 | which perform left shifts but allow negative shift counts to indicate | 3 | Implemented lpi processing at redistributor to get lpi config info |
4 | right shifts. | 4 | from lpi configuration table,determine priority,set pending state in |
5 | 5 | lpi pending table and forward the lpi to cpuif.Added logic to invoke | |
6 | redistributor lpi processing with translated LPI which set/clear LPI | ||
7 | from ITS device as part of ITS INT,CLEAR,DISCARD command and | ||
8 | GITS_TRANSLATER processing. | ||
9 | |||
10 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
11 | Tested-by: Neil Armstrong <narmstrong@baylibre.com> | ||
12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | Message-id: 20210910143951.92242-7-shashi.mallela@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20210628135835.6690-9-peter.maydell@linaro.org | ||
9 | --- | 15 | --- |
10 | target/arm/helper-mve.h | 12 ++++++++++++ | 16 | hw/intc/gicv3_internal.h | 9 ++ |
11 | target/arm/translate.h | 20 ++++++++++++++++++++ | 17 | include/hw/intc/arm_gicv3_common.h | 7 ++ |
12 | target/arm/mve.decode | 28 ++++++++++++++++++++++++++++ | 18 | hw/intc/arm_gicv3.c | 14 +++ |
13 | target/arm/mve_helper.c | 7 +++++++ | 19 | hw/intc/arm_gicv3_common.c | 1 + |
14 | target/arm/translate-mve.c | 5 +++++ | 20 | hw/intc/arm_gicv3_cpuif.c | 7 +- |
15 | target/arm/translate-neon.c | 18 ------------------ | 21 | hw/intc/arm_gicv3_its.c | 23 +++++ |
16 | 6 files changed, 72 insertions(+), 18 deletions(-) | 22 | hw/intc/arm_gicv3_redist.c | 141 +++++++++++++++++++++++++++++ |
17 | 23 | 7 files changed, 200 insertions(+), 2 deletions(-) | |
18 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 24 | |
19 | index XXXXXXX..XXXXXXX 100644 | 25 | diff --git a/hw/intc/gicv3_internal.h b/hw/intc/gicv3_internal.h |
20 | --- a/target/arm/helper-mve.h | 26 | index XXXXXXX..XXXXXXX 100644 |
21 | +++ b/target/arm/helper-mve.h | 27 | --- a/hw/intc/gicv3_internal.h |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_vmovi, TCG_CALL_NO_WG, void, env, ptr, i64) | 28 | +++ b/hw/intc/gicv3_internal.h |
23 | DEF_HELPER_FLAGS_3(mve_vandi, TCG_CALL_NO_WG, void, env, ptr, i64) | 29 | @@ -XXX,XX +XXX,XX @@ FIELD(GICR_PENDBASER, PHYADDR, 16, 36) |
24 | DEF_HELPER_FLAGS_3(mve_vorri, TCG_CALL_NO_WG, void, env, ptr, i64) | 30 | FIELD(GICR_PENDBASER, OUTERCACHE, 56, 3) |
25 | 31 | FIELD(GICR_PENDBASER, PTZ, 62, 1) | |
26 | +DEF_HELPER_FLAGS_4(mve_vshli_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | |
27 | +DEF_HELPER_FLAGS_4(mve_vshli_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 33 | +#define GICR_PROPBASER_IDBITS_THRESHOLD 0xd |
28 | +DEF_HELPER_FLAGS_4(mve_vshli_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 34 | + |
29 | + | 35 | #define ICC_CTLR_EL1_CBPR (1U << 0) |
30 | DEF_HELPER_FLAGS_4(mve_vshli_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 36 | #define ICC_CTLR_EL1_EOIMODE (1U << 1) |
31 | DEF_HELPER_FLAGS_4(mve_vshli_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 37 | #define ICC_CTLR_EL1_PMHE (1U << 6) |
32 | DEF_HELPER_FLAGS_4(mve_vshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 38 | @@ -XXX,XX +XXX,XX @@ FIELD(GITS_TYPER, CIL, 36, 1) |
33 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vqshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 39 | |
34 | DEF_HELPER_FLAGS_4(mve_vqshlui_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 40 | #define L1TABLE_ENTRY_SIZE 8 |
35 | DEF_HELPER_FLAGS_4(mve_vqshlui_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 41 | |
36 | DEF_HELPER_FLAGS_4(mve_vqshlui_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 42 | +#define LPI_CTE_ENABLED TABLE_ENTRY_VALID_MASK |
37 | + | 43 | +#define LPI_PRIORITY_MASK 0xfc |
38 | +DEF_HELPER_FLAGS_4(mve_vrshli_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 44 | + |
39 | +DEF_HELPER_FLAGS_4(mve_vrshli_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 45 | #define GITS_CMDQ_ENTRY_SIZE 32 |
40 | +DEF_HELPER_FLAGS_4(mve_vrshli_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 46 | #define NUM_BYTES_IN_DW 8 |
41 | + | 47 | |
42 | +DEF_HELPER_FLAGS_4(mve_vrshli_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 48 | @@ -XXX,XX +XXX,XX @@ FIELD(MAPC, RDBASE, 16, 32) |
43 | +DEF_HELPER_FLAGS_4(mve_vrshli_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 49 | * Valid = 1 bit,RDBase = 36 bits(considering max RDBASE) |
44 | +DEF_HELPER_FLAGS_4(mve_vrshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 50 | */ |
45 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 51 | #define GITS_CTE_SIZE (0x8ULL) |
46 | index XXXXXXX..XXXXXXX 100644 | 52 | +#define GITS_CTE_RDBASE_PROCNUM_MASK MAKE_64BIT_MASK(1, RDBASE_PROCNUM_LENGTH) |
47 | --- a/target/arm/translate.h | 53 | |
48 | +++ b/target/arm/translate.h | 54 | /* Special interrupt IDs */ |
49 | @@ -XXX,XX +XXX,XX @@ static inline int times_2_plus_1(DisasContext *s, int x) | 55 | #define INTID_SECURE 1020 |
50 | return x * 2 + 1; | 56 | @@ -XXX,XX +XXX,XX @@ MemTxResult gicv3_redist_write(void *opaque, hwaddr offset, uint64_t data, |
57 | unsigned size, MemTxAttrs attrs); | ||
58 | void gicv3_dist_set_irq(GICv3State *s, int irq, int level); | ||
59 | void gicv3_redist_set_irq(GICv3CPUState *cs, int irq, int level); | ||
60 | +void gicv3_redist_process_lpi(GICv3CPUState *cs, int irq, int level); | ||
61 | +void gicv3_redist_lpi_pending(GICv3CPUState *cs, int irq, int level); | ||
62 | +void gicv3_redist_update_lpi(GICv3CPUState *cs); | ||
63 | void gicv3_redist_send_sgi(GICv3CPUState *cs, int grp, int irq, bool ns); | ||
64 | void gicv3_init_cpuif(GICv3State *s); | ||
65 | |||
66 | diff --git a/include/hw/intc/arm_gicv3_common.h b/include/hw/intc/arm_gicv3_common.h | ||
67 | index XXXXXXX..XXXXXXX 100644 | ||
68 | --- a/include/hw/intc/arm_gicv3_common.h | ||
69 | +++ b/include/hw/intc/arm_gicv3_common.h | ||
70 | @@ -XXX,XX +XXX,XX @@ struct GICv3CPUState { | ||
71 | * real state above; it doesn't need to be migrated. | ||
72 | */ | ||
73 | PendingIrq hppi; | ||
74 | + | ||
75 | + /* | ||
76 | + * Cached information recalculated from LPI tables | ||
77 | + * in guest memory | ||
78 | + */ | ||
79 | + PendingIrq hpplpi; | ||
80 | + | ||
81 | /* This is temporary working state, to avoid a malloc in gicv3_update() */ | ||
82 | bool seenbetter; | ||
83 | }; | ||
84 | diff --git a/hw/intc/arm_gicv3.c b/hw/intc/arm_gicv3.c | ||
85 | index XXXXXXX..XXXXXXX 100644 | ||
86 | --- a/hw/intc/arm_gicv3.c | ||
87 | +++ b/hw/intc/arm_gicv3.c | ||
88 | @@ -XXX,XX +XXX,XX @@ static void gicv3_redist_update_noirqset(GICv3CPUState *cs) | ||
89 | cs->hppi.grp = gicv3_irq_group(cs->gic, cs, cs->hppi.irq); | ||
90 | } | ||
91 | |||
92 | + if ((cs->gicr_ctlr & GICR_CTLR_ENABLE_LPIS) && cs->gic->lpi_enable && | ||
93 | + (cs->hpplpi.prio != 0xff)) { | ||
94 | + if (irqbetter(cs, cs->hpplpi.irq, cs->hpplpi.prio)) { | ||
95 | + cs->hppi.irq = cs->hpplpi.irq; | ||
96 | + cs->hppi.prio = cs->hpplpi.prio; | ||
97 | + cs->hppi.grp = cs->hpplpi.grp; | ||
98 | + seenbetter = true; | ||
99 | + } | ||
100 | + } | ||
101 | + | ||
102 | /* If the best interrupt we just found would preempt whatever | ||
103 | * was the previous best interrupt before this update, then | ||
104 | * we know it's definitely the best one now. | ||
105 | @@ -XXX,XX +XXX,XX @@ static void gicv3_set_irq(void *opaque, int irq, int level) | ||
106 | |||
107 | static void arm_gicv3_post_load(GICv3State *s) | ||
108 | { | ||
109 | + int i; | ||
110 | /* Recalculate our cached idea of the current highest priority | ||
111 | * pending interrupt, but don't set IRQ or FIQ lines. | ||
112 | */ | ||
113 | + for (i = 0; i < s->num_cpu; i++) { | ||
114 | + gicv3_redist_update_lpi(&s->cpu[i]); | ||
115 | + } | ||
116 | gicv3_full_update_noirqset(s); | ||
117 | /* Repopulate the cache of GICv3CPUState pointers for target CPUs */ | ||
118 | gicv3_cache_all_target_cpustates(s); | ||
119 | diff --git a/hw/intc/arm_gicv3_common.c b/hw/intc/arm_gicv3_common.c | ||
120 | index XXXXXXX..XXXXXXX 100644 | ||
121 | --- a/hw/intc/arm_gicv3_common.c | ||
122 | +++ b/hw/intc/arm_gicv3_common.c | ||
123 | @@ -XXX,XX +XXX,XX @@ static void arm_gicv3_common_reset(DeviceState *dev) | ||
124 | memset(cs->gicr_ipriorityr, 0, sizeof(cs->gicr_ipriorityr)); | ||
125 | |||
126 | cs->hppi.prio = 0xff; | ||
127 | + cs->hpplpi.prio = 0xff; | ||
128 | |||
129 | /* State in the CPU interface must *not* be reset here, because it | ||
130 | * is part of the CPU's reset domain, not the GIC device's. | ||
131 | diff --git a/hw/intc/arm_gicv3_cpuif.c b/hw/intc/arm_gicv3_cpuif.c | ||
132 | index XXXXXXX..XXXXXXX 100644 | ||
133 | --- a/hw/intc/arm_gicv3_cpuif.c | ||
134 | +++ b/hw/intc/arm_gicv3_cpuif.c | ||
135 | @@ -XXX,XX +XXX,XX @@ static void icc_activate_irq(GICv3CPUState *cs, int irq) | ||
136 | cs->gicr_iactiver0 = deposit32(cs->gicr_iactiver0, irq, 1, 1); | ||
137 | cs->gicr_ipendr0 = deposit32(cs->gicr_ipendr0, irq, 1, 0); | ||
138 | gicv3_redist_update(cs); | ||
139 | - } else { | ||
140 | + } else if (irq < GICV3_LPI_INTID_START) { | ||
141 | gicv3_gicd_active_set(cs->gic, irq); | ||
142 | gicv3_gicd_pending_clear(cs->gic, irq); | ||
143 | gicv3_update(cs->gic, irq, 1); | ||
144 | + } else { | ||
145 | + gicv3_redist_lpi_pending(cs, irq, 0); | ||
146 | } | ||
51 | } | 147 | } |
52 | 148 | ||
53 | +static inline int rsub_64(DisasContext *s, int x) | 149 | @@ -XXX,XX +XXX,XX @@ static void icc_eoir_write(CPUARMState *env, const ARMCPRegInfo *ri, |
150 | trace_gicv3_icc_eoir_write(is_eoir0 ? 0 : 1, | ||
151 | gicv3_redist_affid(cs), value); | ||
152 | |||
153 | - if (irq >= cs->gic->num_irq) { | ||
154 | + if ((irq >= cs->gic->num_irq) && | ||
155 | + !(cs->gic->lpi_enable && (irq >= GICV3_LPI_INTID_START))) { | ||
156 | /* This handles two cases: | ||
157 | * 1. If software writes the ID of a spurious interrupt [ie 1020-1023] | ||
158 | * to the GICC_EOIR, the GIC ignores that write. | ||
159 | diff --git a/hw/intc/arm_gicv3_its.c b/hw/intc/arm_gicv3_its.c | ||
160 | index XXXXXXX..XXXXXXX 100644 | ||
161 | --- a/hw/intc/arm_gicv3_its.c | ||
162 | +++ b/hw/intc/arm_gicv3_its.c | ||
163 | @@ -XXX,XX +XXX,XX @@ static bool process_its_cmd(GICv3ITSState *s, uint64_t value, uint32_t offset, | ||
164 | uint64_t cte = 0; | ||
165 | bool cte_valid = false; | ||
166 | bool result = false; | ||
167 | + uint64_t rdbase; | ||
168 | |||
169 | if (cmd == NONE) { | ||
170 | devid = offset; | ||
171 | @@ -XXX,XX +XXX,XX @@ static bool process_its_cmd(GICv3ITSState *s, uint64_t value, uint32_t offset, | ||
172 | * Current implementation only supports rdbase == procnum | ||
173 | * Hence rdbase physical address is ignored | ||
174 | */ | ||
175 | + rdbase = (cte & GITS_CTE_RDBASE_PROCNUM_MASK) >> 1U; | ||
176 | + | ||
177 | + if (rdbase > s->gicv3->num_cpu) { | ||
178 | + return result; | ||
179 | + } | ||
180 | + | ||
181 | + if ((cmd == CLEAR) || (cmd == DISCARD)) { | ||
182 | + gicv3_redist_process_lpi(&s->gicv3->cpu[rdbase], pIntid, 0); | ||
183 | + } else { | ||
184 | + gicv3_redist_process_lpi(&s->gicv3->cpu[rdbase], pIntid, 1); | ||
185 | + } | ||
186 | + | ||
187 | if (cmd == DISCARD) { | ||
188 | IteEntry ite = {}; | ||
189 | /* remove mapping from interrupt translation table */ | ||
190 | @@ -XXX,XX +XXX,XX @@ static void process_cmdq(GICv3ITSState *s) | ||
191 | MemTxResult res = MEMTX_OK; | ||
192 | bool result = true; | ||
193 | uint8_t cmd; | ||
194 | + int i; | ||
195 | |||
196 | if (!(s->ctlr & ITS_CTLR_ENABLED)) { | ||
197 | return; | ||
198 | @@ -XXX,XX +XXX,XX @@ static void process_cmdq(GICv3ITSState *s) | ||
199 | break; | ||
200 | case GITS_CMD_INV: | ||
201 | case GITS_CMD_INVALL: | ||
202 | + /* | ||
203 | + * Current implementation doesn't cache any ITS tables, | ||
204 | + * but the calculated lpi priority information. We only | ||
205 | + * need to trigger lpi priority re-calculation to be in | ||
206 | + * sync with LPI config table or pending table changes. | ||
207 | + */ | ||
208 | + for (i = 0; i < s->gicv3->num_cpu; i++) { | ||
209 | + gicv3_redist_update_lpi(&s->gicv3->cpu[i]); | ||
210 | + } | ||
211 | break; | ||
212 | default: | ||
213 | break; | ||
214 | diff --git a/hw/intc/arm_gicv3_redist.c b/hw/intc/arm_gicv3_redist.c | ||
215 | index XXXXXXX..XXXXXXX 100644 | ||
216 | --- a/hw/intc/arm_gicv3_redist.c | ||
217 | +++ b/hw/intc/arm_gicv3_redist.c | ||
218 | @@ -XXX,XX +XXX,XX @@ static MemTxResult gicr_writel(GICv3CPUState *cs, hwaddr offset, | ||
219 | if (cs->gicr_typer & GICR_TYPER_PLPIS) { | ||
220 | if (value & GICR_CTLR_ENABLE_LPIS) { | ||
221 | cs->gicr_ctlr |= GICR_CTLR_ENABLE_LPIS; | ||
222 | + /* Check for any pending interr in pending table */ | ||
223 | + gicv3_redist_update_lpi(cs); | ||
224 | + gicv3_redist_update(cs); | ||
225 | } else { | ||
226 | cs->gicr_ctlr &= ~GICR_CTLR_ENABLE_LPIS; | ||
227 | } | ||
228 | @@ -XXX,XX +XXX,XX @@ MemTxResult gicv3_redist_write(void *opaque, hwaddr offset, uint64_t data, | ||
229 | return r; | ||
230 | } | ||
231 | |||
232 | +static void gicv3_redist_check_lpi_priority(GICv3CPUState *cs, int irq) | ||
54 | +{ | 233 | +{ |
55 | + return 64 - x; | 234 | + AddressSpace *as = &cs->gic->dma_as; |
235 | + uint64_t lpict_baddr; | ||
236 | + uint8_t lpite; | ||
237 | + uint8_t prio; | ||
238 | + | ||
239 | + lpict_baddr = cs->gicr_propbaser & R_GICR_PROPBASER_PHYADDR_MASK; | ||
240 | + | ||
241 | + address_space_read(as, lpict_baddr + ((irq - GICV3_LPI_INTID_START) * | ||
242 | + sizeof(lpite)), MEMTXATTRS_UNSPECIFIED, &lpite, | ||
243 | + sizeof(lpite)); | ||
244 | + | ||
245 | + if (!(lpite & LPI_CTE_ENABLED)) { | ||
246 | + return; | ||
247 | + } | ||
248 | + | ||
249 | + if (cs->gic->gicd_ctlr & GICD_CTLR_DS) { | ||
250 | + prio = lpite & LPI_PRIORITY_MASK; | ||
251 | + } else { | ||
252 | + prio = ((lpite & LPI_PRIORITY_MASK) >> 1) | 0x80; | ||
253 | + } | ||
254 | + | ||
255 | + if ((prio < cs->hpplpi.prio) || | ||
256 | + ((prio == cs->hpplpi.prio) && (irq <= cs->hpplpi.irq))) { | ||
257 | + cs->hpplpi.irq = irq; | ||
258 | + cs->hpplpi.prio = prio; | ||
259 | + /* LPIs are always non-secure Grp1 interrupts */ | ||
260 | + cs->hpplpi.grp = GICV3_G1NS; | ||
261 | + } | ||
56 | +} | 262 | +} |
57 | + | 263 | + |
58 | +static inline int rsub_32(DisasContext *s, int x) | 264 | +void gicv3_redist_update_lpi(GICv3CPUState *cs) |
59 | +{ | 265 | +{ |
60 | + return 32 - x; | 266 | + /* |
267 | + * This function scans the LPI pending table and for each pending | ||
268 | + * LPI, reads the corresponding entry from LPI configuration table | ||
269 | + * to extract the priority info and determine if the current LPI | ||
270 | + * priority is lower than the last computed high priority lpi interrupt. | ||
271 | + * If yes, replace current LPI as the new high priority lpi interrupt. | ||
272 | + */ | ||
273 | + AddressSpace *as = &cs->gic->dma_as; | ||
274 | + uint64_t lpipt_baddr; | ||
275 | + uint32_t pendt_size = 0; | ||
276 | + uint8_t pend; | ||
277 | + int i, bit; | ||
278 | + uint64_t idbits; | ||
279 | + | ||
280 | + idbits = MIN(FIELD_EX64(cs->gicr_propbaser, GICR_PROPBASER, IDBITS), | ||
281 | + GICD_TYPER_IDBITS); | ||
282 | + | ||
283 | + if (!(cs->gicr_ctlr & GICR_CTLR_ENABLE_LPIS) || !cs->gicr_propbaser || | ||
284 | + !cs->gicr_pendbaser) { | ||
285 | + return; | ||
286 | + } | ||
287 | + | ||
288 | + cs->hpplpi.prio = 0xff; | ||
289 | + | ||
290 | + lpipt_baddr = cs->gicr_pendbaser & R_GICR_PENDBASER_PHYADDR_MASK; | ||
291 | + | ||
292 | + /* Determine the highest priority pending interrupt among LPIs */ | ||
293 | + pendt_size = (1ULL << (idbits + 1)); | ||
294 | + | ||
295 | + for (i = GICV3_LPI_INTID_START / 8; i < pendt_size / 8; i++) { | ||
296 | + address_space_read(as, lpipt_baddr + i, MEMTXATTRS_UNSPECIFIED, &pend, | ||
297 | + sizeof(pend)); | ||
298 | + | ||
299 | + while (pend) { | ||
300 | + bit = ctz32(pend); | ||
301 | + gicv3_redist_check_lpi_priority(cs, i * 8 + bit); | ||
302 | + pend &= ~(1 << bit); | ||
303 | + } | ||
304 | + } | ||
61 | +} | 305 | +} |
62 | + | 306 | + |
63 | +static inline int rsub_16(DisasContext *s, int x) | 307 | +void gicv3_redist_lpi_pending(GICv3CPUState *cs, int irq, int level) |
64 | +{ | 308 | +{ |
65 | + return 16 - x; | 309 | + /* |
310 | + * This function updates the pending bit in lpi pending table for | ||
311 | + * the irq being activated or deactivated. | ||
312 | + */ | ||
313 | + AddressSpace *as = &cs->gic->dma_as; | ||
314 | + uint64_t lpipt_baddr; | ||
315 | + bool ispend = false; | ||
316 | + uint8_t pend; | ||
317 | + | ||
318 | + /* | ||
319 | + * get the bit value corresponding to this irq in the | ||
320 | + * lpi pending table | ||
321 | + */ | ||
322 | + lpipt_baddr = cs->gicr_pendbaser & R_GICR_PENDBASER_PHYADDR_MASK; | ||
323 | + | ||
324 | + address_space_read(as, lpipt_baddr + ((irq / 8) * sizeof(pend)), | ||
325 | + MEMTXATTRS_UNSPECIFIED, &pend, sizeof(pend)); | ||
326 | + | ||
327 | + ispend = extract32(pend, irq % 8, 1); | ||
328 | + | ||
329 | + /* no change in the value of pending bit, return */ | ||
330 | + if (ispend == level) { | ||
331 | + return; | ||
332 | + } | ||
333 | + pend = deposit32(pend, irq % 8, 1, level ? 1 : 0); | ||
334 | + | ||
335 | + address_space_write(as, lpipt_baddr + ((irq / 8) * sizeof(pend)), | ||
336 | + MEMTXATTRS_UNSPECIFIED, &pend, sizeof(pend)); | ||
337 | + | ||
338 | + /* | ||
339 | + * check if this LPI is better than the current hpplpi, if yes | ||
340 | + * just set hpplpi.prio and .irq without doing a full rescan | ||
341 | + */ | ||
342 | + if (level) { | ||
343 | + gicv3_redist_check_lpi_priority(cs, irq); | ||
344 | + } else { | ||
345 | + if (irq == cs->hpplpi.irq) { | ||
346 | + gicv3_redist_update_lpi(cs); | ||
347 | + } | ||
348 | + } | ||
66 | +} | 349 | +} |
67 | + | 350 | + |
68 | +static inline int rsub_8(DisasContext *s, int x) | 351 | +void gicv3_redist_process_lpi(GICv3CPUState *cs, int irq, int level) |
69 | +{ | 352 | +{ |
70 | + return 8 - x; | 353 | + uint64_t idbits; |
354 | + | ||
355 | + idbits = MIN(FIELD_EX64(cs->gicr_propbaser, GICR_PROPBASER, IDBITS), | ||
356 | + GICD_TYPER_IDBITS); | ||
357 | + | ||
358 | + if (!(cs->gicr_ctlr & GICR_CTLR_ENABLE_LPIS) || !cs->gicr_propbaser || | ||
359 | + !cs->gicr_pendbaser || (irq > (1ULL << (idbits + 1)) - 1) || | ||
360 | + irq < GICV3_LPI_INTID_START) { | ||
361 | + return; | ||
362 | + } | ||
363 | + | ||
364 | + /* set/clear the pending bit for this irq */ | ||
365 | + gicv3_redist_lpi_pending(cs, irq, level); | ||
366 | + | ||
367 | + gicv3_redist_update(cs); | ||
71 | +} | 368 | +} |
72 | + | 369 | + |
73 | static inline int arm_dc_feature(DisasContext *dc, int feature) | 370 | void gicv3_redist_set_irq(GICv3CPUState *cs, int irq, int level) |
74 | { | 371 | { |
75 | return (dc->features & (1ULL << feature)) != 0; | 372 | /* Update redistributor state for a change in an external PPI input line */ |
76 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | ||
77 | index XXXXXXX..XXXXXXX 100644 | ||
78 | --- a/target/arm/mve.decode | ||
79 | +++ b/target/arm/mve.decode | ||
80 | @@ -XXX,XX +XXX,XX @@ | ||
81 | @2_shl_h .... .... .. 01 shift:4 .... .... .... .... &2shift qd=%qd qm=%qm size=1 | ||
82 | @2_shl_w .... .... .. 1 shift:5 .... .... .... .... &2shift qd=%qd qm=%qm size=2 | ||
83 | |||
84 | +# Right shifts are encoded as N - shift, where N is the element size in bits. | ||
85 | +%rshift_i5 16:5 !function=rsub_32 | ||
86 | +%rshift_i4 16:4 !function=rsub_16 | ||
87 | +%rshift_i3 16:3 !function=rsub_8 | ||
88 | + | ||
89 | +@2_shr_b .... .... .. 001 ... .... .... .... .... &2shift qd=%qd qm=%qm \ | ||
90 | + size=0 shift=%rshift_i3 | ||
91 | +@2_shr_h .... .... .. 01 .... .... .... .... .... &2shift qd=%qd qm=%qm \ | ||
92 | + size=1 shift=%rshift_i4 | ||
93 | +@2_shr_w .... .... .. 1 ..... .... .... .... .... &2shift qd=%qd qm=%qm \ | ||
94 | + size=2 shift=%rshift_i5 | ||
95 | + | ||
96 | # Vector loads and stores | ||
97 | |||
98 | # Widening loads and narrowing stores: | ||
99 | @@ -XXX,XX +XXX,XX @@ VQSHLI_U 111 1 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_w | ||
100 | VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_b | ||
101 | VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_h | ||
102 | VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_w | ||
103 | + | ||
104 | +VSHRI_S 111 0 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_b | ||
105 | +VSHRI_S 111 0 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_h | ||
106 | +VSHRI_S 111 0 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_w | ||
107 | + | ||
108 | +VSHRI_U 111 1 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_b | ||
109 | +VSHRI_U 111 1 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_h | ||
110 | +VSHRI_U 111 1 1111 1 . ... ... ... 0 0000 0 1 . 1 ... 0 @2_shr_w | ||
111 | + | ||
112 | +VRSHRI_S 111 0 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_b | ||
113 | +VRSHRI_S 111 0 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_h | ||
114 | +VRSHRI_S 111 0 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_w | ||
115 | + | ||
116 | +VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_b | ||
117 | +VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_h | ||
118 | +VRSHRI_U 111 1 1111 1 . ... ... ... 0 0010 0 1 . 1 ... 0 @2_shr_w | ||
119 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
120 | index XXXXXXX..XXXXXXX 100644 | ||
121 | --- a/target/arm/mve_helper.c | ||
122 | +++ b/target/arm/mve_helper.c | ||
123 | @@ -XXX,XX +XXX,XX @@ DO_VADDV(vaddvuw, 4, uint32_t) | ||
124 | DO_2SHIFT(OP##b, 1, uint8_t, FN) \ | ||
125 | DO_2SHIFT(OP##h, 2, uint16_t, FN) \ | ||
126 | DO_2SHIFT(OP##w, 4, uint32_t, FN) | ||
127 | +#define DO_2SHIFT_S(OP, FN) \ | ||
128 | + DO_2SHIFT(OP##b, 1, int8_t, FN) \ | ||
129 | + DO_2SHIFT(OP##h, 2, int16_t, FN) \ | ||
130 | + DO_2SHIFT(OP##w, 4, int32_t, FN) | ||
131 | |||
132 | #define DO_2SHIFT_SAT_U(OP, FN) \ | ||
133 | DO_2SHIFT_SAT(OP##b, 1, uint8_t, FN) \ | ||
134 | @@ -XXX,XX +XXX,XX @@ DO_VADDV(vaddvuw, 4, uint32_t) | ||
135 | DO_2SHIFT_SAT(OP##w, 4, int32_t, FN) | ||
136 | |||
137 | DO_2SHIFT_U(vshli_u, DO_VSHLU) | ||
138 | +DO_2SHIFT_S(vshli_s, DO_VSHLS) | ||
139 | DO_2SHIFT_SAT_U(vqshli_u, DO_UQSHL_OP) | ||
140 | DO_2SHIFT_SAT_S(vqshli_s, DO_SQSHL_OP) | ||
141 | DO_2SHIFT_SAT_S(vqshlui_s, DO_SUQSHL_OP) | ||
142 | +DO_2SHIFT_U(vrshli_u, DO_VRSHLU) | ||
143 | +DO_2SHIFT_S(vrshli_s, DO_VRSHLS) | ||
144 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
145 | index XXXXXXX..XXXXXXX 100644 | ||
146 | --- a/target/arm/translate-mve.c | ||
147 | +++ b/target/arm/translate-mve.c | ||
148 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT(VSHLI, vshli_u, false) | ||
149 | DO_2SHIFT(VQSHLI_S, vqshli_s, false) | ||
150 | DO_2SHIFT(VQSHLI_U, vqshli_u, false) | ||
151 | DO_2SHIFT(VQSHLUI, vqshlui_s, false) | ||
152 | +/* These right shifts use a left-shift helper with negated shift count */ | ||
153 | +DO_2SHIFT(VSHRI_S, vshli_s, true) | ||
154 | +DO_2SHIFT(VSHRI_U, vshli_u, true) | ||
155 | +DO_2SHIFT(VRSHRI_S, vrshli_s, true) | ||
156 | +DO_2SHIFT(VRSHRI_U, vrshli_u, true) | ||
157 | diff --git a/target/arm/translate-neon.c b/target/arm/translate-neon.c | ||
158 | index XXXXXXX..XXXXXXX 100644 | ||
159 | --- a/target/arm/translate-neon.c | ||
160 | +++ b/target/arm/translate-neon.c | ||
161 | @@ -XXX,XX +XXX,XX @@ static inline int plus1(DisasContext *s, int x) | ||
162 | return x + 1; | ||
163 | } | ||
164 | |||
165 | -static inline int rsub_64(DisasContext *s, int x) | ||
166 | -{ | ||
167 | - return 64 - x; | ||
168 | -} | ||
169 | - | ||
170 | -static inline int rsub_32(DisasContext *s, int x) | ||
171 | -{ | ||
172 | - return 32 - x; | ||
173 | -} | ||
174 | -static inline int rsub_16(DisasContext *s, int x) | ||
175 | -{ | ||
176 | - return 16 - x; | ||
177 | -} | ||
178 | -static inline int rsub_8(DisasContext *s, int x) | ||
179 | -{ | ||
180 | - return 8 - x; | ||
181 | -} | ||
182 | - | ||
183 | static inline int neon_3same_fp_size(DisasContext *s, int x) | ||
184 | { | ||
185 | /* Convert 0==fp32, 1==fp16 into a MO_* value */ | ||
186 | -- | 373 | -- |
187 | 2.20.1 | 374 | 2.20.1 |
188 | 375 | ||
189 | 376 | diff view generated by jsdifflib |
1 | From: Joe Komlodi <joe.komlodi@xilinx.com> | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | If the CPU is running in default NaN mode (FPCR.DN == 1) and we execute | 3 | Added expected IORT files applicable with latest GICv3 |
4 | FRSQRTE, FRECPE, or FRECPX with a signaling NaN, parts_silence_nan_frac() will | 4 | ITS changes.Temporarily differences in these files are |
5 | assert due to fpst->default_nan_mode being set. | 5 | okay. |
6 | 6 | ||
7 | To avoid this, we check to see what NaN mode we're running in before we call | 7 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> |
8 | floatxx_silence_nan(). | 8 | Acked-by: Igor Mammedov <imammedo@redhat.com> |
9 | |||
10 | Signed-off-by: Joe Komlodi <joe.komlodi@xilinx.com> | ||
11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
12 | Message-id: 1624662174-175828-2-git-send-email-joe.komlodi@xilinx.com | ||
13 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
10 | Message-id: 20210910143951.92242-8-shashi.mallela@linaro.org | ||
14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
15 | --- | 12 | --- |
16 | target/arm/helper-a64.c | 12 +++++++++--- | 13 | tests/qtest/bios-tables-test-allowed-diff.h | 4 ++++ |
17 | target/arm/vfp_helper.c | 24 ++++++++++++++++++------ | 14 | tests/data/acpi/virt/IORT | 0 |
18 | 2 files changed, 27 insertions(+), 9 deletions(-) | 15 | tests/data/acpi/virt/IORT.memhp | 0 |
16 | tests/data/acpi/virt/IORT.numamem | 0 | ||
17 | tests/data/acpi/virt/IORT.pxb | 0 | ||
18 | 5 files changed, 4 insertions(+) | ||
19 | create mode 100644 tests/data/acpi/virt/IORT | ||
20 | create mode 100644 tests/data/acpi/virt/IORT.memhp | ||
21 | create mode 100644 tests/data/acpi/virt/IORT.numamem | ||
22 | create mode 100644 tests/data/acpi/virt/IORT.pxb | ||
19 | 23 | ||
20 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 24 | diff --git a/tests/qtest/bios-tables-test-allowed-diff.h b/tests/qtest/bios-tables-test-allowed-diff.h |
21 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
22 | --- a/target/arm/helper-a64.c | 26 | --- a/tests/qtest/bios-tables-test-allowed-diff.h |
23 | +++ b/target/arm/helper-a64.c | 27 | +++ b/tests/qtest/bios-tables-test-allowed-diff.h |
24 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(frecpx_f16)(uint32_t a, void *fpstp) | 28 | @@ -1 +1,5 @@ |
25 | float16 nan = a; | 29 | /* List of comma-separated changed AML files to ignore */ |
26 | if (float16_is_signaling_nan(a, fpst)) { | 30 | +"tests/data/acpi/virt/IORT", |
27 | float_raise(float_flag_invalid, fpst); | 31 | +"tests/data/acpi/virt/IORT.memhp", |
28 | - nan = float16_silence_nan(a, fpst); | 32 | +"tests/data/acpi/virt/IORT.numamem", |
29 | + if (!fpst->default_nan_mode) { | 33 | +"tests/data/acpi/virt/IORT.pxb", |
30 | + nan = float16_silence_nan(a, fpst); | 34 | diff --git a/tests/data/acpi/virt/IORT b/tests/data/acpi/virt/IORT |
31 | + } | 35 | new file mode 100644 |
32 | } | 36 | index XXXXXXX..XXXXXXX |
33 | if (fpst->default_nan_mode) { | 37 | diff --git a/tests/data/acpi/virt/IORT.memhp b/tests/data/acpi/virt/IORT.memhp |
34 | nan = float16_default_nan(fpst); | 38 | new file mode 100644 |
35 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(frecpx_f32)(float32 a, void *fpstp) | 39 | index XXXXXXX..XXXXXXX |
36 | float32 nan = a; | 40 | diff --git a/tests/data/acpi/virt/IORT.numamem b/tests/data/acpi/virt/IORT.numamem |
37 | if (float32_is_signaling_nan(a, fpst)) { | 41 | new file mode 100644 |
38 | float_raise(float_flag_invalid, fpst); | 42 | index XXXXXXX..XXXXXXX |
39 | - nan = float32_silence_nan(a, fpst); | 43 | diff --git a/tests/data/acpi/virt/IORT.pxb b/tests/data/acpi/virt/IORT.pxb |
40 | + if (!fpst->default_nan_mode) { | 44 | new file mode 100644 |
41 | + nan = float32_silence_nan(a, fpst); | 45 | index XXXXXXX..XXXXXXX |
42 | + } | ||
43 | } | ||
44 | if (fpst->default_nan_mode) { | ||
45 | nan = float32_default_nan(fpst); | ||
46 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(frecpx_f64)(float64 a, void *fpstp) | ||
47 | float64 nan = a; | ||
48 | if (float64_is_signaling_nan(a, fpst)) { | ||
49 | float_raise(float_flag_invalid, fpst); | ||
50 | - nan = float64_silence_nan(a, fpst); | ||
51 | + if (!fpst->default_nan_mode) { | ||
52 | + nan = float64_silence_nan(a, fpst); | ||
53 | + } | ||
54 | } | ||
55 | if (fpst->default_nan_mode) { | ||
56 | nan = float64_default_nan(fpst); | ||
57 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
58 | index XXXXXXX..XXXXXXX 100644 | ||
59 | --- a/target/arm/vfp_helper.c | ||
60 | +++ b/target/arm/vfp_helper.c | ||
61 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(recpe_f16)(uint32_t input, void *fpstp) | ||
62 | float16 nan = f16; | ||
63 | if (float16_is_signaling_nan(f16, fpst)) { | ||
64 | float_raise(float_flag_invalid, fpst); | ||
65 | - nan = float16_silence_nan(f16, fpst); | ||
66 | + if (!fpst->default_nan_mode) { | ||
67 | + nan = float16_silence_nan(f16, fpst); | ||
68 | + } | ||
69 | } | ||
70 | if (fpst->default_nan_mode) { | ||
71 | nan = float16_default_nan(fpst); | ||
72 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(recpe_f32)(float32 input, void *fpstp) | ||
73 | float32 nan = f32; | ||
74 | if (float32_is_signaling_nan(f32, fpst)) { | ||
75 | float_raise(float_flag_invalid, fpst); | ||
76 | - nan = float32_silence_nan(f32, fpst); | ||
77 | + if (!fpst->default_nan_mode) { | ||
78 | + nan = float32_silence_nan(f32, fpst); | ||
79 | + } | ||
80 | } | ||
81 | if (fpst->default_nan_mode) { | ||
82 | nan = float32_default_nan(fpst); | ||
83 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp) | ||
84 | float64 nan = f64; | ||
85 | if (float64_is_signaling_nan(f64, fpst)) { | ||
86 | float_raise(float_flag_invalid, fpst); | ||
87 | - nan = float64_silence_nan(f64, fpst); | ||
88 | + if (!fpst->default_nan_mode) { | ||
89 | + nan = float64_silence_nan(f64, fpst); | ||
90 | + } | ||
91 | } | ||
92 | if (fpst->default_nan_mode) { | ||
93 | nan = float64_default_nan(fpst); | ||
94 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(rsqrte_f16)(uint32_t input, void *fpstp) | ||
95 | float16 nan = f16; | ||
96 | if (float16_is_signaling_nan(f16, s)) { | ||
97 | float_raise(float_flag_invalid, s); | ||
98 | - nan = float16_silence_nan(f16, s); | ||
99 | + if (!s->default_nan_mode) { | ||
100 | + nan = float16_silence_nan(f16, fpstp); | ||
101 | + } | ||
102 | } | ||
103 | if (s->default_nan_mode) { | ||
104 | nan = float16_default_nan(s); | ||
105 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrte_f32)(float32 input, void *fpstp) | ||
106 | float32 nan = f32; | ||
107 | if (float32_is_signaling_nan(f32, s)) { | ||
108 | float_raise(float_flag_invalid, s); | ||
109 | - nan = float32_silence_nan(f32, s); | ||
110 | + if (!s->default_nan_mode) { | ||
111 | + nan = float32_silence_nan(f32, fpstp); | ||
112 | + } | ||
113 | } | ||
114 | if (s->default_nan_mode) { | ||
115 | nan = float32_default_nan(s); | ||
116 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp) | ||
117 | float64 nan = f64; | ||
118 | if (float64_is_signaling_nan(f64, s)) { | ||
119 | float_raise(float_flag_invalid, s); | ||
120 | - nan = float64_silence_nan(f64, s); | ||
121 | + if (!s->default_nan_mode) { | ||
122 | + nan = float64_silence_nan(f64, fpstp); | ||
123 | + } | ||
124 | } | ||
125 | if (s->default_nan_mode) { | ||
126 | nan = float64_default_nan(s); | ||
127 | -- | 46 | -- |
128 | 2.20.1 | 47 | 2.20.1 |
129 | 48 | ||
130 | 49 | diff view generated by jsdifflib |
1 | Implement the MVE saturating shift-right-and-narrow insns | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | VQSHRN, VQSHRUN, VQRSHRN and VQRSHRUN. | ||
3 | 2 | ||
4 | do_srshr() is borrowed from sve_helper.c. | 3 | Included creation of ITS as part of virt platform GIC |
4 | initialization. This Emulated ITS model now co-exists with kvm | ||
5 | ITS and is enabled in absence of kvm irq kernel support in a | ||
6 | platform. | ||
5 | 7 | ||
8 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | Message-id: 20210910143951.92242-9-shashi.mallela@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20210628135835.6690-13-peter.maydell@linaro.org | ||
9 | --- | 12 | --- |
10 | target/arm/helper-mve.h | 30 +++++++++++ | 13 | include/hw/arm/virt.h | 2 ++ |
11 | target/arm/mve.decode | 28 ++++++++++ | 14 | target/arm/kvm_arm.h | 4 ++-- |
12 | target/arm/mve_helper.c | 104 +++++++++++++++++++++++++++++++++++++ | 15 | hw/arm/virt.c | 29 +++++++++++++++++++++++++++-- |
13 | target/arm/translate-mve.c | 12 +++++ | 16 | 3 files changed, 31 insertions(+), 4 deletions(-) |
14 | 4 files changed, 174 insertions(+) | ||
15 | 17 | ||
16 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 18 | diff --git a/include/hw/arm/virt.h b/include/hw/arm/virt.h |
17 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-mve.h | 20 | --- a/include/hw/arm/virt.h |
19 | +++ b/target/arm/helper-mve.h | 21 | +++ b/include/hw/arm/virt.h |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vrshrnbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 22 | @@ -XXX,XX +XXX,XX @@ struct VirtMachineClass { |
21 | DEF_HELPER_FLAGS_4(mve_vrshrnbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 23 | MachineClass parent; |
22 | DEF_HELPER_FLAGS_4(mve_vrshrntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 24 | bool disallow_affinity_adjustment; |
23 | DEF_HELPER_FLAGS_4(mve_vrshrnth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 25 | bool no_its; |
24 | + | 26 | + bool no_tcg_its; |
25 | +DEF_HELPER_FLAGS_4(mve_vqshrnb_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 27 | bool no_pmu; |
26 | +DEF_HELPER_FLAGS_4(mve_vqshrnb_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 28 | bool claim_edge_triggered_timers; |
27 | +DEF_HELPER_FLAGS_4(mve_vqshrnt_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 29 | bool smbios_old_sys_ver; |
28 | +DEF_HELPER_FLAGS_4(mve_vqshrnt_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 30 | @@ -XXX,XX +XXX,XX @@ struct VirtMachineState { |
29 | + | 31 | bool highmem; |
30 | +DEF_HELPER_FLAGS_4(mve_vqshrnb_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | bool highmem_ecam; |
31 | +DEF_HELPER_FLAGS_4(mve_vqshrnb_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 33 | bool its; |
32 | +DEF_HELPER_FLAGS_4(mve_vqshrnt_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 34 | + bool tcg_its; |
33 | +DEF_HELPER_FLAGS_4(mve_vqshrnt_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 35 | bool virt; |
34 | + | 36 | bool ras; |
35 | +DEF_HELPER_FLAGS_4(mve_vqshrunbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 37 | bool mte; |
36 | +DEF_HELPER_FLAGS_4(mve_vqshrunbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 38 | diff --git a/target/arm/kvm_arm.h b/target/arm/kvm_arm.h |
37 | +DEF_HELPER_FLAGS_4(mve_vqshruntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
38 | +DEF_HELPER_FLAGS_4(mve_vqshrunth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
39 | + | ||
40 | +DEF_HELPER_FLAGS_4(mve_vqrshrnb_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
41 | +DEF_HELPER_FLAGS_4(mve_vqrshrnb_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
42 | +DEF_HELPER_FLAGS_4(mve_vqrshrnt_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
43 | +DEF_HELPER_FLAGS_4(mve_vqrshrnt_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
44 | + | ||
45 | +DEF_HELPER_FLAGS_4(mve_vqrshrnb_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
46 | +DEF_HELPER_FLAGS_4(mve_vqrshrnb_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
47 | +DEF_HELPER_FLAGS_4(mve_vqrshrnt_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
48 | +DEF_HELPER_FLAGS_4(mve_vqrshrnt_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
49 | + | ||
50 | +DEF_HELPER_FLAGS_4(mve_vqrshrunbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
51 | +DEF_HELPER_FLAGS_4(mve_vqrshrunbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
52 | +DEF_HELPER_FLAGS_4(mve_vqrshruntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
53 | +DEF_HELPER_FLAGS_4(mve_vqrshrunth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
54 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | ||
55 | index XXXXXXX..XXXXXXX 100644 | 39 | index XXXXXXX..XXXXXXX 100644 |
56 | --- a/target/arm/mve.decode | 40 | --- a/target/arm/kvm_arm.h |
57 | +++ b/target/arm/mve.decode | 41 | +++ b/target/arm/kvm_arm.h |
58 | @@ -XXX,XX +XXX,XX @@ VRSHRNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_b | 42 | @@ -XXX,XX +XXX,XX @@ static inline const char *its_class_name(void) |
59 | VRSHRNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 1 @2_shr_h | 43 | /* KVM implementation requires this capability */ |
60 | VRSHRNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_b | 44 | return kvm_direct_msi_enabled() ? "arm-its-kvm" : NULL; |
61 | VRSHRNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 1 @2_shr_h | 45 | } else { |
62 | + | 46 | - /* Software emulation is not implemented yet */ |
63 | +VQSHRNB_S 111 0 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 0 @2_shr_b | 47 | - return NULL; |
64 | +VQSHRNB_S 111 0 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 0 @2_shr_h | 48 | + /* Software emulation based model */ |
65 | +VQSHRNT_S 111 0 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 0 @2_shr_b | 49 | + return "arm-gicv3-its"; |
66 | +VQSHRNT_S 111 0 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 0 @2_shr_h | ||
67 | +VQSHRNB_U 111 1 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 0 @2_shr_b | ||
68 | +VQSHRNB_U 111 1 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 0 @2_shr_h | ||
69 | +VQSHRNT_U 111 1 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 0 @2_shr_b | ||
70 | +VQSHRNT_U 111 1 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 0 @2_shr_h | ||
71 | + | ||
72 | +VQSHRUNB 111 0 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_b | ||
73 | +VQSHRUNB 111 0 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_h | ||
74 | +VQSHRUNT 111 0 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_b | ||
75 | +VQSHRUNT 111 0 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_h | ||
76 | + | ||
77 | +VQRSHRNB_S 111 0 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 1 @2_shr_b | ||
78 | +VQRSHRNB_S 111 0 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 1 @2_shr_h | ||
79 | +VQRSHRNT_S 111 0 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 1 @2_shr_b | ||
80 | +VQRSHRNT_S 111 0 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 1 @2_shr_h | ||
81 | +VQRSHRNB_U 111 1 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 1 @2_shr_b | ||
82 | +VQRSHRNB_U 111 1 1110 1 . ... ... ... 0 1111 0 1 . 0 ... 1 @2_shr_h | ||
83 | +VQRSHRNT_U 111 1 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 1 @2_shr_b | ||
84 | +VQRSHRNT_U 111 1 1110 1 . ... ... ... 1 1111 0 1 . 0 ... 1 @2_shr_h | ||
85 | + | ||
86 | +VQRSHRUNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_b | ||
87 | +VQRSHRUNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_h | ||
88 | +VQRSHRUNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_b | ||
89 | +VQRSHRUNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_h | ||
90 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
91 | index XXXXXXX..XXXXXXX 100644 | ||
92 | --- a/target/arm/mve_helper.c | ||
93 | +++ b/target/arm/mve_helper.c | ||
94 | @@ -XXX,XX +XXX,XX @@ static inline uint64_t do_urshr(uint64_t x, unsigned sh) | ||
95 | } | 50 | } |
96 | } | 51 | } |
97 | 52 | ||
98 | +static inline int64_t do_srshr(int64_t x, unsigned sh) | 53 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c |
99 | +{ | 54 | index XXXXXXX..XXXXXXX 100644 |
100 | + if (likely(sh < 64)) { | 55 | --- a/hw/arm/virt.c |
101 | + return (x >> sh) + ((x >> (sh - 1)) & 1); | 56 | +++ b/hw/arm/virt.c |
102 | + } else { | 57 | @@ -XXX,XX +XXX,XX @@ static void create_its(VirtMachineState *vms) |
103 | + /* Rounding the sign bit always produces 0. */ | 58 | const char *itsclass = its_class_name(); |
104 | + return 0; | 59 | DeviceState *dev; |
105 | + } | 60 | |
106 | +} | 61 | + if (!strcmp(itsclass, "arm-gicv3-its")) { |
107 | + | 62 | + if (!vms->tcg_its) { |
108 | DO_VSHRN_ALL(vshrn, DO_SHR) | 63 | + itsclass = NULL; |
109 | DO_VSHRN_ALL(vrshrn, do_urshr) | 64 | + } |
110 | + | ||
111 | +static inline int32_t do_sat_bhs(int64_t val, int64_t min, int64_t max, | ||
112 | + bool *satp) | ||
113 | +{ | ||
114 | + if (val > max) { | ||
115 | + *satp = true; | ||
116 | + return max; | ||
117 | + } else if (val < min) { | ||
118 | + *satp = true; | ||
119 | + return min; | ||
120 | + } else { | ||
121 | + return val; | ||
122 | + } | ||
123 | +} | ||
124 | + | ||
125 | +/* Saturating narrowing right shifts */ | ||
126 | +#define DO_VSHRN_SAT(OP, TOP, ESIZE, TYPE, LESIZE, LTYPE, FN) \ | ||
127 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
128 | + void *vm, uint32_t shift) \ | ||
129 | + { \ | ||
130 | + LTYPE *m = vm; \ | ||
131 | + TYPE *d = vd; \ | ||
132 | + uint16_t mask = mve_element_mask(env); \ | ||
133 | + bool qc = false; \ | ||
134 | + unsigned le; \ | ||
135 | + for (le = 0; le < 16 / LESIZE; le++, mask >>= LESIZE) { \ | ||
136 | + bool sat = false; \ | ||
137 | + TYPE r = FN(m[H##LESIZE(le)], shift, &sat); \ | ||
138 | + mergemask(&d[H##ESIZE(le * 2 + TOP)], r, mask); \ | ||
139 | + qc |= sat && (mask & 1 << (TOP * ESIZE)); \ | ||
140 | + } \ | ||
141 | + if (qc) { \ | ||
142 | + env->vfp.qc[0] = qc; \ | ||
143 | + } \ | ||
144 | + mve_advance_vpt(env); \ | ||
145 | + } | 65 | + } |
146 | + | 66 | + |
147 | +#define DO_VSHRN_SAT_UB(BOP, TOP, FN) \ | 67 | if (!itsclass) { |
148 | + DO_VSHRN_SAT(BOP, false, 1, uint8_t, 2, uint16_t, FN) \ | 68 | /* Do nothing if not supported */ |
149 | + DO_VSHRN_SAT(TOP, true, 1, uint8_t, 2, uint16_t, FN) | 69 | return; |
70 | @@ -XXX,XX +XXX,XX @@ static void create_v2m(VirtMachineState *vms) | ||
71 | vms->msi_controller = VIRT_MSI_CTRL_GICV2M; | ||
72 | } | ||
73 | |||
74 | -static void create_gic(VirtMachineState *vms) | ||
75 | +static void create_gic(VirtMachineState *vms, MemoryRegion *mem) | ||
76 | { | ||
77 | MachineState *ms = MACHINE(vms); | ||
78 | /* We create a standalone GIC */ | ||
79 | @@ -XXX,XX +XXX,XX @@ static void create_gic(VirtMachineState *vms) | ||
80 | nb_redist_regions); | ||
81 | qdev_prop_set_uint32(vms->gic, "redist-region-count[0]", redist0_count); | ||
82 | |||
83 | + if (!kvm_irqchip_in_kernel()) { | ||
84 | + if (vms->tcg_its) { | ||
85 | + object_property_set_link(OBJECT(vms->gic), "sysmem", | ||
86 | + OBJECT(mem), &error_fatal); | ||
87 | + qdev_prop_set_bit(vms->gic, "has-lpi", true); | ||
88 | + } | ||
89 | + } | ||
150 | + | 90 | + |
151 | +#define DO_VSHRN_SAT_UH(BOP, TOP, FN) \ | 91 | if (nb_redist_regions == 2) { |
152 | + DO_VSHRN_SAT(BOP, false, 2, uint16_t, 4, uint32_t, FN) \ | 92 | uint32_t redist1_capacity = |
153 | + DO_VSHRN_SAT(TOP, true, 2, uint16_t, 4, uint32_t, FN) | 93 | vms->memmap[VIRT_HIGH_GIC_REDIST2].size / GICV3_REDIST_SIZE; |
94 | @@ -XXX,XX +XXX,XX @@ static void machvirt_init(MachineState *machine) | ||
95 | |||
96 | virt_flash_fdt(vms, sysmem, secure_sysmem ?: sysmem); | ||
97 | |||
98 | - create_gic(vms); | ||
99 | + create_gic(vms, sysmem); | ||
100 | |||
101 | virt_cpu_post_init(vms, sysmem); | ||
102 | |||
103 | @@ -XXX,XX +XXX,XX @@ static void virt_instance_init(Object *obj) | ||
104 | } else { | ||
105 | /* Default allows ITS instantiation */ | ||
106 | vms->its = true; | ||
154 | + | 107 | + |
155 | +#define DO_VSHRN_SAT_SB(BOP, TOP, FN) \ | 108 | + if (vmc->no_tcg_its) { |
156 | + DO_VSHRN_SAT(BOP, false, 1, int8_t, 2, int16_t, FN) \ | 109 | + vms->tcg_its = false; |
157 | + DO_VSHRN_SAT(TOP, true, 1, int8_t, 2, int16_t, FN) | 110 | + } else { |
111 | + vms->tcg_its = true; | ||
112 | + } | ||
113 | } | ||
114 | |||
115 | /* Default disallows iommu instantiation */ | ||
116 | @@ -XXX,XX +XXX,XX @@ DEFINE_VIRT_MACHINE_AS_LATEST(6, 2) | ||
117 | |||
118 | static void virt_machine_6_1_options(MachineClass *mc) | ||
119 | { | ||
120 | + VirtMachineClass *vmc = VIRT_MACHINE_CLASS(OBJECT_CLASS(mc)); | ||
158 | + | 121 | + |
159 | +#define DO_VSHRN_SAT_SH(BOP, TOP, FN) \ | 122 | virt_machine_6_2_options(mc); |
160 | + DO_VSHRN_SAT(BOP, false, 2, int16_t, 4, int32_t, FN) \ | 123 | compat_props_add(mc->compat_props, hw_compat_6_1, hw_compat_6_1_len); |
161 | + DO_VSHRN_SAT(TOP, true, 2, int16_t, 4, int32_t, FN) | ||
162 | + | 124 | + |
163 | +#define DO_SHRN_SB(N, M, SATP) \ | 125 | + /* qemu ITS was introduced with 6.2 */ |
164 | + do_sat_bhs((int64_t)(N) >> (M), INT8_MIN, INT8_MAX, SATP) | 126 | + vmc->no_tcg_its = true; |
165 | +#define DO_SHRN_UB(N, M, SATP) \ | 127 | } |
166 | + do_sat_bhs((uint64_t)(N) >> (M), 0, UINT8_MAX, SATP) | 128 | DEFINE_VIRT_MACHINE(6, 1) |
167 | +#define DO_SHRUN_B(N, M, SATP) \ | 129 | |
168 | + do_sat_bhs((int64_t)(N) >> (M), 0, UINT8_MAX, SATP) | ||
169 | + | ||
170 | +#define DO_SHRN_SH(N, M, SATP) \ | ||
171 | + do_sat_bhs((int64_t)(N) >> (M), INT16_MIN, INT16_MAX, SATP) | ||
172 | +#define DO_SHRN_UH(N, M, SATP) \ | ||
173 | + do_sat_bhs((uint64_t)(N) >> (M), 0, UINT16_MAX, SATP) | ||
174 | +#define DO_SHRUN_H(N, M, SATP) \ | ||
175 | + do_sat_bhs((int64_t)(N) >> (M), 0, UINT16_MAX, SATP) | ||
176 | + | ||
177 | +#define DO_RSHRN_SB(N, M, SATP) \ | ||
178 | + do_sat_bhs(do_srshr(N, M), INT8_MIN, INT8_MAX, SATP) | ||
179 | +#define DO_RSHRN_UB(N, M, SATP) \ | ||
180 | + do_sat_bhs(do_urshr(N, M), 0, UINT8_MAX, SATP) | ||
181 | +#define DO_RSHRUN_B(N, M, SATP) \ | ||
182 | + do_sat_bhs(do_srshr(N, M), 0, UINT8_MAX, SATP) | ||
183 | + | ||
184 | +#define DO_RSHRN_SH(N, M, SATP) \ | ||
185 | + do_sat_bhs(do_srshr(N, M), INT16_MIN, INT16_MAX, SATP) | ||
186 | +#define DO_RSHRN_UH(N, M, SATP) \ | ||
187 | + do_sat_bhs(do_urshr(N, M), 0, UINT16_MAX, SATP) | ||
188 | +#define DO_RSHRUN_H(N, M, SATP) \ | ||
189 | + do_sat_bhs(do_srshr(N, M), 0, UINT16_MAX, SATP) | ||
190 | + | ||
191 | +DO_VSHRN_SAT_SB(vqshrnb_sb, vqshrnt_sb, DO_SHRN_SB) | ||
192 | +DO_VSHRN_SAT_SH(vqshrnb_sh, vqshrnt_sh, DO_SHRN_SH) | ||
193 | +DO_VSHRN_SAT_UB(vqshrnb_ub, vqshrnt_ub, DO_SHRN_UB) | ||
194 | +DO_VSHRN_SAT_UH(vqshrnb_uh, vqshrnt_uh, DO_SHRN_UH) | ||
195 | +DO_VSHRN_SAT_SB(vqshrunbb, vqshruntb, DO_SHRUN_B) | ||
196 | +DO_VSHRN_SAT_SH(vqshrunbh, vqshrunth, DO_SHRUN_H) | ||
197 | + | ||
198 | +DO_VSHRN_SAT_SB(vqrshrnb_sb, vqrshrnt_sb, DO_RSHRN_SB) | ||
199 | +DO_VSHRN_SAT_SH(vqrshrnb_sh, vqrshrnt_sh, DO_RSHRN_SH) | ||
200 | +DO_VSHRN_SAT_UB(vqrshrnb_ub, vqrshrnt_ub, DO_RSHRN_UB) | ||
201 | +DO_VSHRN_SAT_UH(vqrshrnb_uh, vqrshrnt_uh, DO_RSHRN_UH) | ||
202 | +DO_VSHRN_SAT_SB(vqrshrunbb, vqrshruntb, DO_RSHRUN_B) | ||
203 | +DO_VSHRN_SAT_SH(vqrshrunbh, vqrshrunth, DO_RSHRUN_H) | ||
204 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
205 | index XXXXXXX..XXXXXXX 100644 | ||
206 | --- a/target/arm/translate-mve.c | ||
207 | +++ b/target/arm/translate-mve.c | ||
208 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT_N(VSHRNB, vshrnb) | ||
209 | DO_2SHIFT_N(VSHRNT, vshrnt) | ||
210 | DO_2SHIFT_N(VRSHRNB, vrshrnb) | ||
211 | DO_2SHIFT_N(VRSHRNT, vrshrnt) | ||
212 | +DO_2SHIFT_N(VQSHRNB_S, vqshrnb_s) | ||
213 | +DO_2SHIFT_N(VQSHRNT_S, vqshrnt_s) | ||
214 | +DO_2SHIFT_N(VQSHRNB_U, vqshrnb_u) | ||
215 | +DO_2SHIFT_N(VQSHRNT_U, vqshrnt_u) | ||
216 | +DO_2SHIFT_N(VQSHRUNB, vqshrunb) | ||
217 | +DO_2SHIFT_N(VQSHRUNT, vqshrunt) | ||
218 | +DO_2SHIFT_N(VQRSHRNB_S, vqrshrnb_s) | ||
219 | +DO_2SHIFT_N(VQRSHRNT_S, vqrshrnt_s) | ||
220 | +DO_2SHIFT_N(VQRSHRNB_U, vqrshrnb_u) | ||
221 | +DO_2SHIFT_N(VQRSHRNT_U, vqrshrnt_u) | ||
222 | +DO_2SHIFT_N(VQRSHRUNB, vqrshrunb) | ||
223 | +DO_2SHIFT_N(VQRSHRUNT, vqrshrunt) | ||
224 | -- | 130 | -- |
225 | 2.20.1 | 131 | 2.20.1 |
226 | 132 | ||
227 | 133 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | From: Shashi Mallela <shashi.mallela@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Add a test booting and quickly shutdown a raspi2 machine, | 3 | Updated expected IORT files applicable with latest GICv3 |
4 | to test the power management model: | 4 | ITS changes. |
5 | 5 | ||
6 | (1/1) tests/acceptance/boot_linux_console.py:BootLinuxConsole.test_arm_raspi2_initrd: | 6 | Full diff of new file disassembly: |
7 | console: [ 0.000000] Booting Linux on physical CPU 0xf00 | ||
8 | console: [ 0.000000] Linux version 4.14.98-v7+ (dom@dom-XPS-13-9370) (gcc version 4.9.3 (crosstool-NG crosstool-ng-1.22.0-88-g8460611)) #1200 SMP Tue Feb 12 20:27:48 GMT 2019 | ||
9 | console: [ 0.000000] CPU: ARMv7 Processor [410fc075] revision 5 (ARMv7), cr=10c5387d | ||
10 | console: [ 0.000000] CPU: div instructions available: patching division code | ||
11 | console: [ 0.000000] CPU: PIPT / VIPT nonaliasing data cache, VIPT aliasing instruction cache | ||
12 | console: [ 0.000000] OF: fdt: Machine model: Raspberry Pi 2 Model B | ||
13 | ... | ||
14 | console: Boot successful. | ||
15 | console: cat /proc/cpuinfo | ||
16 | console: / # cat /proc/cpuinfo | ||
17 | ... | ||
18 | console: processor : 3 | ||
19 | console: model name : ARMv7 Processor rev 5 (v7l) | ||
20 | console: BogoMIPS : 125.00 | ||
21 | console: Features : half thumb fastmult vfp edsp neon vfpv3 tls vfpv4 idiva idivt vfpd32 lpae evtstrm | ||
22 | console: CPU implementer : 0x41 | ||
23 | console: CPU architecture: 7 | ||
24 | console: CPU variant : 0x0 | ||
25 | console: CPU part : 0xc07 | ||
26 | console: CPU revision : 5 | ||
27 | console: Hardware : BCM2835 | ||
28 | console: Revision : 0000 | ||
29 | console: Serial : 0000000000000000 | ||
30 | console: cat /proc/iomem | ||
31 | console: / # cat /proc/iomem | ||
32 | console: 00000000-3bffffff : System RAM | ||
33 | console: 00008000-00afffff : Kernel code | ||
34 | console: 00c00000-00d468ef : Kernel data | ||
35 | console: 3f006000-3f006fff : dwc_otg | ||
36 | console: 3f007000-3f007eff : /soc/dma@7e007000 | ||
37 | console: 3f00b880-3f00b8bf : /soc/mailbox@7e00b880 | ||
38 | console: 3f100000-3f100027 : /soc/watchdog@7e100000 | ||
39 | console: 3f101000-3f102fff : /soc/cprman@7e101000 | ||
40 | console: 3f200000-3f2000b3 : /soc/gpio@7e200000 | ||
41 | PASS (24.59 s) | ||
42 | RESULTS : PASS 1 | ERROR 0 | FAIL 0 | SKIP 0 | WARN 0 | INTERRUPT 0 | CANCEL 0 | ||
43 | JOB TIME : 25.02 s | ||
44 | 7 | ||
45 | Signed-off-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | 8 | /* |
46 | Reviewed-by: Wainer dos Santos Moschetta <wainersm@redhat.com> | 9 | * Intel ACPI Component Architecture |
47 | Message-id: 20210531113837.1689775-1-f4bug@amsat.org | 10 | * AML/ASL+ Disassembler version 20180629 (64-bit version) |
11 | * Copyright (c) 2000 - 2018 Intel Corporation | ||
12 | * | ||
13 | * Disassembly of tests/data/acpi/virt/IORT.pxb, Tue Jun 29 17:35:38 2021 | ||
14 | * | ||
15 | * ACPI Data Table [IORT] | ||
16 | * | ||
17 | * Format: [HexOffset DecimalOffset ByteLength] FieldName : FieldValue | ||
18 | */ | ||
19 | |||
20 | [000h 0000 4] Signature : "IORT" [IO Remapping Table] | ||
21 | [004h 0004 4] Table Length : 0000007C | ||
22 | [008h 0008 1] Revision : 00 | ||
23 | [009h 0009 1] Checksum : 07 | ||
24 | [00Ah 0010 6] Oem ID : "BOCHS " | ||
25 | [010h 0016 8] Oem Table ID : "BXPC " | ||
26 | [018h 0024 4] Oem Revision : 00000001 | ||
27 | [01Ch 0028 4] Asl Compiler ID : "BXPC" | ||
28 | [020h 0032 4] Asl Compiler Revision : 00000001 | ||
29 | |||
30 | [024h 0036 4] Node Count : 00000002 | ||
31 | [028h 0040 4] Node Offset : 00000030 | ||
32 | [02Ch 0044 4] Reserved : 00000000 | ||
33 | |||
34 | [030h 0048 1] Type : 00 | ||
35 | [031h 0049 2] Length : 0018 | ||
36 | [033h 0051 1] Revision : 00 | ||
37 | [034h 0052 4] Reserved : 00000000 | ||
38 | [038h 0056 4] Mapping Count : 00000000 | ||
39 | [03Ch 0060 4] Mapping Offset : 00000000 | ||
40 | |||
41 | [040h 0064 4] ItsCount : 00000001 | ||
42 | [044h 0068 4] Identifiers : 00000000 | ||
43 | |||
44 | [048h 0072 1] Type : 02 | ||
45 | [049h 0073 2] Length : 0034 | ||
46 | [04Bh 0075 1] Revision : 00 | ||
47 | [04Ch 0076 4] Reserved : 00000000 | ||
48 | [050h 0080 4] Mapping Count : 00000001 | ||
49 | [054h 0084 4] Mapping Offset : 00000020 | ||
50 | |||
51 | [058h 0088 8] Memory Properties : [IORT Memory Access Properties] | ||
52 | [058h 0088 4] Cache Coherency : 00000001 | ||
53 | [05Ch 0092 1] Hints (decoded below) : 00 | ||
54 | Transient : 0 | ||
55 | Write Allocate : 0 | ||
56 | Read Allocate : 0 | ||
57 | Override : 0 | ||
58 | [05Dh 0093 2] Reserved : 0000 | ||
59 | [05Fh 0095 1] Memory Flags (decoded below) : 03 | ||
60 | Coherency : 1 | ||
61 | Device Attribute : 1 | ||
62 | [060h 0096 4] ATS Attribute : 00000000 | ||
63 | [064h 0100 4] PCI Segment Number : 00000000 | ||
64 | [068h 0104 1] Memory Size Limit : 00 | ||
65 | [069h 0105 3] Reserved : 000000 | ||
66 | |||
67 | [068h 0104 4] Input base : 00000000 | ||
68 | [06Ch 0108 4] ID Count : 0000FFFF | ||
69 | [070h 0112 4] Output Base : 00000000 | ||
70 | [074h 0116 4] Output Reference : 00000030 | ||
71 | [078h 0120 4] Flags (decoded below) : 00000000 | ||
72 | Single Mapping : 0 | ||
73 | |||
74 | Raw Table Data: Length 124 (0x7C) | ||
75 | |||
76 | 0000: 49 4F 52 54 7C 00 00 00 00 07 42 4F 43 48 53 20 // IORT|.....BOCHS | ||
77 | 0010: 42 58 50 43 20 20 20 20 01 00 00 00 42 58 50 43 // BXPC ....BXPC | ||
78 | 0020: 01 00 00 00 02 00 00 00 30 00 00 00 00 00 00 00 // ........0....... | ||
79 | 0030: 00 18 00 00 00 00 00 00 00 00 00 00 00 00 00 00 // ................ | ||
80 | 0040: 01 00 00 00 00 00 00 00 02 34 00 00 00 00 00 00 // .........4...... | ||
81 | 0050: 01 00 00 00 20 00 00 00 01 00 00 00 00 00 00 03 // .... ........... | ||
82 | 0060: 00 00 00 00 00 00 00 00 00 00 00 00 FF FF 00 00 // ................ | ||
83 | 0070: 00 00 00 00 30 00 00 00 00 00 00 00 // ....0....... | ||
84 | |||
85 | Signed-off-by: Shashi Mallela <shashi.mallela@linaro.org> | ||
86 | Acked-by: Igor Mammedov <imammedo@redhat.com> | ||
87 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
88 | Message-id: 20210910143951.92242-10-shashi.mallela@linaro.org | ||
48 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 89 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
49 | --- | 90 | --- |
50 | tests/acceptance/boot_linux_console.py | 43 ++++++++++++++++++++++++++ | 91 | tests/qtest/bios-tables-test-allowed-diff.h | 4 ---- |
51 | 1 file changed, 43 insertions(+) | 92 | tests/data/acpi/virt/IORT | Bin 0 -> 124 bytes |
93 | tests/data/acpi/virt/IORT.memhp | Bin 0 -> 124 bytes | ||
94 | tests/data/acpi/virt/IORT.numamem | Bin 0 -> 124 bytes | ||
95 | tests/data/acpi/virt/IORT.pxb | Bin 0 -> 124 bytes | ||
96 | 5 files changed, 4 deletions(-) | ||
52 | 97 | ||
53 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | 98 | diff --git a/tests/qtest/bios-tables-test-allowed-diff.h b/tests/qtest/bios-tables-test-allowed-diff.h |
54 | index XXXXXXX..XXXXXXX 100644 | 99 | index XXXXXXX..XXXXXXX 100644 |
55 | --- a/tests/acceptance/boot_linux_console.py | 100 | --- a/tests/qtest/bios-tables-test-allowed-diff.h |
56 | +++ b/tests/acceptance/boot_linux_console.py | 101 | +++ b/tests/qtest/bios-tables-test-allowed-diff.h |
57 | @@ -XXX,XX +XXX,XX @@ | 102 | @@ -1,5 +1 @@ |
58 | from avocado import skip | 103 | /* List of comma-separated changed AML files to ignore */ |
59 | from avocado import skipUnless | 104 | -"tests/data/acpi/virt/IORT", |
60 | from avocado_qemu import Test | 105 | -"tests/data/acpi/virt/IORT.memhp", |
61 | +from avocado_qemu import exec_command | 106 | -"tests/data/acpi/virt/IORT.numamem", |
62 | from avocado_qemu import exec_command_and_wait_for_pattern | 107 | -"tests/data/acpi/virt/IORT.pxb", |
63 | from avocado_qemu import interrupt_interactive_console_until_pattern | 108 | diff --git a/tests/data/acpi/virt/IORT b/tests/data/acpi/virt/IORT |
64 | from avocado_qemu import wait_for_console_pattern | 109 | index XXXXXXX..XXXXXXX 100644 |
65 | @@ -XXX,XX +XXX,XX @@ def test_arm_raspi2_uart0(self): | 110 | GIT binary patch |
66 | """ | 111 | literal 124 |
67 | self.do_test_arm_raspi2(0) | 112 | zcmebD4+^Pa00MR=e`k+i1*eDrX9XZ&1PX!JAesq?4S*O7Bw!2(4Uz`|CKCt^;wu0# |
68 | 113 | QRGb+i3L*dhhtM#y0PN=p0RR91 | |
69 | + def test_arm_raspi2_initrd(self): | 114 | |
70 | + """ | 115 | literal 0 |
71 | + :avocado: tags=arch:arm | 116 | HcmV?d00001 |
72 | + :avocado: tags=machine:raspi2 | 117 | |
73 | + """ | 118 | diff --git a/tests/data/acpi/virt/IORT.memhp b/tests/data/acpi/virt/IORT.memhp |
74 | + deb_url = ('http://archive.raspberrypi.org/debian/' | 119 | index XXXXXXX..XXXXXXX 100644 |
75 | + 'pool/main/r/raspberrypi-firmware/' | 120 | GIT binary patch |
76 | + 'raspberrypi-kernel_1.20190215-1_armhf.deb') | 121 | literal 124 |
77 | + deb_hash = 'cd284220b32128c5084037553db3c482426f3972' | 122 | zcmebD4+^Pa00MR=e`k+i1*eDrX9XZ&1PX!JAesq?4S*O7Bw!2(4Uz`|CKCt^;wu0# |
78 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | 123 | QRGb+i3L*dhhtM#y0PN=p0RR91 |
79 | + kernel_path = self.extract_from_deb(deb_path, '/boot/kernel7.img') | 124 | |
80 | + dtb_path = self.extract_from_deb(deb_path, '/boot/bcm2709-rpi-2-b.dtb') | 125 | literal 0 |
81 | + | 126 | HcmV?d00001 |
82 | + initrd_url = ('https://github.com/groeck/linux-build-test/raw/' | 127 | |
83 | + '2eb0a73b5d5a28df3170c546ddaaa9757e1e0848/rootfs/' | 128 | diff --git a/tests/data/acpi/virt/IORT.numamem b/tests/data/acpi/virt/IORT.numamem |
84 | + 'arm/rootfs-armv7a.cpio.gz') | 129 | index XXXXXXX..XXXXXXX 100644 |
85 | + initrd_hash = '604b2e45cdf35045846b8bbfbf2129b1891bdc9c' | 130 | GIT binary patch |
86 | + initrd_path_gz = self.fetch_asset(initrd_url, asset_hash=initrd_hash) | 131 | literal 124 |
87 | + initrd_path = os.path.join(self.workdir, 'rootfs.cpio') | 132 | zcmebD4+^Pa00MR=e`k+i1*eDrX9XZ&1PX!JAesq?4S*O7Bw!2(4Uz`|CKCt^;wu0# |
88 | + archive.gzip_uncompress(initrd_path_gz, initrd_path) | 133 | QRGb+i3L*dhhtM#y0PN=p0RR91 |
89 | + | 134 | |
90 | + self.vm.set_console() | 135 | literal 0 |
91 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | 136 | HcmV?d00001 |
92 | + 'earlycon=pl011,0x3f201000 console=ttyAMA0 ' | 137 | |
93 | + 'panic=-1 noreboot ' + | 138 | diff --git a/tests/data/acpi/virt/IORT.pxb b/tests/data/acpi/virt/IORT.pxb |
94 | + 'dwc_otg.fiq_fsm_enable=0') | 139 | index XXXXXXX..XXXXXXX 100644 |
95 | + self.vm.add_args('-kernel', kernel_path, | 140 | GIT binary patch |
96 | + '-dtb', dtb_path, | 141 | literal 124 |
97 | + '-initrd', initrd_path, | 142 | zcmebD4+^Pa00MR=e`k+i1*eDrX9XZ&1PX!JAesq?4S*O7Bw!2(4Uz`|CKCt^;wu0# |
98 | + '-append', kernel_command_line, | 143 | QRGb+i3L*dhhtM#y0PN=p0RR91 |
99 | + '-no-reboot') | 144 | |
100 | + self.vm.launch() | 145 | literal 0 |
101 | + self.wait_for_console_pattern('Boot successful.') | 146 | HcmV?d00001 |
102 | + | 147 | |
103 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | ||
104 | + 'BCM2835') | ||
105 | + exec_command_and_wait_for_pattern(self, 'cat /proc/iomem', | ||
106 | + '/soc/cprman@7e101000') | ||
107 | + exec_command(self, 'halt') | ||
108 | + # Wait for VM to shut down gracefully | ||
109 | + self.vm.wait() | ||
110 | + | ||
111 | def test_arm_exynos4210_initrd(self): | ||
112 | """ | ||
113 | :avocado: tags=arch:arm | ||
114 | -- | 148 | -- |
115 | 2.20.1 | 149 | 2.20.1 |
116 | 150 | ||
117 | 151 | diff view generated by jsdifflib |
1 | Implement the MVE shifts by immediate, which perform shifts | 1 | In v8A, the PSTATE.IL bit is set for various kinds of illegal |
---|---|---|---|
2 | on a single general-purpose register. | 2 | exception return or mode-change attempts. We already set PSTATE.IL |
3 | (or its AArch32 equivalent CPSR.IL) in all those cases, but we | ||
4 | weren't implementing the part of the behaviour where attempting to | ||
5 | execute an instruction with PSTATE.IL takes an immediate exception | ||
6 | with an appropriate syndrome value. | ||
3 | 7 | ||
4 | These patterns overlap with the long-shift-by-immediates, | 8 | Add a new TB flags bit tracking PSTATE.IL/CPSR.IL, and generate code |
5 | so we have to rearrange the grouping a little here. | 9 | to take an exception instead of whatever the instruction would have |
10 | been. | ||
11 | |||
12 | PSTATE.IL and CPSR.IL change only on exception entry, attempted | ||
13 | exception exit, and various AArch32 mode changes via cpsr_write(). | ||
14 | These places generally already rebuild the hflags, so the only place | ||
15 | we need an extra rebuild_hflags call is in the illegal-return | ||
16 | codepath of the AArch64 exception_return helper. | ||
6 | 17 | ||
7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 18 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
19 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 20 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
9 | Message-id: 20210628135835.6690-18-peter.maydell@linaro.org | 21 | Message-id: 20210821195958.41312-2-richard.henderson@linaro.org |
22 | Message-Id: <20210817162118.24319-1-peter.maydell@linaro.org> | ||
23 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
24 | [rth: Added missing returns; set IL bit in syndrome] | ||
25 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | --- | 26 | --- |
11 | target/arm/helper-mve.h | 3 ++ | 27 | target/arm/cpu.h | 1 + |
12 | target/arm/translate.h | 1 + | 28 | target/arm/syndrome.h | 5 +++++ |
13 | target/arm/t32.decode | 31 ++++++++++++++----- | 29 | target/arm/translate.h | 2 ++ |
14 | target/arm/mve_helper.c | 10 ++++++ | 30 | target/arm/helper-a64.c | 1 + |
15 | target/arm/translate.c | 68 +++++++++++++++++++++++++++++++++++++++-- | 31 | target/arm/helper.c | 8 ++++++++ |
16 | 5 files changed, 104 insertions(+), 9 deletions(-) | 32 | target/arm/translate-a64.c | 11 +++++++++++ |
33 | target/arm/translate.c | 21 +++++++++++++++++++++ | ||
34 | 7 files changed, 49 insertions(+) | ||
17 | 35 | ||
18 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 36 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
19 | index XXXXXXX..XXXXXXX 100644 | 37 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/helper-mve.h | 38 | --- a/target/arm/cpu.h |
21 | +++ b/target/arm/helper-mve.h | 39 | +++ b/target/arm/cpu.h |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_sqrshrl, TCG_CALL_NO_RWG, i64, env, i64, i32) | 40 | @@ -XXX,XX +XXX,XX @@ FIELD(TBFLAG_ANY, FPEXC_EL, 8, 2) |
23 | DEF_HELPER_FLAGS_3(mve_uqrshll, TCG_CALL_NO_RWG, i64, env, i64, i32) | 41 | FIELD(TBFLAG_ANY, DEBUG_TARGET_EL, 10, 2) |
24 | DEF_HELPER_FLAGS_3(mve_sqrshrl48, TCG_CALL_NO_RWG, i64, env, i64, i32) | 42 | /* Memory operations require alignment: SCTLR_ELx.A or CCR.UNALIGN_TRP */ |
25 | DEF_HELPER_FLAGS_3(mve_uqrshll48, TCG_CALL_NO_RWG, i64, env, i64, i32) | 43 | FIELD(TBFLAG_ANY, ALIGN_MEM, 12, 1) |
44 | +FIELD(TBFLAG_ANY, PSTATE__IL, 13, 1) | ||
45 | |||
46 | /* | ||
47 | * Bit usage when in AArch32 state, both A- and M-profile. | ||
48 | diff --git a/target/arm/syndrome.h b/target/arm/syndrome.h | ||
49 | index XXXXXXX..XXXXXXX 100644 | ||
50 | --- a/target/arm/syndrome.h | ||
51 | +++ b/target/arm/syndrome.h | ||
52 | @@ -XXX,XX +XXX,XX @@ static inline uint32_t syn_wfx(int cv, int cond, int ti, bool is_16bit) | ||
53 | (cv << 24) | (cond << 20) | ti; | ||
54 | } | ||
55 | |||
56 | +static inline uint32_t syn_illegalstate(void) | ||
57 | +{ | ||
58 | + return (EC_ILLEGALSTATE << ARM_EL_EC_SHIFT) | ARM_EL_IL; | ||
59 | +} | ||
26 | + | 60 | + |
27 | +DEF_HELPER_FLAGS_3(mve_uqshl, TCG_CALL_NO_RWG, i32, env, i32, i32) | 61 | #endif /* TARGET_ARM_SYNDROME_H */ |
28 | +DEF_HELPER_FLAGS_3(mve_sqshl, TCG_CALL_NO_RWG, i32, env, i32, i32) | ||
29 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 62 | diff --git a/target/arm/translate.h b/target/arm/translate.h |
30 | index XXXXXXX..XXXXXXX 100644 | 63 | index XXXXXXX..XXXXXXX 100644 |
31 | --- a/target/arm/translate.h | 64 | --- a/target/arm/translate.h |
32 | +++ b/target/arm/translate.h | 65 | +++ b/target/arm/translate.h |
33 | @@ -XXX,XX +XXX,XX @@ typedef void CryptoThreeOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr); | 66 | @@ -XXX,XX +XXX,XX @@ typedef struct DisasContext { |
34 | typedef void AtomicThreeOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGArg, MemOp); | 67 | bool hstr_active; |
35 | typedef void WideShiftImmFn(TCGv_i64, TCGv_i64, int64_t shift); | 68 | /* True if memory operations require alignment */ |
36 | typedef void WideShiftFn(TCGv_i64, TCGv_ptr, TCGv_i64, TCGv_i32); | 69 | bool align_mem; |
37 | +typedef void ShiftImmFn(TCGv_i32, TCGv_i32, int32_t shift); | 70 | + /* True if PSTATE.IL is set */ |
38 | 71 | + bool pstate_il; | |
39 | /** | 72 | /* |
40 | * arm_tbflags_from_tb: | 73 | * >= 0, a copy of PSTATE.BTYPE, which will be 0 without v8.5-BTI. |
41 | diff --git a/target/arm/t32.decode b/target/arm/t32.decode | 74 | * < 0, set by the current instruction. |
75 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | ||
42 | index XXXXXXX..XXXXXXX 100644 | 76 | index XXXXXXX..XXXXXXX 100644 |
43 | --- a/target/arm/t32.decode | 77 | --- a/target/arm/helper-a64.c |
44 | +++ b/target/arm/t32.decode | 78 | +++ b/target/arm/helper-a64.c |
45 | @@ -XXX,XX +XXX,XX @@ | 79 | @@ -XXX,XX +XXX,XX @@ illegal_return: |
46 | 80 | if (!arm_singlestep_active(env)) { | |
47 | &mve_shl_ri rdalo rdahi shim | 81 | env->pstate &= ~PSTATE_SS; |
48 | &mve_shl_rr rdalo rdahi rm | 82 | } |
49 | +&mve_sh_ri rda shim | 83 | + helper_rebuild_hflags_a64(env, cur_el); |
50 | 84 | qemu_log_mask(LOG_GUEST_ERROR, "Illegal exception return at EL%d: " | |
51 | # rdahi: bits [3:1] from insn, bit 0 is 1 | 85 | "resuming execution at 0x%" PRIx64 "\n", cur_el, env->pc); |
52 | # rdalo: bits [3:1] from insn, bit 0 is 0 | 86 | } |
53 | @@ -XXX,XX +XXX,XX @@ | 87 | diff --git a/target/arm/helper.c b/target/arm/helper.c |
54 | &mve_shl_ri shim=%imm5_12_6 rdalo=%rdalo_17 rdahi=%rdahi_9 | 88 | index XXXXXXX..XXXXXXX 100644 |
55 | @mve_shl_rr ....... .... . ... . rm:4 ... . .. .. .... \ | 89 | --- a/target/arm/helper.c |
56 | &mve_shl_rr rdalo=%rdalo_17 rdahi=%rdahi_9 | 90 | +++ b/target/arm/helper.c |
57 | +@mve_sh_ri ....... .... . rda:4 . ... ... . .. .. .... \ | 91 | @@ -XXX,XX +XXX,XX @@ static CPUARMTBFlags rebuild_hflags_a32(CPUARMState *env, int fp_el, |
58 | + &mve_sh_ri shim=%imm5_12_6 | 92 | DP_TBFLAG_A32(flags, HSTR_ACTIVE, 1); |
59 | 93 | } | |
60 | { | 94 | |
61 | TST_xrri 1110101 0000 1 .... 0 ... 1111 .... .... @S_xrr_shi | 95 | + if (env->uncached_cpsr & CPSR_IL) { |
62 | @@ -XXX,XX +XXX,XX @@ BIC_rrri 1110101 0001 . .... 0 ... .... .... .... @s_rrr_shi | 96 | + DP_TBFLAG_ANY(flags, PSTATE__IL, 1); |
63 | # the rest fall through (where ORR_rrri and MOV_rxri will end up | ||
64 | # handling them as r13 and r15 accesses with the same semantics as A32). | ||
65 | [ | ||
66 | - LSLL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
67 | - LSRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
68 | - ASRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 10 1111 @mve_shl_ri | ||
69 | + { | ||
70 | + UQSHL_ri 1110101 0010 1 .... 0 ... 1111 .. 00 1111 @mve_sh_ri | ||
71 | + LSLL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
72 | + UQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
73 | + } | ||
74 | |||
75 | - UQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 00 1111 @mve_shl_ri | ||
76 | - URSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
77 | - SRSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 10 1111 @mve_shl_ri | ||
78 | - SQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 11 1111 @mve_shl_ri | ||
79 | + { | ||
80 | + URSHR_ri 1110101 0010 1 .... 0 ... 1111 .. 01 1111 @mve_sh_ri | ||
81 | + LSRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
82 | + URSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 01 1111 @mve_shl_ri | ||
83 | + } | 97 | + } |
84 | + | 98 | + |
85 | + { | 99 | return rebuild_hflags_common_32(env, fp_el, mmu_idx, flags); |
86 | + SRSHR_ri 1110101 0010 1 .... 0 ... 1111 .. 10 1111 @mve_sh_ri | 100 | } |
87 | + ASRL_ri 1110101 0010 1 ... 0 0 ... ... 1 .. 10 1111 @mve_shl_ri | 101 | |
88 | + SRSHRL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 10 1111 @mve_shl_ri | 102 | @@ -XXX,XX +XXX,XX @@ static CPUARMTBFlags rebuild_hflags_a64(CPUARMState *env, int el, int fp_el, |
103 | } | ||
104 | } | ||
105 | |||
106 | + if (env->pstate & PSTATE_IL) { | ||
107 | + DP_TBFLAG_ANY(flags, PSTATE__IL, 1); | ||
89 | + } | 108 | + } |
90 | + | 109 | + |
91 | + { | 110 | if (cpu_isar_feature(aa64_mte, env_archcpu(env))) { |
92 | + SQSHL_ri 1110101 0010 1 .... 0 ... 1111 .. 11 1111 @mve_sh_ri | 111 | /* |
93 | + SQSHLL_ri 1110101 0010 1 ... 1 0 ... ... 1 .. 11 1111 @mve_shl_ri | 112 | * Set MTE_ACTIVE if any access may be Checked, and leave clear |
113 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
114 | index XXXXXXX..XXXXXXX 100644 | ||
115 | --- a/target/arm/translate-a64.c | ||
116 | +++ b/target/arm/translate-a64.c | ||
117 | @@ -XXX,XX +XXX,XX @@ static void disas_a64_insn(CPUARMState *env, DisasContext *s) | ||
118 | s->fp_access_checked = false; | ||
119 | s->sve_access_checked = false; | ||
120 | |||
121 | + if (s->pstate_il) { | ||
122 | + /* | ||
123 | + * Illegal execution state. This has priority over BTI | ||
124 | + * exceptions, but comes after instruction abort exceptions. | ||
125 | + */ | ||
126 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
127 | + syn_illegalstate(), default_exception_el(s)); | ||
128 | + return; | ||
94 | + } | 129 | + } |
95 | |||
96 | LSLL_rr 1110101 0010 1 ... 0 .... ... 1 0000 1101 @mve_shl_rr | ||
97 | ASRL_rr 1110101 0010 1 ... 0 .... ... 1 0010 1101 @mve_shl_rr | ||
98 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
99 | index XXXXXXX..XXXXXXX 100644 | ||
100 | --- a/target/arm/mve_helper.c | ||
101 | +++ b/target/arm/mve_helper.c | ||
102 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(mve_uqrshll48)(CPUARMState *env, uint64_t n, uint32_t shift) | ||
103 | { | ||
104 | return do_uqrshl48_d(n, (int8_t)shift, true, &env->QF); | ||
105 | } | ||
106 | + | 130 | + |
107 | +uint32_t HELPER(mve_uqshl)(CPUARMState *env, uint32_t n, uint32_t shift) | 131 | if (dc_isar_feature(aa64_bti, s)) { |
108 | +{ | 132 | if (s->base.num_insns == 1) { |
109 | + return do_uqrshl_bhs(n, (int8_t)shift, 32, false, &env->QF); | 133 | /* |
110 | +} | 134 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_init_disas_context(DisasContextBase *dcbase, |
111 | + | 135 | #endif |
112 | +uint32_t HELPER(mve_sqshl)(CPUARMState *env, uint32_t n, uint32_t shift) | 136 | dc->fp_excp_el = EX_TBFLAG_ANY(tb_flags, FPEXC_EL); |
113 | +{ | 137 | dc->align_mem = EX_TBFLAG_ANY(tb_flags, ALIGN_MEM); |
114 | + return do_sqrshl_bhs(n, (int8_t)shift, 32, false, &env->QF); | 138 | + dc->pstate_il = EX_TBFLAG_ANY(tb_flags, PSTATE__IL); |
115 | +} | 139 | dc->sve_excp_el = EX_TBFLAG_A64(tb_flags, SVEEXC_EL); |
140 | dc->sve_len = (EX_TBFLAG_A64(tb_flags, ZCR_LEN) + 1) * 16; | ||
141 | dc->pauth_active = EX_TBFLAG_A64(tb_flags, PAUTH_ACTIVE); | ||
116 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 142 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
117 | index XXXXXXX..XXXXXXX 100644 | 143 | index XXXXXXX..XXXXXXX 100644 |
118 | --- a/target/arm/translate.c | 144 | --- a/target/arm/translate.c |
119 | +++ b/target/arm/translate.c | 145 | +++ b/target/arm/translate.c |
120 | @@ -XXX,XX +XXX,XX @@ static void gen_srshr16_i64(TCGv_i64 d, TCGv_i64 a, int64_t sh) | 146 | @@ -XXX,XX +XXX,XX @@ static void disas_arm_insn(DisasContext *s, unsigned int insn) |
121 | 147 | return; | |
122 | static void gen_srshr32_i32(TCGv_i32 d, TCGv_i32 a, int32_t sh) | 148 | } |
123 | { | 149 | |
124 | - TCGv_i32 t = tcg_temp_new_i32(); | 150 | + if (s->pstate_il) { |
125 | + TCGv_i32 t; | 151 | + /* |
126 | 152 | + * Illegal execution state. This has priority over BTI | |
127 | + /* Handle shift by the input size for the benefit of trans_SRSHR_ri */ | 153 | + * exceptions, but comes after instruction abort exceptions. |
128 | + if (sh == 32) { | 154 | + */ |
129 | + tcg_gen_movi_i32(d, 0); | 155 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, |
156 | + syn_illegalstate(), default_exception_el(s)); | ||
130 | + return; | 157 | + return; |
131 | + } | 158 | + } |
132 | + t = tcg_temp_new_i32(); | 159 | + |
133 | tcg_gen_extract_i32(t, a, sh - 1, 1); | 160 | if (cond == 0xf) { |
134 | tcg_gen_sari_i32(d, a, sh); | 161 | /* In ARMv3 and v4 the NV condition is UNPREDICTABLE; we |
135 | tcg_gen_add_i32(d, d, t); | 162 | * choose to UNDEF. In ARMv5 and above the space is used |
136 | @@ -XXX,XX +XXX,XX @@ static void gen_urshr16_i64(TCGv_i64 d, TCGv_i64 a, int64_t sh) | 163 | @@ -XXX,XX +XXX,XX @@ static void arm_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs) |
137 | 164 | #endif | |
138 | static void gen_urshr32_i32(TCGv_i32 d, TCGv_i32 a, int32_t sh) | 165 | dc->fp_excp_el = EX_TBFLAG_ANY(tb_flags, FPEXC_EL); |
139 | { | 166 | dc->align_mem = EX_TBFLAG_ANY(tb_flags, ALIGN_MEM); |
140 | - TCGv_i32 t = tcg_temp_new_i32(); | 167 | + dc->pstate_il = EX_TBFLAG_ANY(tb_flags, PSTATE__IL); |
141 | + TCGv_i32 t; | 168 | |
142 | 169 | if (arm_feature(env, ARM_FEATURE_M)) { | |
143 | + /* Handle shift by the input size for the benefit of trans_URSHR_ri */ | 170 | dc->vfp_enabled = 1; |
144 | + if (sh == 32) { | 171 | @@ -XXX,XX +XXX,XX @@ static void thumb_tr_translate_insn(DisasContextBase *dcbase, CPUState *cpu) |
145 | + tcg_gen_extract_i32(d, a, sh - 1, 1); | 172 | } |
173 | dc->insn = insn; | ||
174 | |||
175 | + if (dc->pstate_il) { | ||
176 | + /* | ||
177 | + * Illegal execution state. This has priority over BTI | ||
178 | + * exceptions, but comes after instruction abort exceptions. | ||
179 | + */ | ||
180 | + gen_exception_insn(dc, dc->pc_curr, EXCP_UDEF, | ||
181 | + syn_illegalstate(), default_exception_el(dc)); | ||
146 | + return; | 182 | + return; |
147 | + } | 183 | + } |
148 | + t = tcg_temp_new_i32(); | ||
149 | tcg_gen_extract_i32(t, a, sh - 1, 1); | ||
150 | tcg_gen_shri_i32(d, a, sh); | ||
151 | tcg_gen_add_i32(d, d, t); | ||
152 | @@ -XXX,XX +XXX,XX @@ static bool trans_SQRSHRL48_rr(DisasContext *s, arg_mve_shl_rr *a) | ||
153 | return do_mve_shl_rr(s, a, gen_helper_mve_sqrshrl48); | ||
154 | } | ||
155 | |||
156 | +static bool do_mve_sh_ri(DisasContext *s, arg_mve_sh_ri *a, ShiftImmFn *fn) | ||
157 | +{ | ||
158 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_1M)) { | ||
159 | + /* Decode falls through to ORR/MOV UNPREDICTABLE handling */ | ||
160 | + return false; | ||
161 | + } | ||
162 | + if (!dc_isar_feature(aa32_mve, s) || | ||
163 | + !arm_dc_feature(s, ARM_FEATURE_M_MAIN) || | ||
164 | + a->rda == 13 || a->rda == 15) { | ||
165 | + /* These rda cases are UNPREDICTABLE; we choose to UNDEF */ | ||
166 | + unallocated_encoding(s); | ||
167 | + return true; | ||
168 | + } | ||
169 | + | 184 | + |
170 | + if (a->shim == 0) { | 185 | if (dc->eci) { |
171 | + a->shim = 32; | 186 | /* |
172 | + } | 187 | * For M-profile continuable instructions, ECI/ICI handling |
173 | + fn(cpu_R[a->rda], cpu_R[a->rda], a->shim); | ||
174 | + | ||
175 | + return true; | ||
176 | +} | ||
177 | + | ||
178 | +static bool trans_URSHR_ri(DisasContext *s, arg_mve_sh_ri *a) | ||
179 | +{ | ||
180 | + return do_mve_sh_ri(s, a, gen_urshr32_i32); | ||
181 | +} | ||
182 | + | ||
183 | +static bool trans_SRSHR_ri(DisasContext *s, arg_mve_sh_ri *a) | ||
184 | +{ | ||
185 | + return do_mve_sh_ri(s, a, gen_srshr32_i32); | ||
186 | +} | ||
187 | + | ||
188 | +static void gen_mve_sqshl(TCGv_i32 r, TCGv_i32 n, int32_t shift) | ||
189 | +{ | ||
190 | + gen_helper_mve_sqshl(r, cpu_env, n, tcg_constant_i32(shift)); | ||
191 | +} | ||
192 | + | ||
193 | +static bool trans_SQSHL_ri(DisasContext *s, arg_mve_sh_ri *a) | ||
194 | +{ | ||
195 | + return do_mve_sh_ri(s, a, gen_mve_sqshl); | ||
196 | +} | ||
197 | + | ||
198 | +static void gen_mve_uqshl(TCGv_i32 r, TCGv_i32 n, int32_t shift) | ||
199 | +{ | ||
200 | + gen_helper_mve_uqshl(r, cpu_env, n, tcg_constant_i32(shift)); | ||
201 | +} | ||
202 | + | ||
203 | +static bool trans_UQSHL_ri(DisasContext *s, arg_mve_sh_ri *a) | ||
204 | +{ | ||
205 | + return do_mve_sh_ri(s, a, gen_mve_uqshl); | ||
206 | +} | ||
207 | + | ||
208 | /* | ||
209 | * Multiply and multiply accumulate | ||
210 | */ | ||
211 | -- | 188 | -- |
212 | 2.20.1 | 189 | 2.20.1 |
213 | 190 | ||
214 | 191 | diff view generated by jsdifflib |
1 | Use dup_const() instead of bitfield_replicate() in | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | disas_simd_mod_imm(). | 2 | |
3 | 3 | It is confusing to have different exits from translation | |
4 | (We can't replace the other use of bitfield_replicate() in this file, | 4 | for various conditions in separate functions. |
5 | in logic_imm_decode_wmask(), because that location needs to handle 2 | 5 | |
6 | and 4 bit elements, which dup_const() cannot.) | 6 | Merge disas_a64_insn into its only caller. Standardize |
7 | 7 | on the "s" name for the DisasContext, as the code from | |
8 | disas_a64_insn had more instances. | ||
9 | |||
10 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
12 | Message-id: 20210821195958.41312-3-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | Message-id: 20210628135835.6690-6-peter.maydell@linaro.org | ||
11 | --- | 14 | --- |
12 | target/arm/translate-a64.c | 2 +- | 15 | target/arm/translate-a64.c | 224 ++++++++++++++++++------------------- |
13 | 1 file changed, 1 insertion(+), 1 deletion(-) | 16 | 1 file changed, 109 insertions(+), 115 deletions(-) |
14 | 17 | ||
15 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 18 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate-a64.c | 20 | --- a/target/arm/translate-a64.c |
18 | +++ b/target/arm/translate-a64.c | 21 | +++ b/target/arm/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | 22 | @@ -XXX,XX +XXX,XX @@ static bool btype_destination_ok(uint32_t insn, bool bt, int btype) |
20 | /* FMOV (vector, immediate) - half-precision */ | 23 | return false; |
21 | imm = vfp_expand_imm(MO_16, abcdefgh); | 24 | } |
22 | /* now duplicate across the lanes */ | 25 | |
23 | - imm = bitfield_replicate(imm, 16); | 26 | -/* C3.1 A64 instruction index by encoding */ |
24 | + imm = dup_const(MO_16, imm); | 27 | -static void disas_a64_insn(CPUARMState *env, DisasContext *s) |
25 | } else { | 28 | -{ |
26 | imm = asimd_imm_const(abcdefgh, cmode, is_neg); | 29 | - uint32_t insn; |
30 | - | ||
31 | - s->pc_curr = s->base.pc_next; | ||
32 | - insn = arm_ldl_code(env, s->base.pc_next, s->sctlr_b); | ||
33 | - s->insn = insn; | ||
34 | - s->base.pc_next += 4; | ||
35 | - | ||
36 | - s->fp_access_checked = false; | ||
37 | - s->sve_access_checked = false; | ||
38 | - | ||
39 | - if (s->pstate_il) { | ||
40 | - /* | ||
41 | - * Illegal execution state. This has priority over BTI | ||
42 | - * exceptions, but comes after instruction abort exceptions. | ||
43 | - */ | ||
44 | - gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
45 | - syn_illegalstate(), default_exception_el(s)); | ||
46 | - return; | ||
47 | - } | ||
48 | - | ||
49 | - if (dc_isar_feature(aa64_bti, s)) { | ||
50 | - if (s->base.num_insns == 1) { | ||
51 | - /* | ||
52 | - * At the first insn of the TB, compute s->guarded_page. | ||
53 | - * We delayed computing this until successfully reading | ||
54 | - * the first insn of the TB, above. This (mostly) ensures | ||
55 | - * that the softmmu tlb entry has been populated, and the | ||
56 | - * page table GP bit is available. | ||
57 | - * | ||
58 | - * Note that we need to compute this even if btype == 0, | ||
59 | - * because this value is used for BR instructions later | ||
60 | - * where ENV is not available. | ||
61 | - */ | ||
62 | - s->guarded_page = is_guarded_page(env, s); | ||
63 | - | ||
64 | - /* First insn can have btype set to non-zero. */ | ||
65 | - tcg_debug_assert(s->btype >= 0); | ||
66 | - | ||
67 | - /* | ||
68 | - * Note that the Branch Target Exception has fairly high | ||
69 | - * priority -- below debugging exceptions but above most | ||
70 | - * everything else. This allows us to handle this now | ||
71 | - * instead of waiting until the insn is otherwise decoded. | ||
72 | - */ | ||
73 | - if (s->btype != 0 | ||
74 | - && s->guarded_page | ||
75 | - && !btype_destination_ok(insn, s->bt, s->btype)) { | ||
76 | - gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
77 | - syn_btitrap(s->btype), | ||
78 | - default_exception_el(s)); | ||
79 | - return; | ||
80 | - } | ||
81 | - } else { | ||
82 | - /* Not the first insn: btype must be 0. */ | ||
83 | - tcg_debug_assert(s->btype == 0); | ||
84 | - } | ||
85 | - } | ||
86 | - | ||
87 | - switch (extract32(insn, 25, 4)) { | ||
88 | - case 0x0: case 0x1: case 0x3: /* UNALLOCATED */ | ||
89 | - unallocated_encoding(s); | ||
90 | - break; | ||
91 | - case 0x2: | ||
92 | - if (!dc_isar_feature(aa64_sve, s) || !disas_sve(s, insn)) { | ||
93 | - unallocated_encoding(s); | ||
94 | - } | ||
95 | - break; | ||
96 | - case 0x8: case 0x9: /* Data processing - immediate */ | ||
97 | - disas_data_proc_imm(s, insn); | ||
98 | - break; | ||
99 | - case 0xa: case 0xb: /* Branch, exception generation and system insns */ | ||
100 | - disas_b_exc_sys(s, insn); | ||
101 | - break; | ||
102 | - case 0x4: | ||
103 | - case 0x6: | ||
104 | - case 0xc: | ||
105 | - case 0xe: /* Loads and stores */ | ||
106 | - disas_ldst(s, insn); | ||
107 | - break; | ||
108 | - case 0x5: | ||
109 | - case 0xd: /* Data processing - register */ | ||
110 | - disas_data_proc_reg(s, insn); | ||
111 | - break; | ||
112 | - case 0x7: | ||
113 | - case 0xf: /* Data processing - SIMD and floating point */ | ||
114 | - disas_data_proc_simd_fp(s, insn); | ||
115 | - break; | ||
116 | - default: | ||
117 | - assert(FALSE); /* all 15 cases should be handled above */ | ||
118 | - break; | ||
119 | - } | ||
120 | - | ||
121 | - /* if we allocated any temporaries, free them here */ | ||
122 | - free_tmp_a64(s); | ||
123 | - | ||
124 | - /* | ||
125 | - * After execution of most insns, btype is reset to 0. | ||
126 | - * Note that we set btype == -1 when the insn sets btype. | ||
127 | - */ | ||
128 | - if (s->btype > 0 && s->base.is_jmp != DISAS_NORETURN) { | ||
129 | - reset_btype(s); | ||
130 | - } | ||
131 | -} | ||
132 | - | ||
133 | static void aarch64_tr_init_disas_context(DisasContextBase *dcbase, | ||
134 | CPUState *cpu) | ||
135 | { | ||
136 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_insn_start(DisasContextBase *dcbase, CPUState *cpu) | ||
137 | |||
138 | static void aarch64_tr_translate_insn(DisasContextBase *dcbase, CPUState *cpu) | ||
139 | { | ||
140 | - DisasContext *dc = container_of(dcbase, DisasContext, base); | ||
141 | + DisasContext *s = container_of(dcbase, DisasContext, base); | ||
142 | CPUARMState *env = cpu->env_ptr; | ||
143 | + uint32_t insn; | ||
144 | |||
145 | - if (dc->ss_active && !dc->pstate_ss) { | ||
146 | + if (s->ss_active && !s->pstate_ss) { | ||
147 | /* Singlestep state is Active-pending. | ||
148 | * If we're in this state at the start of a TB then either | ||
149 | * a) we just took an exception to an EL which is being debugged | ||
150 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_translate_insn(DisasContextBase *dcbase, CPUState *cpu) | ||
151 | * "did not step an insn" case, and so the syndrome ISV and EX | ||
152 | * bits should be zero. | ||
153 | */ | ||
154 | - assert(dc->base.num_insns == 1); | ||
155 | - gen_swstep_exception(dc, 0, 0); | ||
156 | - dc->base.is_jmp = DISAS_NORETURN; | ||
157 | - } else { | ||
158 | - disas_a64_insn(env, dc); | ||
159 | + assert(s->base.num_insns == 1); | ||
160 | + gen_swstep_exception(s, 0, 0); | ||
161 | + s->base.is_jmp = DISAS_NORETURN; | ||
162 | + return; | ||
27 | } | 163 | } |
164 | |||
165 | - translator_loop_temp_check(&dc->base); | ||
166 | + s->pc_curr = s->base.pc_next; | ||
167 | + insn = arm_ldl_code(env, s->base.pc_next, s->sctlr_b); | ||
168 | + s->insn = insn; | ||
169 | + s->base.pc_next += 4; | ||
170 | + | ||
171 | + s->fp_access_checked = false; | ||
172 | + s->sve_access_checked = false; | ||
173 | + | ||
174 | + if (s->pstate_il) { | ||
175 | + /* | ||
176 | + * Illegal execution state. This has priority over BTI | ||
177 | + * exceptions, but comes after instruction abort exceptions. | ||
178 | + */ | ||
179 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
180 | + syn_illegalstate(), default_exception_el(s)); | ||
181 | + return; | ||
182 | + } | ||
183 | + | ||
184 | + if (dc_isar_feature(aa64_bti, s)) { | ||
185 | + if (s->base.num_insns == 1) { | ||
186 | + /* | ||
187 | + * At the first insn of the TB, compute s->guarded_page. | ||
188 | + * We delayed computing this until successfully reading | ||
189 | + * the first insn of the TB, above. This (mostly) ensures | ||
190 | + * that the softmmu tlb entry has been populated, and the | ||
191 | + * page table GP bit is available. | ||
192 | + * | ||
193 | + * Note that we need to compute this even if btype == 0, | ||
194 | + * because this value is used for BR instructions later | ||
195 | + * where ENV is not available. | ||
196 | + */ | ||
197 | + s->guarded_page = is_guarded_page(env, s); | ||
198 | + | ||
199 | + /* First insn can have btype set to non-zero. */ | ||
200 | + tcg_debug_assert(s->btype >= 0); | ||
201 | + | ||
202 | + /* | ||
203 | + * Note that the Branch Target Exception has fairly high | ||
204 | + * priority -- below debugging exceptions but above most | ||
205 | + * everything else. This allows us to handle this now | ||
206 | + * instead of waiting until the insn is otherwise decoded. | ||
207 | + */ | ||
208 | + if (s->btype != 0 | ||
209 | + && s->guarded_page | ||
210 | + && !btype_destination_ok(insn, s->bt, s->btype)) { | ||
211 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
212 | + syn_btitrap(s->btype), | ||
213 | + default_exception_el(s)); | ||
214 | + return; | ||
215 | + } | ||
216 | + } else { | ||
217 | + /* Not the first insn: btype must be 0. */ | ||
218 | + tcg_debug_assert(s->btype == 0); | ||
219 | + } | ||
220 | + } | ||
221 | + | ||
222 | + switch (extract32(insn, 25, 4)) { | ||
223 | + case 0x0: case 0x1: case 0x3: /* UNALLOCATED */ | ||
224 | + unallocated_encoding(s); | ||
225 | + break; | ||
226 | + case 0x2: | ||
227 | + if (!dc_isar_feature(aa64_sve, s) || !disas_sve(s, insn)) { | ||
228 | + unallocated_encoding(s); | ||
229 | + } | ||
230 | + break; | ||
231 | + case 0x8: case 0x9: /* Data processing - immediate */ | ||
232 | + disas_data_proc_imm(s, insn); | ||
233 | + break; | ||
234 | + case 0xa: case 0xb: /* Branch, exception generation and system insns */ | ||
235 | + disas_b_exc_sys(s, insn); | ||
236 | + break; | ||
237 | + case 0x4: | ||
238 | + case 0x6: | ||
239 | + case 0xc: | ||
240 | + case 0xe: /* Loads and stores */ | ||
241 | + disas_ldst(s, insn); | ||
242 | + break; | ||
243 | + case 0x5: | ||
244 | + case 0xd: /* Data processing - register */ | ||
245 | + disas_data_proc_reg(s, insn); | ||
246 | + break; | ||
247 | + case 0x7: | ||
248 | + case 0xf: /* Data processing - SIMD and floating point */ | ||
249 | + disas_data_proc_simd_fp(s, insn); | ||
250 | + break; | ||
251 | + default: | ||
252 | + assert(FALSE); /* all 15 cases should be handled above */ | ||
253 | + break; | ||
254 | + } | ||
255 | + | ||
256 | + /* if we allocated any temporaries, free them here */ | ||
257 | + free_tmp_a64(s); | ||
258 | + | ||
259 | + /* | ||
260 | + * After execution of most insns, btype is reset to 0. | ||
261 | + * Note that we set btype == -1 when the insn sets btype. | ||
262 | + */ | ||
263 | + if (s->btype > 0 && s->base.is_jmp != DISAS_NORETURN) { | ||
264 | + reset_btype(s); | ||
265 | + } | ||
266 | + | ||
267 | + translator_loop_temp_check(&s->base); | ||
268 | } | ||
269 | |||
270 | static void aarch64_tr_tb_stop(DisasContextBase *dcbase, CPUState *cpu) | ||
28 | -- | 271 | -- |
29 | 2.20.1 | 272 | 2.20.1 |
30 | 273 | ||
31 | 274 | diff view generated by jsdifflib |
1 | The function asimd_imm_const() in translate-neon.c is an | 1 | By default, QEMU will allow devices to be plugged into a bus up to |
---|---|---|---|
2 | implementation of the pseudocode AdvSIMDExpandImm(), which we will | 2 | the bus class's device count limit. If the user creates a device on |
3 | also want for MVE. Move the implementation to translate.c, with a | 3 | the command line or via the monitor and doesn't explicitly specify |
4 | prototype in translate.h. | 4 | the bus to plug it in, QEMU will plug it into the first non-full bus |
5 | that it finds. | ||
6 | |||
7 | This is fine in most cases, but some machines have multiple buses of | ||
8 | a given type, some of which are dedicated to on-board devices and | ||
9 | some of which have an externally exposed connector for user-pluggable | ||
10 | devices. One example is I2C buses. | ||
11 | |||
12 | Provide a new function qbus_mark_full() so that a machine model can | ||
13 | mark this kind of "internal only" bus as 'full' after it has created | ||
14 | all the devices that should be plugged into that bus. The "find a | ||
15 | non-full bus" algorithm will then skip the internal-only bus when | ||
16 | looking for a place to plug in user-created devices. | ||
5 | 17 | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 18 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 19 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20210628135835.6690-4-peter.maydell@linaro.org | 20 | Message-id: 20210903151435.22379-2-peter.maydell@linaro.org |
9 | --- | 21 | --- |
10 | target/arm/translate.h | 16 ++++++++++ | 22 | include/hw/qdev-core.h | 24 ++++++++++++++++++++++++ |
11 | target/arm/translate-neon.c | 63 ------------------------------------- | 23 | softmmu/qdev-monitor.c | 7 ++++++- |
12 | target/arm/translate.c | 57 +++++++++++++++++++++++++++++++++ | 24 | 2 files changed, 30 insertions(+), 1 deletion(-) |
13 | 3 files changed, 73 insertions(+), 63 deletions(-) | ||
14 | 25 | ||
15 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 26 | diff --git a/include/hw/qdev-core.h b/include/hw/qdev-core.h |
16 | index XXXXXXX..XXXXXXX 100644 | 27 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate.h | 28 | --- a/include/hw/qdev-core.h |
18 | +++ b/target/arm/translate.h | 29 | +++ b/include/hw/qdev-core.h |
19 | @@ -XXX,XX +XXX,XX @@ static inline MemOp finalize_memop(DisasContext *s, MemOp opc) | 30 | @@ -XXX,XX +XXX,XX @@ struct BusState { |
20 | return opc | s->be_data; | 31 | HotplugHandler *hotplug_handler; |
32 | int max_index; | ||
33 | bool realized; | ||
34 | + bool full; | ||
35 | int num_children; | ||
36 | |||
37 | /* | ||
38 | @@ -XXX,XX +XXX,XX @@ static inline bool qbus_is_hotpluggable(BusState *bus) | ||
39 | return bus->hotplug_handler; | ||
21 | } | 40 | } |
22 | 41 | ||
23 | +/** | 42 | +/** |
24 | + * asimd_imm_const: Expand an encoded SIMD constant value | 43 | + * qbus_mark_full: Mark this bus as full, so no more devices can be attached |
44 | + * @bus: Bus to mark as full | ||
25 | + * | 45 | + * |
26 | + * Expand a SIMD constant value. This is essentially the pseudocode | 46 | + * By default, QEMU will allow devices to be plugged into a bus up |
27 | + * AdvSIMDExpandImm, except that we also perform the boolean NOT needed for | 47 | + * to the bus class's device count limit. Calling this function |
28 | + * VMVN and VBIC (when cmode < 14 && op == 1). | 48 | + * marks a particular bus as full, so that no more devices can be |
29 | + * | 49 | + * plugged into it. In particular this means that the bus will not |
30 | + * The combination cmode == 15 op == 1 is a reserved encoding for AArch32; | 50 | + * be considered as a candidate for plugging in devices created by |
31 | + * callers must catch this. | 51 | + * the user on the commandline or via the monitor. |
32 | + * | 52 | + * If a machine has multiple buses of a given type, such as I2C, |
33 | + * cmode = 2,3,4,5,6,7,10,11,12,13 imm=0 was UNPREDICTABLE in v7A but | 53 | + * where some of those buses in the real hardware are used only for |
34 | + * is either not unpredictable or merely CONSTRAINED UNPREDICTABLE in v8A; | 54 | + * internal devices and some are exposed via expansion ports, you |
35 | + * we produce an immediate constant value of 0 in these cases. | 55 | + * can use this function to mark the internal-only buses as full |
56 | + * after you have created all their internal devices. Then user | ||
57 | + * created devices will appear on the expansion-port bus where | ||
58 | + * guest software expects them. | ||
36 | + */ | 59 | + */ |
37 | +uint64_t asimd_imm_const(uint32_t imm, int cmode, int op); | 60 | +static inline void qbus_mark_full(BusState *bus) |
38 | + | ||
39 | #endif /* TARGET_ARM_TRANSLATE_H */ | ||
40 | diff --git a/target/arm/translate-neon.c b/target/arm/translate-neon.c | ||
41 | index XXXXXXX..XXXXXXX 100644 | ||
42 | --- a/target/arm/translate-neon.c | ||
43 | +++ b/target/arm/translate-neon.c | ||
44 | @@ -XXX,XX +XXX,XX @@ DO_FP_2SH(VCVT_UH, gen_helper_gvec_vcvt_uh) | ||
45 | DO_FP_2SH(VCVT_HS, gen_helper_gvec_vcvt_hs) | ||
46 | DO_FP_2SH(VCVT_HU, gen_helper_gvec_vcvt_hu) | ||
47 | |||
48 | -static uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) | ||
49 | -{ | ||
50 | - /* | ||
51 | - * Expand the encoded constant. | ||
52 | - * Note that cmode = 2,3,4,5,6,7,10,11,12,13 imm=0 is UNPREDICTABLE. | ||
53 | - * We choose to not special-case this and will behave as if a | ||
54 | - * valid constant encoding of 0 had been given. | ||
55 | - * cmode = 15 op = 1 must UNDEF; we assume decode has handled that. | ||
56 | - */ | ||
57 | - switch (cmode) { | ||
58 | - case 0: case 1: | ||
59 | - /* no-op */ | ||
60 | - break; | ||
61 | - case 2: case 3: | ||
62 | - imm <<= 8; | ||
63 | - break; | ||
64 | - case 4: case 5: | ||
65 | - imm <<= 16; | ||
66 | - break; | ||
67 | - case 6: case 7: | ||
68 | - imm <<= 24; | ||
69 | - break; | ||
70 | - case 8: case 9: | ||
71 | - imm |= imm << 16; | ||
72 | - break; | ||
73 | - case 10: case 11: | ||
74 | - imm = (imm << 8) | (imm << 24); | ||
75 | - break; | ||
76 | - case 12: | ||
77 | - imm = (imm << 8) | 0xff; | ||
78 | - break; | ||
79 | - case 13: | ||
80 | - imm = (imm << 16) | 0xffff; | ||
81 | - break; | ||
82 | - case 14: | ||
83 | - if (op) { | ||
84 | - /* | ||
85 | - * This is the only case where the top and bottom 32 bits | ||
86 | - * of the encoded constant differ. | ||
87 | - */ | ||
88 | - uint64_t imm64 = 0; | ||
89 | - int n; | ||
90 | - | ||
91 | - for (n = 0; n < 8; n++) { | ||
92 | - if (imm & (1 << n)) { | ||
93 | - imm64 |= (0xffULL << (n * 8)); | ||
94 | - } | ||
95 | - } | ||
96 | - return imm64; | ||
97 | - } | ||
98 | - imm |= (imm << 8) | (imm << 16) | (imm << 24); | ||
99 | - break; | ||
100 | - case 15: | ||
101 | - imm = ((imm & 0x80) << 24) | ((imm & 0x3f) << 19) | ||
102 | - | ((imm & 0x40) ? (0x1f << 25) : (1 << 30)); | ||
103 | - break; | ||
104 | - } | ||
105 | - if (op) { | ||
106 | - imm = ~imm; | ||
107 | - } | ||
108 | - return dup_const(MO_32, imm); | ||
109 | -} | ||
110 | - | ||
111 | static bool do_1reg_imm(DisasContext *s, arg_1reg_imm *a, | ||
112 | GVecGen2iFn *fn) | ||
113 | { | ||
114 | diff --git a/target/arm/translate.c b/target/arm/translate.c | ||
115 | index XXXXXXX..XXXXXXX 100644 | ||
116 | --- a/target/arm/translate.c | ||
117 | +++ b/target/arm/translate.c | ||
118 | @@ -XXX,XX +XXX,XX @@ void arm_translate_init(void) | ||
119 | a64_translate_init(); | ||
120 | } | ||
121 | |||
122 | +uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) | ||
123 | +{ | 61 | +{ |
124 | + /* Expand the encoded constant as per AdvSIMDExpandImm pseudocode */ | 62 | + bus->full = true; |
125 | + switch (cmode) { | ||
126 | + case 0: case 1: | ||
127 | + /* no-op */ | ||
128 | + break; | ||
129 | + case 2: case 3: | ||
130 | + imm <<= 8; | ||
131 | + break; | ||
132 | + case 4: case 5: | ||
133 | + imm <<= 16; | ||
134 | + break; | ||
135 | + case 6: case 7: | ||
136 | + imm <<= 24; | ||
137 | + break; | ||
138 | + case 8: case 9: | ||
139 | + imm |= imm << 16; | ||
140 | + break; | ||
141 | + case 10: case 11: | ||
142 | + imm = (imm << 8) | (imm << 24); | ||
143 | + break; | ||
144 | + case 12: | ||
145 | + imm = (imm << 8) | 0xff; | ||
146 | + break; | ||
147 | + case 13: | ||
148 | + imm = (imm << 16) | 0xffff; | ||
149 | + break; | ||
150 | + case 14: | ||
151 | + if (op) { | ||
152 | + /* | ||
153 | + * This is the only case where the top and bottom 32 bits | ||
154 | + * of the encoded constant differ. | ||
155 | + */ | ||
156 | + uint64_t imm64 = 0; | ||
157 | + int n; | ||
158 | + | ||
159 | + for (n = 0; n < 8; n++) { | ||
160 | + if (imm & (1 << n)) { | ||
161 | + imm64 |= (0xffULL << (n * 8)); | ||
162 | + } | ||
163 | + } | ||
164 | + return imm64; | ||
165 | + } | ||
166 | + imm |= (imm << 8) | (imm << 16) | (imm << 24); | ||
167 | + break; | ||
168 | + case 15: | ||
169 | + imm = ((imm & 0x80) << 24) | ((imm & 0x3f) << 19) | ||
170 | + | ((imm & 0x40) ? (0x1f << 25) : (1 << 30)); | ||
171 | + break; | ||
172 | + } | ||
173 | + if (op) { | ||
174 | + imm = ~imm; | ||
175 | + } | ||
176 | + return dup_const(MO_32, imm); | ||
177 | +} | 63 | +} |
178 | + | 64 | + |
179 | /* Generate a label used for skipping this instruction */ | 65 | void device_listener_register(DeviceListener *listener); |
180 | void arm_gen_condlabel(DisasContext *s) | 66 | void device_listener_unregister(DeviceListener *listener); |
67 | |||
68 | diff --git a/softmmu/qdev-monitor.c b/softmmu/qdev-monitor.c | ||
69 | index XXXXXXX..XXXXXXX 100644 | ||
70 | --- a/softmmu/qdev-monitor.c | ||
71 | +++ b/softmmu/qdev-monitor.c | ||
72 | @@ -XXX,XX +XXX,XX @@ static DeviceState *qbus_find_dev(BusState *bus, char *elem) | ||
73 | |||
74 | static inline bool qbus_is_full(BusState *bus) | ||
181 | { | 75 | { |
76 | - BusClass *bus_class = BUS_GET_CLASS(bus); | ||
77 | + BusClass *bus_class; | ||
78 | + | ||
79 | + if (bus->full) { | ||
80 | + return true; | ||
81 | + } | ||
82 | + bus_class = BUS_GET_CLASS(bus); | ||
83 | return bus_class->max_dev && bus->num_children >= bus_class->max_dev; | ||
84 | } | ||
85 | |||
182 | -- | 86 | -- |
183 | 2.20.1 | 87 | 2.20.1 |
184 | 88 | ||
185 | 89 | diff view generated by jsdifflib |
1 | In do_ldst(), the calculation of the offset needs to be based on the | 1 | The mps2-tz boards use a data-driven structure to create the devices |
---|---|---|---|
2 | size of the memory access, not the size of the elements in the | 2 | that sit behind peripheral protection controllers. Currently the |
3 | vector. This meant we were getting it wrong for the widening and | 3 | functions which create these devices are passed an 'opaque' pointer |
4 | narrowing variants of the various VLDR and VSTR insns. | 4 | which is always the address within the machine struct of the device |
5 | to create, and some "all devices need this" information like irqs and | ||
6 | addresses. | ||
7 | |||
8 | If a specific device needs more information than this, it is | ||
9 | currently not possible to pass that through from the PPCInfo | ||
10 | data structure. Add support for passing an extra data parameter, | ||
11 | so that we can more flexibly handle the needs of specific | ||
12 | device types. To provide some type-safety we make this extra | ||
13 | parameter a pointer to a union (which initially has no members). | ||
14 | |||
15 | In particular, we would like to be able to indicate which of the | ||
16 | i2c controllers are for on-board devices only and which are | ||
17 | connected to the external 'shield' expansion port; a subsequent | ||
18 | patch will use this mechanism for that purpose. | ||
5 | 19 | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 20 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 21 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20210628135835.6690-2-peter.maydell@linaro.org | 22 | Message-id: 20210903151435.22379-3-peter.maydell@linaro.org |
9 | --- | 23 | --- |
10 | target/arm/translate-mve.c | 17 +++++++++-------- | 24 | hw/arm/mps2-tz.c | 35 ++++++++++++++++++++++------------- |
11 | 1 file changed, 9 insertions(+), 8 deletions(-) | 25 | 1 file changed, 22 insertions(+), 13 deletions(-) |
12 | 26 | ||
13 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | 27 | diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c |
14 | index XXXXXXX..XXXXXXX 100644 | 28 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/translate-mve.c | 29 | --- a/hw/arm/mps2-tz.c |
16 | +++ b/target/arm/translate-mve.c | 30 | +++ b/hw/arm/mps2-tz.c |
17 | @@ -XXX,XX +XXX,XX @@ static bool mve_skip_first_beat(DisasContext *s) | 31 | @@ -XXX,XX +XXX,XX @@ static qemu_irq get_sse_irq_in(MPS2TZMachineState *mms, int irqno) |
18 | } | 32 | } |
19 | } | 33 | } |
20 | 34 | ||
21 | -static bool do_ldst(DisasContext *s, arg_VLDR_VSTR *a, MVEGenLdStFn *fn) | 35 | +/* Union describing the device-specific extra data we pass to the devfn. */ |
22 | +static bool do_ldst(DisasContext *s, arg_VLDR_VSTR *a, MVEGenLdStFn *fn, | 36 | +typedef union PPCExtraData { |
23 | + unsigned msize) | 37 | +} PPCExtraData; |
38 | + | ||
39 | /* Most of the devices in the AN505 FPGA image sit behind | ||
40 | * Peripheral Protection Controllers. These data structures | ||
41 | * define the layout of which devices sit behind which PPCs. | ||
42 | @@ -XXX,XX +XXX,XX @@ static qemu_irq get_sse_irq_in(MPS2TZMachineState *mms, int irqno) | ||
43 | */ | ||
44 | typedef MemoryRegion *MakeDevFn(MPS2TZMachineState *mms, void *opaque, | ||
45 | const char *name, hwaddr size, | ||
46 | - const int *irqs); | ||
47 | + const int *irqs, | ||
48 | + const PPCExtraData *extradata); | ||
49 | |||
50 | typedef struct PPCPortInfo { | ||
51 | const char *name; | ||
52 | @@ -XXX,XX +XXX,XX @@ typedef struct PPCPortInfo { | ||
53 | hwaddr addr; | ||
54 | hwaddr size; | ||
55 | int irqs[3]; /* currently no device needs more IRQ lines than this */ | ||
56 | + PPCExtraData extradata; /* to pass device-specific info to the devfn */ | ||
57 | } PPCPortInfo; | ||
58 | |||
59 | typedef struct PPCInfo { | ||
60 | @@ -XXX,XX +XXX,XX @@ typedef struct PPCInfo { | ||
61 | static MemoryRegion *make_unimp_dev(MPS2TZMachineState *mms, | ||
62 | void *opaque, | ||
63 | const char *name, hwaddr size, | ||
64 | - const int *irqs) | ||
65 | + const int *irqs, | ||
66 | + const PPCExtraData *extradata) | ||
24 | { | 67 | { |
25 | TCGv_i32 addr; | 68 | /* Initialize, configure and realize a TYPE_UNIMPLEMENTED_DEVICE, |
26 | uint32_t offset; | 69 | * and return a pointer to its MemoryRegion. |
27 | @@ -XXX,XX +XXX,XX @@ static bool do_ldst(DisasContext *s, arg_VLDR_VSTR *a, MVEGenLdStFn *fn) | 70 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_unimp_dev(MPS2TZMachineState *mms, |
28 | return true; | 71 | |
29 | } | 72 | static MemoryRegion *make_uart(MPS2TZMachineState *mms, void *opaque, |
30 | 73 | const char *name, hwaddr size, | |
31 | - offset = a->imm << a->size; | 74 | - const int *irqs) |
32 | + offset = a->imm << msize; | 75 | + const int *irqs, const PPCExtraData *extradata) |
33 | if (!a->a) { | ||
34 | offset = -offset; | ||
35 | } | ||
36 | @@ -XXX,XX +XXX,XX @@ static bool trans_VLDR_VSTR(DisasContext *s, arg_VLDR_VSTR *a) | ||
37 | { gen_helper_mve_vstrw, gen_helper_mve_vldrw }, | ||
38 | { NULL, NULL } | ||
39 | }; | ||
40 | - return do_ldst(s, a, ldstfns[a->size][a->l]); | ||
41 | + return do_ldst(s, a, ldstfns[a->size][a->l], a->size); | ||
42 | } | ||
43 | |||
44 | -#define DO_VLDST_WIDE_NARROW(OP, SLD, ULD, ST) \ | ||
45 | +#define DO_VLDST_WIDE_NARROW(OP, SLD, ULD, ST, MSIZE) \ | ||
46 | static bool trans_##OP(DisasContext *s, arg_VLDR_VSTR *a) \ | ||
47 | { \ | ||
48 | static MVEGenLdStFn * const ldstfns[2][2] = { \ | ||
49 | { gen_helper_mve_##ST, gen_helper_mve_##SLD }, \ | ||
50 | { NULL, gen_helper_mve_##ULD }, \ | ||
51 | }; \ | ||
52 | - return do_ldst(s, a, ldstfns[a->u][a->l]); \ | ||
53 | + return do_ldst(s, a, ldstfns[a->u][a->l], MSIZE); \ | ||
54 | } | ||
55 | |||
56 | -DO_VLDST_WIDE_NARROW(VLDSTB_H, vldrb_sh, vldrb_uh, vstrb_h) | ||
57 | -DO_VLDST_WIDE_NARROW(VLDSTB_W, vldrb_sw, vldrb_uw, vstrb_w) | ||
58 | -DO_VLDST_WIDE_NARROW(VLDSTH_W, vldrh_sw, vldrh_uw, vstrh_w) | ||
59 | +DO_VLDST_WIDE_NARROW(VLDSTB_H, vldrb_sh, vldrb_uh, vstrb_h, MO_8) | ||
60 | +DO_VLDST_WIDE_NARROW(VLDSTB_W, vldrb_sw, vldrb_uw, vstrb_w, MO_8) | ||
61 | +DO_VLDST_WIDE_NARROW(VLDSTH_W, vldrh_sw, vldrh_uw, vstrh_w, MO_16) | ||
62 | |||
63 | static bool trans_VDUP(DisasContext *s, arg_VDUP *a) | ||
64 | { | 76 | { |
77 | /* The irq[] array is tx, rx, combined, in that order */ | ||
78 | MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_GET_CLASS(mms); | ||
79 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_uart(MPS2TZMachineState *mms, void *opaque, | ||
80 | |||
81 | static MemoryRegion *make_scc(MPS2TZMachineState *mms, void *opaque, | ||
82 | const char *name, hwaddr size, | ||
83 | - const int *irqs) | ||
84 | + const int *irqs, const PPCExtraData *extradata) | ||
85 | { | ||
86 | MPS2SCC *scc = opaque; | ||
87 | DeviceState *sccdev; | ||
88 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_scc(MPS2TZMachineState *mms, void *opaque, | ||
89 | |||
90 | static MemoryRegion *make_fpgaio(MPS2TZMachineState *mms, void *opaque, | ||
91 | const char *name, hwaddr size, | ||
92 | - const int *irqs) | ||
93 | + const int *irqs, const PPCExtraData *extradata) | ||
94 | { | ||
95 | MPS2FPGAIO *fpgaio = opaque; | ||
96 | MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_GET_CLASS(mms); | ||
97 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_fpgaio(MPS2TZMachineState *mms, void *opaque, | ||
98 | |||
99 | static MemoryRegion *make_eth_dev(MPS2TZMachineState *mms, void *opaque, | ||
100 | const char *name, hwaddr size, | ||
101 | - const int *irqs) | ||
102 | + const int *irqs, | ||
103 | + const PPCExtraData *extradata) | ||
104 | { | ||
105 | SysBusDevice *s; | ||
106 | NICInfo *nd = &nd_table[0]; | ||
107 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_eth_dev(MPS2TZMachineState *mms, void *opaque, | ||
108 | |||
109 | static MemoryRegion *make_eth_usb(MPS2TZMachineState *mms, void *opaque, | ||
110 | const char *name, hwaddr size, | ||
111 | - const int *irqs) | ||
112 | + const int *irqs, | ||
113 | + const PPCExtraData *extradata) | ||
114 | { | ||
115 | /* | ||
116 | * The AN524 makes the ethernet and USB share a PPC port. | ||
117 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_eth_usb(MPS2TZMachineState *mms, void *opaque, | ||
118 | |||
119 | static MemoryRegion *make_mpc(MPS2TZMachineState *mms, void *opaque, | ||
120 | const char *name, hwaddr size, | ||
121 | - const int *irqs) | ||
122 | + const int *irqs, const PPCExtraData *extradata) | ||
123 | { | ||
124 | TZMPC *mpc = opaque; | ||
125 | int i = mpc - &mms->mpc[0]; | ||
126 | @@ -XXX,XX +XXX,XX @@ static void remap_irq_fn(void *opaque, int n, int level) | ||
127 | |||
128 | static MemoryRegion *make_dma(MPS2TZMachineState *mms, void *opaque, | ||
129 | const char *name, hwaddr size, | ||
130 | - const int *irqs) | ||
131 | + const int *irqs, const PPCExtraData *extradata) | ||
132 | { | ||
133 | /* The irq[] array is DMACINTR, DMACINTERR, DMACINTTC, in that order */ | ||
134 | PL080State *dma = opaque; | ||
135 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_dma(MPS2TZMachineState *mms, void *opaque, | ||
136 | |||
137 | static MemoryRegion *make_spi(MPS2TZMachineState *mms, void *opaque, | ||
138 | const char *name, hwaddr size, | ||
139 | - const int *irqs) | ||
140 | + const int *irqs, const PPCExtraData *extradata) | ||
141 | { | ||
142 | /* | ||
143 | * The AN505 has five PL022 SPI controllers. | ||
144 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_spi(MPS2TZMachineState *mms, void *opaque, | ||
145 | |||
146 | static MemoryRegion *make_i2c(MPS2TZMachineState *mms, void *opaque, | ||
147 | const char *name, hwaddr size, | ||
148 | - const int *irqs) | ||
149 | + const int *irqs, const PPCExtraData *extradata) | ||
150 | { | ||
151 | ArmSbconI2CState *i2c = opaque; | ||
152 | SysBusDevice *s; | ||
153 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_i2c(MPS2TZMachineState *mms, void *opaque, | ||
154 | |||
155 | static MemoryRegion *make_rtc(MPS2TZMachineState *mms, void *opaque, | ||
156 | const char *name, hwaddr size, | ||
157 | - const int *irqs) | ||
158 | + const int *irqs, const PPCExtraData *extradata) | ||
159 | { | ||
160 | PL031State *pl031 = opaque; | ||
161 | SysBusDevice *s; | ||
162 | @@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine) | ||
163 | } | ||
164 | |||
165 | mr = pinfo->devfn(mms, pinfo->opaque, pinfo->name, pinfo->size, | ||
166 | - pinfo->irqs); | ||
167 | + pinfo->irqs, &pinfo->extradata); | ||
168 | portname = g_strdup_printf("port[%d]", port); | ||
169 | object_property_set_link(OBJECT(ppc), portname, OBJECT(mr), | ||
170 | &error_fatal); | ||
65 | -- | 171 | -- |
66 | 2.20.1 | 172 | 2.20.1 |
67 | 173 | ||
68 | 174 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | The initial implementation of the MVE VRMLALDAVH and VRMLSLDAVH | ||
2 | insns had some bugs: | ||
3 | * the 32x32 multiply of elements was being done as 32x32->32, | ||
4 | not 32x32->64 | ||
5 | * we were incorrectly maintaining the accumulator in its full | ||
6 | 72-bit form across all 4 beats of the insn; in the pseudocode | ||
7 | it is squashed back into the 64 bits of the RdaHi:RdaLo | ||
8 | registers after each beat | ||
9 | 1 | ||
10 | In particular, fixing the second of these allows us to recast | ||
11 | the implementation to avoid 128-bit arithmetic entirely. | ||
12 | |||
13 | Since the element size here is always 4, we can also drop the | ||
14 | parameterization of ESIZE to make the code a little more readable. | ||
15 | |||
16 | Suggested-by: Richard Henderson <richard.henderson@linaro.org> | ||
17 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
18 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
19 | Message-id: 20210628135835.6690-3-peter.maydell@linaro.org | ||
20 | --- | ||
21 | target/arm/mve_helper.c | 38 +++++++++++++++++++++----------------- | ||
22 | 1 file changed, 21 insertions(+), 17 deletions(-) | ||
23 | |||
24 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/target/arm/mve_helper.c | ||
27 | +++ b/target/arm/mve_helper.c | ||
28 | @@ -XXX,XX +XXX,XX @@ | ||
29 | */ | ||
30 | |||
31 | #include "qemu/osdep.h" | ||
32 | -#include "qemu/int128.h" | ||
33 | #include "cpu.h" | ||
34 | #include "internals.h" | ||
35 | #include "vec_internal.h" | ||
36 | @@ -XXX,XX +XXX,XX @@ DO_LDAV(vmlsldavsw, 4, int32_t, false, +=, -=) | ||
37 | DO_LDAV(vmlsldavxsw, 4, int32_t, true, +=, -=) | ||
38 | |||
39 | /* | ||
40 | - * Rounding multiply add long dual accumulate high: we must keep | ||
41 | - * a 72-bit internal accumulator value and return the top 64 bits. | ||
42 | + * Rounding multiply add long dual accumulate high. In the pseudocode | ||
43 | + * this is implemented with a 72-bit internal accumulator value of which | ||
44 | + * the top 64 bits are returned. We optimize this to avoid having to | ||
45 | + * use 128-bit arithmetic -- we can do this because the 74-bit accumulator | ||
46 | + * is squashed back into 64-bits after each beat. | ||
47 | */ | ||
48 | -#define DO_LDAVH(OP, ESIZE, TYPE, XCHG, EVENACC, ODDACC, TO128) \ | ||
49 | +#define DO_LDAVH(OP, TYPE, LTYPE, XCHG, SUB) \ | ||
50 | uint64_t HELPER(glue(mve_, OP))(CPUARMState *env, void *vn, \ | ||
51 | void *vm, uint64_t a) \ | ||
52 | { \ | ||
53 | uint16_t mask = mve_element_mask(env); \ | ||
54 | unsigned e; \ | ||
55 | TYPE *n = vn, *m = vm; \ | ||
56 | - Int128 acc = int128_lshift(TO128(a), 8); \ | ||
57 | - for (e = 0; e < 16 / ESIZE; e++, mask >>= ESIZE) { \ | ||
58 | + for (e = 0; e < 16 / 4; e++, mask >>= 4) { \ | ||
59 | if (mask & 1) { \ | ||
60 | + LTYPE mul; \ | ||
61 | if (e & 1) { \ | ||
62 | - acc = ODDACC(acc, TO128(n[H##ESIZE(e - 1 * XCHG)] * \ | ||
63 | - m[H##ESIZE(e)])); \ | ||
64 | + mul = (LTYPE)n[H4(e - 1 * XCHG)] * m[H4(e)]; \ | ||
65 | + if (SUB) { \ | ||
66 | + mul = -mul; \ | ||
67 | + } \ | ||
68 | } else { \ | ||
69 | - acc = EVENACC(acc, TO128(n[H##ESIZE(e + 1 * XCHG)] * \ | ||
70 | - m[H##ESIZE(e)])); \ | ||
71 | + mul = (LTYPE)n[H4(e + 1 * XCHG)] * m[H4(e)]; \ | ||
72 | } \ | ||
73 | - acc = int128_add(acc, int128_make64(1 << 7)); \ | ||
74 | + mul = (mul >> 8) + ((mul >> 7) & 1); \ | ||
75 | + a += mul; \ | ||
76 | } \ | ||
77 | } \ | ||
78 | mve_advance_vpt(env); \ | ||
79 | - return int128_getlo(int128_rshift(acc, 8)); \ | ||
80 | + return a; \ | ||
81 | } | ||
82 | |||
83 | -DO_LDAVH(vrmlaldavhsw, 4, int32_t, false, int128_add, int128_add, int128_makes64) | ||
84 | -DO_LDAVH(vrmlaldavhxsw, 4, int32_t, true, int128_add, int128_add, int128_makes64) | ||
85 | +DO_LDAVH(vrmlaldavhsw, int32_t, int64_t, false, false) | ||
86 | +DO_LDAVH(vrmlaldavhxsw, int32_t, int64_t, true, false) | ||
87 | |||
88 | -DO_LDAVH(vrmlaldavhuw, 4, uint32_t, false, int128_add, int128_add, int128_make64) | ||
89 | +DO_LDAVH(vrmlaldavhuw, uint32_t, uint64_t, false, false) | ||
90 | |||
91 | -DO_LDAVH(vrmlsldavhsw, 4, int32_t, false, int128_add, int128_sub, int128_makes64) | ||
92 | -DO_LDAVH(vrmlsldavhxsw, 4, int32_t, true, int128_add, int128_sub, int128_makes64) | ||
93 | +DO_LDAVH(vrmlsldavhsw, int32_t, int64_t, false, true) | ||
94 | +DO_LDAVH(vrmlsldavhxsw, int32_t, int64_t, true, true) | ||
95 | |||
96 | /* Vector add across vector */ | ||
97 | #define DO_VADDV(OP, ESIZE, TYPE) \ | ||
98 | -- | ||
99 | 2.20.1 | ||
100 | |||
101 | diff view generated by jsdifflib |
1 | Implement the MVE VSHLC insn, which performs a shift left of the | 1 | The various MPS2 boards have multiple I2C buses: typically a bus |
---|---|---|---|
2 | entire vector with carry in bits provided from a general purpose | 2 | dedicated to the audio configuration, one for the LCD touchscreen |
3 | register and carry out bits written back to that register. | 3 | controller, one for a DDR4 EEPROM, and two which are connected to the |
4 | external Shield expansion connector. Mark the buses which are used | ||
5 | only for board-internal devices as 'full' so that if the user creates | ||
6 | i2c devices on the commandline without specifying a bus name then | ||
7 | they will be connected to the I2C controller used for the Shield | ||
8 | connector, where guest software will expect them. | ||
4 | 9 | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
7 | Message-id: 20210628135835.6690-14-peter.maydell@linaro.org | 12 | Message-id: 20210903151435.22379-4-peter.maydell@linaro.org |
8 | --- | 13 | --- |
9 | target/arm/helper-mve.h | 2 ++ | 14 | hw/arm/mps2-tz.c | 57 ++++++++++++++++++++++++++++++++++++------------ |
10 | target/arm/mve.decode | 2 ++ | 15 | 1 file changed, 43 insertions(+), 14 deletions(-) |
11 | target/arm/mve_helper.c | 38 ++++++++++++++++++++++++++++++++++++++ | ||
12 | target/arm/translate-mve.c | 30 ++++++++++++++++++++++++++++++ | ||
13 | 4 files changed, 72 insertions(+) | ||
14 | 16 | ||
15 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 17 | diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c |
16 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-mve.h | 19 | --- a/hw/arm/mps2-tz.c |
18 | +++ b/target/arm/helper-mve.h | 20 | +++ b/hw/arm/mps2-tz.c |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(mve_vqrshrunbb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 21 | @@ -XXX,XX +XXX,XX @@ static qemu_irq get_sse_irq_in(MPS2TZMachineState *mms, int irqno) |
20 | DEF_HELPER_FLAGS_4(mve_vqrshrunbh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 22 | |
21 | DEF_HELPER_FLAGS_4(mve_vqrshruntb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 23 | /* Union describing the device-specific extra data we pass to the devfn. */ |
22 | DEF_HELPER_FLAGS_4(mve_vqrshrunth, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 24 | typedef union PPCExtraData { |
23 | + | 25 | + bool i2c_internal; |
24 | +DEF_HELPER_FLAGS_4(mve_vshlc, TCG_CALL_NO_WG, i32, env, ptr, i32, i32) | 26 | } PPCExtraData; |
25 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | 27 | |
26 | index XXXXXXX..XXXXXXX 100644 | 28 | /* Most of the devices in the AN505 FPGA image sit behind |
27 | --- a/target/arm/mve.decode | 29 | @@ -XXX,XX +XXX,XX @@ static MemoryRegion *make_i2c(MPS2TZMachineState *mms, void *opaque, |
28 | +++ b/target/arm/mve.decode | 30 | object_initialize_child(OBJECT(mms), name, i2c, TYPE_ARM_SBCON_I2C); |
29 | @@ -XXX,XX +XXX,XX @@ VQRSHRUNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_b | 31 | s = SYS_BUS_DEVICE(i2c); |
30 | VQRSHRUNB 111 1 1110 1 . ... ... ... 0 1111 1 1 . 0 ... 0 @2_shr_h | 32 | sysbus_realize(s, &error_fatal); |
31 | VQRSHRUNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_b | ||
32 | VQRSHRUNT 111 1 1110 1 . ... ... ... 1 1111 1 1 . 0 ... 0 @2_shr_h | ||
33 | + | ||
34 | +VSHLC 111 0 1110 1 . 1 imm:5 ... 0 1111 1100 rdm:4 qd=%qd | ||
35 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
36 | index XXXXXXX..XXXXXXX 100644 | ||
37 | --- a/target/arm/mve_helper.c | ||
38 | +++ b/target/arm/mve_helper.c | ||
39 | @@ -XXX,XX +XXX,XX @@ DO_VSHRN_SAT_UB(vqrshrnb_ub, vqrshrnt_ub, DO_RSHRN_UB) | ||
40 | DO_VSHRN_SAT_UH(vqrshrnb_uh, vqrshrnt_uh, DO_RSHRN_UH) | ||
41 | DO_VSHRN_SAT_SB(vqrshrunbb, vqrshruntb, DO_RSHRUN_B) | ||
42 | DO_VSHRN_SAT_SH(vqrshrunbh, vqrshrunth, DO_RSHRUN_H) | ||
43 | + | ||
44 | +uint32_t HELPER(mve_vshlc)(CPUARMState *env, void *vd, uint32_t rdm, | ||
45 | + uint32_t shift) | ||
46 | +{ | ||
47 | + uint32_t *d = vd; | ||
48 | + uint16_t mask = mve_element_mask(env); | ||
49 | + unsigned e; | ||
50 | + uint32_t r; | ||
51 | + | 33 | + |
52 | + /* | 34 | + /* |
53 | + * For each 32-bit element, we shift it left, bringing in the | 35 | + * If this is an internal-use-only i2c bus, mark it full |
54 | + * low 'shift' bits of rdm at the bottom. Bits shifted out at | 36 | + * so that user-created i2c devices are not plugged into it. |
55 | + * the top become the new rdm, if the predicate mask permits. | 37 | + * If we implement models of any on-board i2c devices that |
56 | + * The final rdm value is returned to update the register. | 38 | + * plug in to one of the internal-use-only buses, then we will |
57 | + * shift == 0 here means "shift by 32 bits". | 39 | + * need to create and plugging those in here before we mark the |
40 | + * bus as full. | ||
58 | + */ | 41 | + */ |
59 | + if (shift == 0) { | 42 | + if (extradata->i2c_internal) { |
60 | + for (e = 0; e < 16 / 4; e++, mask >>= 4) { | 43 | + BusState *qbus = qdev_get_child_bus(DEVICE(i2c), "i2c"); |
61 | + r = rdm; | 44 | + qbus_mark_full(qbus); |
62 | + if (mask & 1) { | ||
63 | + rdm = d[H4(e)]; | ||
64 | + } | ||
65 | + mergemask(&d[H4(e)], r, mask); | ||
66 | + } | ||
67 | + } else { | ||
68 | + uint32_t shiftmask = MAKE_64BIT_MASK(0, shift); | ||
69 | + | ||
70 | + for (e = 0; e < 16 / 4; e++, mask >>= 4) { | ||
71 | + r = (d[H4(e)] << shift) | (rdm & shiftmask); | ||
72 | + if (mask & 1) { | ||
73 | + rdm = d[H4(e)] >> (32 - shift); | ||
74 | + } | ||
75 | + mergemask(&d[H4(e)], r, mask); | ||
76 | + } | ||
77 | + } | ||
78 | + mve_advance_vpt(env); | ||
79 | + return rdm; | ||
80 | +} | ||
81 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
82 | index XXXXXXX..XXXXXXX 100644 | ||
83 | --- a/target/arm/translate-mve.c | ||
84 | +++ b/target/arm/translate-mve.c | ||
85 | @@ -XXX,XX +XXX,XX @@ DO_2SHIFT_N(VQRSHRNB_U, vqrshrnb_u) | ||
86 | DO_2SHIFT_N(VQRSHRNT_U, vqrshrnt_u) | ||
87 | DO_2SHIFT_N(VQRSHRUNB, vqrshrunb) | ||
88 | DO_2SHIFT_N(VQRSHRUNT, vqrshrunt) | ||
89 | + | ||
90 | +static bool trans_VSHLC(DisasContext *s, arg_VSHLC *a) | ||
91 | +{ | ||
92 | + /* | ||
93 | + * Whole Vector Left Shift with Carry. The carry is taken | ||
94 | + * from a general purpose register and written back there. | ||
95 | + * An imm of 0 means "shift by 32". | ||
96 | + */ | ||
97 | + TCGv_ptr qd; | ||
98 | + TCGv_i32 rdm; | ||
99 | + | ||
100 | + if (!dc_isar_feature(aa32_mve, s) || !mve_check_qreg_bank(s, a->qd)) { | ||
101 | + return false; | ||
102 | + } | ||
103 | + if (a->rdm == 13 || a->rdm == 15) { | ||
104 | + /* CONSTRAINED UNPREDICTABLE: we UNDEF */ | ||
105 | + return false; | ||
106 | + } | ||
107 | + if (!mve_eci_check(s) || !vfp_access_check(s)) { | ||
108 | + return true; | ||
109 | + } | 45 | + } |
110 | + | 46 | + |
111 | + qd = mve_qreg_ptr(a->qd); | 47 | return sysbus_mmio_get_region(s, 0); |
112 | + rdm = load_reg(s, a->rdm); | 48 | } |
113 | + gen_helper_mve_vshlc(rdm, cpu_env, qd, rdm, tcg_constant_i32(a->imm)); | 49 | |
114 | + store_reg(s, a->rdm, rdm); | 50 | @@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine) |
115 | + tcg_temp_free_ptr(qd); | 51 | { "uart2", make_uart, &mms->uart[2], 0x40202000, 0x1000, { 36, 37, 44 } }, |
116 | + mve_update_eci(s); | 52 | { "uart3", make_uart, &mms->uart[3], 0x40203000, 0x1000, { 38, 39, 45 } }, |
117 | + return true; | 53 | { "uart4", make_uart, &mms->uart[4], 0x40204000, 0x1000, { 40, 41, 46 } }, |
118 | +} | 54 | - { "i2c0", make_i2c, &mms->i2c[0], 0x40207000, 0x1000 }, |
55 | - { "i2c1", make_i2c, &mms->i2c[1], 0x40208000, 0x1000 }, | ||
56 | - { "i2c2", make_i2c, &mms->i2c[2], 0x4020c000, 0x1000 }, | ||
57 | - { "i2c3", make_i2c, &mms->i2c[3], 0x4020d000, 0x1000 }, | ||
58 | + { "i2c0", make_i2c, &mms->i2c[0], 0x40207000, 0x1000, {}, | ||
59 | + { .i2c_internal = true /* touchscreen */ } }, | ||
60 | + { "i2c1", make_i2c, &mms->i2c[1], 0x40208000, 0x1000, {}, | ||
61 | + { .i2c_internal = true /* audio conf */ } }, | ||
62 | + { "i2c2", make_i2c, &mms->i2c[2], 0x4020c000, 0x1000, {}, | ||
63 | + { .i2c_internal = false /* shield 0 */ } }, | ||
64 | + { "i2c3", make_i2c, &mms->i2c[3], 0x4020d000, 0x1000, {}, | ||
65 | + { .i2c_internal = false /* shield 1 */ } }, | ||
66 | }, | ||
67 | }, { | ||
68 | .name = "apb_ppcexp2", | ||
69 | @@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine) | ||
70 | }, { | ||
71 | .name = "apb_ppcexp1", | ||
72 | .ports = { | ||
73 | - { "i2c0", make_i2c, &mms->i2c[0], 0x41200000, 0x1000 }, | ||
74 | - { "i2c1", make_i2c, &mms->i2c[1], 0x41201000, 0x1000 }, | ||
75 | + { "i2c0", make_i2c, &mms->i2c[0], 0x41200000, 0x1000, {}, | ||
76 | + { .i2c_internal = true /* touchscreen */ } }, | ||
77 | + { "i2c1", make_i2c, &mms->i2c[1], 0x41201000, 0x1000, {}, | ||
78 | + { .i2c_internal = true /* audio conf */ } }, | ||
79 | { "spi0", make_spi, &mms->spi[0], 0x41202000, 0x1000, { 52 } }, | ||
80 | { "spi1", make_spi, &mms->spi[1], 0x41203000, 0x1000, { 53 } }, | ||
81 | { "spi2", make_spi, &mms->spi[2], 0x41204000, 0x1000, { 54 } }, | ||
82 | - { "i2c2", make_i2c, &mms->i2c[2], 0x41205000, 0x1000 }, | ||
83 | - { "i2c3", make_i2c, &mms->i2c[3], 0x41206000, 0x1000 }, | ||
84 | + { "i2c2", make_i2c, &mms->i2c[2], 0x41205000, 0x1000, {}, | ||
85 | + { .i2c_internal = false /* shield 0 */ } }, | ||
86 | + { "i2c3", make_i2c, &mms->i2c[3], 0x41206000, 0x1000, {}, | ||
87 | + { .i2c_internal = false /* shield 1 */ } }, | ||
88 | { /* port 7 reserved */ }, | ||
89 | - { "i2c4", make_i2c, &mms->i2c[4], 0x41208000, 0x1000 }, | ||
90 | + { "i2c4", make_i2c, &mms->i2c[4], 0x41208000, 0x1000, {}, | ||
91 | + { .i2c_internal = true /* DDR4 EEPROM */ } }, | ||
92 | }, | ||
93 | }, { | ||
94 | .name = "apb_ppcexp2", | ||
95 | @@ -XXX,XX +XXX,XX @@ static void mps2tz_common_init(MachineState *machine) | ||
96 | }, { | ||
97 | .name = "apb_ppcexp1", | ||
98 | .ports = { | ||
99 | - { "i2c0", make_i2c, &mms->i2c[0], 0x49200000, 0x1000 }, | ||
100 | - { "i2c1", make_i2c, &mms->i2c[1], 0x49201000, 0x1000 }, | ||
101 | + { "i2c0", make_i2c, &mms->i2c[0], 0x49200000, 0x1000, {}, | ||
102 | + { .i2c_internal = true /* touchscreen */ } }, | ||
103 | + { "i2c1", make_i2c, &mms->i2c[1], 0x49201000, 0x1000, {}, | ||
104 | + { .i2c_internal = true /* audio conf */ } }, | ||
105 | { "spi0", make_spi, &mms->spi[0], 0x49202000, 0x1000, { 53 } }, | ||
106 | { "spi1", make_spi, &mms->spi[1], 0x49203000, 0x1000, { 54 } }, | ||
107 | { "spi2", make_spi, &mms->spi[2], 0x49204000, 0x1000, { 55 } }, | ||
108 | - { "i2c2", make_i2c, &mms->i2c[2], 0x49205000, 0x1000 }, | ||
109 | - { "i2c3", make_i2c, &mms->i2c[3], 0x49206000, 0x1000 }, | ||
110 | + { "i2c2", make_i2c, &mms->i2c[2], 0x49205000, 0x1000, {}, | ||
111 | + { .i2c_internal = false /* shield 0 */ } }, | ||
112 | + { "i2c3", make_i2c, &mms->i2c[3], 0x49206000, 0x1000, {}, | ||
113 | + { .i2c_internal = false /* shield 1 */ } }, | ||
114 | { /* port 7 reserved */ }, | ||
115 | - { "i2c4", make_i2c, &mms->i2c[4], 0x49208000, 0x1000 }, | ||
116 | + { "i2c4", make_i2c, &mms->i2c[4], 0x49208000, 0x1000, {}, | ||
117 | + { .i2c_internal = true /* DDR4 EEPROM */ } }, | ||
118 | }, | ||
119 | }, { | ||
120 | .name = "apb_ppcexp2", | ||
119 | -- | 121 | -- |
120 | 2.20.1 | 122 | 2.20.1 |
121 | 123 | ||
122 | 124 | diff view generated by jsdifflib |
1 | Implement the MVE shift-vector-left-by-immediate insns VSHL, VQSHL | 1 | The various MPS2 boards implemented in mps2.c have multiple I2C |
---|---|---|---|
2 | and VQSHLU. | 2 | buses: a bus dedicated to the audio configuration, one for the LCD |
3 | 3 | touchscreen controller, and two which are connected to the external | |
4 | The size-and-immediate encoding here is the same as Neon, and we | 4 | Shield expansion connector. Mark the buses which are used only for |
5 | handle it the same way neon-dp.decode does. | 5 | board-internal devices as 'full' so that if the user creates i2c |
6 | devices on the commandline without specifying a bus name then they | ||
7 | will be connected to the I2C controller used for the Shield | ||
8 | connector, where guest software will expect them. | ||
6 | 9 | ||
7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
9 | Message-id: 20210628135835.6690-8-peter.maydell@linaro.org | 12 | Message-id: 20210903151435.22379-5-peter.maydell@linaro.org |
10 | --- | 13 | --- |
11 | target/arm/helper-mve.h | 16 +++++++++++ | 14 | hw/arm/mps2.c | 12 +++++++++++- |
12 | target/arm/mve.decode | 23 +++++++++++++++ | 15 | 1 file changed, 11 insertions(+), 1 deletion(-) |
13 | target/arm/mve_helper.c | 57 ++++++++++++++++++++++++++++++++++++++ | ||
14 | target/arm/translate-mve.c | 51 ++++++++++++++++++++++++++++++++++ | ||
15 | 4 files changed, 147 insertions(+) | ||
16 | 16 | ||
17 | diff --git a/target/arm/helper-mve.h b/target/arm/helper-mve.h | 17 | diff --git a/hw/arm/mps2.c b/hw/arm/mps2.c |
18 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/helper-mve.h | 19 | --- a/hw/arm/mps2.c |
20 | +++ b/target/arm/helper-mve.h | 20 | +++ b/hw/arm/mps2.c |
21 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(mve_vaddvuw, TCG_CALL_NO_WG, i32, env, ptr, i32) | 21 | @@ -XXX,XX +XXX,XX @@ static void mps2_common_init(MachineState *machine) |
22 | DEF_HELPER_FLAGS_3(mve_vmovi, TCG_CALL_NO_WG, void, env, ptr, i64) | 22 | 0x40023000, /* Audio */ |
23 | DEF_HELPER_FLAGS_3(mve_vandi, TCG_CALL_NO_WG, void, env, ptr, i64) | 23 | 0x40029000, /* Shield0 */ |
24 | DEF_HELPER_FLAGS_3(mve_vorri, TCG_CALL_NO_WG, void, env, ptr, i64) | 24 | 0x4002a000}; /* Shield1 */ |
25 | - sysbus_create_simple(TYPE_ARM_SBCON_I2C, i2cbase[i], NULL); | ||
26 | + DeviceState *dev; | ||
25 | + | 27 | + |
26 | +DEF_HELPER_FLAGS_4(mve_vshli_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 28 | + dev = sysbus_create_simple(TYPE_ARM_SBCON_I2C, i2cbase[i], NULL); |
27 | +DEF_HELPER_FLAGS_4(mve_vshli_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 29 | + if (i < 2) { |
28 | +DEF_HELPER_FLAGS_4(mve_vshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 30 | + /* |
29 | + | 31 | + * internal-only bus: mark it full to avoid user-created |
30 | +DEF_HELPER_FLAGS_4(mve_vqshli_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 32 | + * i2c devices being plugged into it. |
31 | +DEF_HELPER_FLAGS_4(mve_vqshli_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 33 | + */ |
32 | +DEF_HELPER_FLAGS_4(mve_vqshli_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 34 | + BusState *qbus = qdev_get_child_bus(dev, "i2c"); |
33 | + | 35 | + qbus_mark_full(qbus); |
34 | +DEF_HELPER_FLAGS_4(mve_vqshli_ub, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | 36 | + } |
35 | +DEF_HELPER_FLAGS_4(mve_vqshli_uh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
36 | +DEF_HELPER_FLAGS_4(mve_vqshli_uw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
37 | + | ||
38 | +DEF_HELPER_FLAGS_4(mve_vqshlui_sb, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
39 | +DEF_HELPER_FLAGS_4(mve_vqshlui_sh, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
40 | +DEF_HELPER_FLAGS_4(mve_vqshlui_sw, TCG_CALL_NO_WG, void, env, ptr, ptr, i32) | ||
41 | diff --git a/target/arm/mve.decode b/target/arm/mve.decode | ||
42 | index XXXXXXX..XXXXXXX 100644 | ||
43 | --- a/target/arm/mve.decode | ||
44 | +++ b/target/arm/mve.decode | ||
45 | @@ -XXX,XX +XXX,XX @@ | ||
46 | &2op qd qm qn size | ||
47 | &2scalar qd qn rm size | ||
48 | &1imm qd imm cmode op | ||
49 | +&2shift qd qm shift size | ||
50 | |||
51 | @vldr_vstr ....... . . . . l:1 rn:4 ... ...... imm:7 &vldr_vstr qd=%qd u=0 | ||
52 | # Note that both Rn and Qd are 3 bits only (no D bit) | ||
53 | @@ -XXX,XX +XXX,XX @@ | ||
54 | @2scalar .... .... .. size:2 .... .... .... .... rm:4 &2scalar qd=%qd qn=%qn | ||
55 | @2scalar_nosz .... .... .... .... .... .... .... rm:4 &2scalar qd=%qd qn=%qn | ||
56 | |||
57 | +@2_shl_b .... .... .. 001 shift:3 .... .... .... .... &2shift qd=%qd qm=%qm size=0 | ||
58 | +@2_shl_h .... .... .. 01 shift:4 .... .... .... .... &2shift qd=%qd qm=%qm size=1 | ||
59 | +@2_shl_w .... .... .. 1 shift:5 .... .... .... .... &2shift qd=%qd qm=%qm size=2 | ||
60 | + | ||
61 | # Vector loads and stores | ||
62 | |||
63 | # Widening loads and narrowing stores: | ||
64 | @@ -XXX,XX +XXX,XX @@ VPST 1111 1110 0 . 11 000 1 ... 0 1111 0100 1101 mask=%mask_22_13 | ||
65 | # So we have a single decode line and check the cmode/op in the | ||
66 | # trans function. | ||
67 | Vimm_1r 111 . 1111 1 . 00 0 ... ... 0 .... 0 1 . 1 .... @1imm | ||
68 | + | ||
69 | +# Shifts by immediate | ||
70 | + | ||
71 | +VSHLI 111 0 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_b | ||
72 | +VSHLI 111 0 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_h | ||
73 | +VSHLI 111 0 1111 1 . ... ... ... 0 0101 0 1 . 1 ... 0 @2_shl_w | ||
74 | + | ||
75 | +VQSHLI_S 111 0 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_b | ||
76 | +VQSHLI_S 111 0 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_h | ||
77 | +VQSHLI_S 111 0 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_w | ||
78 | + | ||
79 | +VQSHLI_U 111 1 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_b | ||
80 | +VQSHLI_U 111 1 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_h | ||
81 | +VQSHLI_U 111 1 1111 1 . ... ... ... 0 0111 0 1 . 1 ... 0 @2_shl_w | ||
82 | + | ||
83 | +VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_b | ||
84 | +VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_h | ||
85 | +VQSHLUI 111 1 1111 1 . ... ... ... 0 0110 0 1 . 1 ... 0 @2_shl_w | ||
86 | diff --git a/target/arm/mve_helper.c b/target/arm/mve_helper.c | ||
87 | index XXXXXXX..XXXXXXX 100644 | ||
88 | --- a/target/arm/mve_helper.c | ||
89 | +++ b/target/arm/mve_helper.c | ||
90 | @@ -XXX,XX +XXX,XX @@ DO_2OP_SAT(vqsubsw, 4, int32_t, DO_SQSUB_W) | ||
91 | WRAP_QRSHL_HELPER(do_sqrshl_bhs, N, M, true, satp) | ||
92 | #define DO_UQRSHL_OP(N, M, satp) \ | ||
93 | WRAP_QRSHL_HELPER(do_uqrshl_bhs, N, M, true, satp) | ||
94 | +#define DO_SUQSHL_OP(N, M, satp) \ | ||
95 | + WRAP_QRSHL_HELPER(do_suqrshl_bhs, N, M, false, satp) | ||
96 | |||
97 | DO_2OP_SAT_S(vqshls, DO_SQSHL_OP) | ||
98 | DO_2OP_SAT_U(vqshlu, DO_UQSHL_OP) | ||
99 | @@ -XXX,XX +XXX,XX @@ DO_VADDV(vaddvsw, 4, uint32_t) | ||
100 | DO_VADDV(vaddvub, 1, uint8_t) | ||
101 | DO_VADDV(vaddvuh, 2, uint16_t) | ||
102 | DO_VADDV(vaddvuw, 4, uint32_t) | ||
103 | + | ||
104 | +/* Shifts by immediate */ | ||
105 | +#define DO_2SHIFT(OP, ESIZE, TYPE, FN) \ | ||
106 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
107 | + void *vm, uint32_t shift) \ | ||
108 | + { \ | ||
109 | + TYPE *d = vd, *m = vm; \ | ||
110 | + uint16_t mask = mve_element_mask(env); \ | ||
111 | + unsigned e; \ | ||
112 | + for (e = 0; e < 16 / ESIZE; e++, mask >>= ESIZE) { \ | ||
113 | + mergemask(&d[H##ESIZE(e)], \ | ||
114 | + FN(m[H##ESIZE(e)], shift), mask); \ | ||
115 | + } \ | ||
116 | + mve_advance_vpt(env); \ | ||
117 | + } | ||
118 | + | ||
119 | +#define DO_2SHIFT_SAT(OP, ESIZE, TYPE, FN) \ | ||
120 | + void HELPER(glue(mve_, OP))(CPUARMState *env, void *vd, \ | ||
121 | + void *vm, uint32_t shift) \ | ||
122 | + { \ | ||
123 | + TYPE *d = vd, *m = vm; \ | ||
124 | + uint16_t mask = mve_element_mask(env); \ | ||
125 | + unsigned e; \ | ||
126 | + bool qc = false; \ | ||
127 | + for (e = 0; e < 16 / ESIZE; e++, mask >>= ESIZE) { \ | ||
128 | + bool sat = false; \ | ||
129 | + mergemask(&d[H##ESIZE(e)], \ | ||
130 | + FN(m[H##ESIZE(e)], shift, &sat), mask); \ | ||
131 | + qc |= sat & mask & 1; \ | ||
132 | + } \ | ||
133 | + if (qc) { \ | ||
134 | + env->vfp.qc[0] = qc; \ | ||
135 | + } \ | ||
136 | + mve_advance_vpt(env); \ | ||
137 | + } | ||
138 | + | ||
139 | +/* provide unsigned 2-op shift helpers for all sizes */ | ||
140 | +#define DO_2SHIFT_U(OP, FN) \ | ||
141 | + DO_2SHIFT(OP##b, 1, uint8_t, FN) \ | ||
142 | + DO_2SHIFT(OP##h, 2, uint16_t, FN) \ | ||
143 | + DO_2SHIFT(OP##w, 4, uint32_t, FN) | ||
144 | + | ||
145 | +#define DO_2SHIFT_SAT_U(OP, FN) \ | ||
146 | + DO_2SHIFT_SAT(OP##b, 1, uint8_t, FN) \ | ||
147 | + DO_2SHIFT_SAT(OP##h, 2, uint16_t, FN) \ | ||
148 | + DO_2SHIFT_SAT(OP##w, 4, uint32_t, FN) | ||
149 | +#define DO_2SHIFT_SAT_S(OP, FN) \ | ||
150 | + DO_2SHIFT_SAT(OP##b, 1, int8_t, FN) \ | ||
151 | + DO_2SHIFT_SAT(OP##h, 2, int16_t, FN) \ | ||
152 | + DO_2SHIFT_SAT(OP##w, 4, int32_t, FN) | ||
153 | + | ||
154 | +DO_2SHIFT_U(vshli_u, DO_VSHLU) | ||
155 | +DO_2SHIFT_SAT_U(vqshli_u, DO_UQSHL_OP) | ||
156 | +DO_2SHIFT_SAT_S(vqshli_s, DO_SQSHL_OP) | ||
157 | +DO_2SHIFT_SAT_S(vqshlui_s, DO_SUQSHL_OP) | ||
158 | diff --git a/target/arm/translate-mve.c b/target/arm/translate-mve.c | ||
159 | index XXXXXXX..XXXXXXX 100644 | ||
160 | --- a/target/arm/translate-mve.c | ||
161 | +++ b/target/arm/translate-mve.c | ||
162 | @@ -XXX,XX +XXX,XX @@ typedef void MVEGenLdStFn(TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
163 | typedef void MVEGenOneOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr); | ||
164 | typedef void MVEGenTwoOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr); | ||
165 | typedef void MVEGenTwoOpScalarFn(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
166 | +typedef void MVEGenTwoOpShiftFn(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
167 | typedef void MVEGenDualAccOpFn(TCGv_i64, TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_i64); | ||
168 | typedef void MVEGenVADDVFn(TCGv_i32, TCGv_ptr, TCGv_ptr, TCGv_i32); | ||
169 | typedef void MVEGenOneOpImmFn(TCGv_ptr, TCGv_ptr, TCGv_i64); | ||
170 | @@ -XXX,XX +XXX,XX @@ static bool trans_Vimm_1r(DisasContext *s, arg_1imm *a) | ||
171 | } | 37 | } |
172 | return do_1imm(s, a, fn); | 38 | create_unimplemented_device("i2s", 0x40024000, 0x400); |
173 | } | 39 | |
174 | + | ||
175 | +static bool do_2shift(DisasContext *s, arg_2shift *a, MVEGenTwoOpShiftFn fn, | ||
176 | + bool negateshift) | ||
177 | +{ | ||
178 | + TCGv_ptr qd, qm; | ||
179 | + int shift = a->shift; | ||
180 | + | ||
181 | + if (!dc_isar_feature(aa32_mve, s) || | ||
182 | + !mve_check_qreg_bank(s, a->qd | a->qm) || | ||
183 | + !fn) { | ||
184 | + return false; | ||
185 | + } | ||
186 | + if (!mve_eci_check(s) || !vfp_access_check(s)) { | ||
187 | + return true; | ||
188 | + } | ||
189 | + | ||
190 | + /* | ||
191 | + * When we handle a right shift insn using a left-shift helper | ||
192 | + * which permits a negative shift count to indicate a right-shift, | ||
193 | + * we must negate the shift count. | ||
194 | + */ | ||
195 | + if (negateshift) { | ||
196 | + shift = -shift; | ||
197 | + } | ||
198 | + | ||
199 | + qd = mve_qreg_ptr(a->qd); | ||
200 | + qm = mve_qreg_ptr(a->qm); | ||
201 | + fn(cpu_env, qd, qm, tcg_constant_i32(shift)); | ||
202 | + tcg_temp_free_ptr(qd); | ||
203 | + tcg_temp_free_ptr(qm); | ||
204 | + mve_update_eci(s); | ||
205 | + return true; | ||
206 | +} | ||
207 | + | ||
208 | +#define DO_2SHIFT(INSN, FN, NEGATESHIFT) \ | ||
209 | + static bool trans_##INSN(DisasContext *s, arg_2shift *a) \ | ||
210 | + { \ | ||
211 | + static MVEGenTwoOpShiftFn * const fns[] = { \ | ||
212 | + gen_helper_mve_##FN##b, \ | ||
213 | + gen_helper_mve_##FN##h, \ | ||
214 | + gen_helper_mve_##FN##w, \ | ||
215 | + NULL, \ | ||
216 | + }; \ | ||
217 | + return do_2shift(s, a, fns[a->size], NEGATESHIFT); \ | ||
218 | + } | ||
219 | + | ||
220 | +DO_2SHIFT(VSHLI, vshli_u, false) | ||
221 | +DO_2SHIFT(VQSHLI_S, vqshli_s, false) | ||
222 | +DO_2SHIFT(VQSHLI_U, vqshli_u, false) | ||
223 | +DO_2SHIFT(VQSHLUI, vqshlui_s, false) | ||
224 | -- | 40 | -- |
225 | 2.20.1 | 41 | 2.20.1 |
226 | 42 | ||
227 | 43 | diff view generated by jsdifflib |