1 | I don't have anything else queued up at the moment, so this is just | 1 | Hi; this pullreq includes FEAT_LSE2 support, the new |
---|---|---|---|
2 | Richard's SME patches. | 2 | bpim2u board, and some other smaller patchsets. |
3 | 3 | ||
4 | thanks | ||
4 | -- PMM | 5 | -- PMM |
5 | 6 | ||
6 | The following changes since commit 63b38f6c85acd312c2cab68554abf33adf4ee2b3: | 7 | The following changes since commit 369081c4558e7e940fa36ce59bf17b2e390f55d3: |
7 | 8 | ||
8 | Merge tag 'pull-target-arm-20220707' of https://git.linaro.org/people/pmaydell/qemu-arm into staging (2022-07-08 06:17:11 +0530) | 9 | Merge tag 'pull-tcg-20230605' of https://gitlab.com/rth7680/qemu into staging (2023-06-05 13:16:56 -0700) |
9 | 10 | ||
10 | are available in the Git repository at: | 11 | are available in the Git repository at: |
11 | 12 | ||
12 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20220711 | 13 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20230606 |
13 | 14 | ||
14 | for you to fetch changes up to f9982ceaf26df27d15547a3a7990a95019e9e3a8: | 15 | for you to fetch changes up to f9ac778898cb28307e0f91421aba34d43c34b679: |
15 | 16 | ||
16 | linux-user/aarch64: Add SME related hwcap entries (2022-07-11 13:43:52 +0100) | 17 | target/arm: trap DCC access in user mode emulation (2023-06-06 10:19:40 +0100) |
17 | 18 | ||
18 | ---------------------------------------------------------------- | 19 | ---------------------------------------------------------------- |
19 | target-arm: | 20 | target-arm queue: |
20 | * Implement SME emulation, for both system and linux-user | 21 | * Support gdbstub (guest debug) in HVF |
22 | * xnlx-versal: Support CANFD controller | ||
23 | * bpim2u: New board model: Banana Pi BPI-M2 Ultra | ||
24 | * Emulate FEAT_LSE2 | ||
25 | * allow DC CVA[D]P in user mode emulation | ||
26 | * trap DCC access in user mode emulation | ||
21 | 27 | ||
22 | ---------------------------------------------------------------- | 28 | ---------------------------------------------------------------- |
23 | Richard Henderson (45): | 29 | Francesco Cagnin (4): |
24 | target/arm: Handle SME in aarch64_cpu_dump_state | 30 | arm: move KVM breakpoints helpers |
25 | target/arm: Add infrastructure for disas_sme | 31 | hvf: handle access for more registers |
26 | target/arm: Trap non-streaming usage when Streaming SVE is active | 32 | hvf: add breakpoint handlers |
27 | target/arm: Mark ADR as non-streaming | 33 | hvf: add guest debugging handlers for Apple Silicon hosts |
28 | target/arm: Mark RDFFR, WRFFR, SETFFR as non-streaming | ||
29 | target/arm: Mark BDEP, BEXT, BGRP, COMPACT, FEXPA, FTSSEL as non-streaming | ||
30 | target/arm: Mark PMULL, FMMLA as non-streaming | ||
31 | target/arm: Mark FTSMUL, FTMAD, FADDA as non-streaming | ||
32 | target/arm: Mark SMMLA, UMMLA, USMMLA as non-streaming | ||
33 | target/arm: Mark string/histo/crypto as non-streaming | ||
34 | target/arm: Mark gather/scatter load/store as non-streaming | ||
35 | target/arm: Mark gather prefetch as non-streaming | ||
36 | target/arm: Mark LDFF1 and LDNF1 as non-streaming | ||
37 | target/arm: Mark LD1RO as non-streaming | ||
38 | target/arm: Add SME enablement checks | ||
39 | target/arm: Handle SME in sve_access_check | ||
40 | target/arm: Implement SME RDSVL, ADDSVL, ADDSPL | ||
41 | target/arm: Implement SME ZERO | ||
42 | target/arm: Implement SME MOVA | ||
43 | target/arm: Implement SME LD1, ST1 | ||
44 | target/arm: Export unpredicated ld/st from translate-sve.c | ||
45 | target/arm: Implement SME LDR, STR | ||
46 | target/arm: Implement SME ADDHA, ADDVA | ||
47 | target/arm: Implement FMOPA, FMOPS (non-widening) | ||
48 | target/arm: Implement BFMOPA, BFMOPS | ||
49 | target/arm: Implement FMOPA, FMOPS (widening) | ||
50 | target/arm: Implement SME integer outer product | ||
51 | target/arm: Implement PSEL | ||
52 | target/arm: Implement REVD | ||
53 | target/arm: Implement SCLAMP, UCLAMP | ||
54 | target/arm: Reset streaming sve state on exception boundaries | ||
55 | target/arm: Enable SME for -cpu max | ||
56 | linux-user/aarch64: Clear tpidr2_el0 if CLONE_SETTLS | ||
57 | linux-user/aarch64: Reset PSTATE.SM on syscalls | ||
58 | linux-user/aarch64: Add SM bit to SVE signal context | ||
59 | linux-user/aarch64: Tidy target_restore_sigframe error return | ||
60 | linux-user/aarch64: Do not allow duplicate or short sve records | ||
61 | linux-user/aarch64: Verify extra record lock succeeded | ||
62 | linux-user/aarch64: Move sve record checks into restore | ||
63 | linux-user/aarch64: Implement SME signal handling | ||
64 | linux-user: Rename sve prctls | ||
65 | linux-user/aarch64: Implement PR_SME_GET_VL, PR_SME_SET_VL | ||
66 | target/arm: Only set ZEN in reset if SVE present | ||
67 | target/arm: Enable SME for user-only | ||
68 | linux-user/aarch64: Add SME related hwcap entries | ||
69 | 34 | ||
70 | docs/system/arm/emulation.rst | 4 + | 35 | Richard Henderson (20): |
71 | linux-user/aarch64/target_cpu.h | 5 +- | 36 | target/arm: Add commentary for CPUARMState.exclusive_high |
72 | linux-user/aarch64/target_prctl.h | 62 +- | 37 | target/arm: Add feature test for FEAT_LSE2 |
73 | target/arm/cpu.h | 7 + | 38 | target/arm: Introduce finalize_memop_{atom,pair} |
74 | target/arm/helper-sme.h | 126 ++++ | 39 | target/arm: Use tcg_gen_qemu_ld_i128 for LDXP |
75 | target/arm/helper-sve.h | 4 + | 40 | target/arm: Use tcg_gen_qemu_{st, ld}_i128 for do_fp_{st, ld} |
76 | target/arm/helper.h | 18 + | 41 | target/arm: Use tcg_gen_qemu_st_i128 for STZG, STZ2G |
77 | target/arm/translate-a64.h | 45 ++ | 42 | target/arm: Use tcg_gen_qemu_{ld, st}_i128 in gen_sve_{ld, st}r |
78 | target/arm/translate.h | 16 + | 43 | target/arm: Sink gen_mte_check1 into load/store_exclusive |
79 | target/arm/sme-fa64.decode | 60 ++ | 44 | target/arm: Load/store integer pair with one tcg operation |
80 | target/arm/sme.decode | 88 +++ | 45 | target/arm: Hoist finalize_memop out of do_gpr_{ld, st} |
81 | target/arm/sve.decode | 41 +- | 46 | target/arm: Hoist finalize_memop out of do_fp_{ld, st} |
82 | linux-user/aarch64/cpu_loop.c | 9 + | 47 | target/arm: Pass memop to gen_mte_check1* |
83 | linux-user/aarch64/signal.c | 243 ++++++-- | 48 | target/arm: Pass single_memop to gen_mte_checkN |
84 | linux-user/elfload.c | 20 + | 49 | target/arm: Check alignment in helper_mte_check |
85 | linux-user/syscall.c | 28 +- | 50 | target/arm: Add SCTLR.nAA to TBFLAG_A64 |
86 | target/arm/cpu.c | 35 +- | 51 | target/arm: Relax ordered/atomic alignment checks for LSE2 |
87 | target/arm/cpu64.c | 11 + | 52 | target/arm: Move mte check for store-exclusive |
88 | target/arm/helper.c | 56 +- | 53 | tests/tcg/aarch64: Use stz2g in mte-7.c |
89 | target/arm/sme_helper.c | 1140 +++++++++++++++++++++++++++++++++++++ | 54 | tests/tcg/multiarch: Adjust sigbus.c |
90 | target/arm/sve_helper.c | 28 + | 55 | target/arm: Enable FEAT_LSE2 for -cpu max |
91 | target/arm/translate-a64.c | 103 +++- | 56 | |
92 | target/arm/translate-sme.c | 373 ++++++++++++ | 57 | Vikram Garhwal (4): |
93 | target/arm/translate-sve.c | 393 ++++++++++--- | 58 | hw/net/can: Introduce Xilinx Versal CANFD controller |
94 | target/arm/translate-vfp.c | 12 + | 59 | xlnx-versal: Connect Xilinx VERSAL CANFD controllers |
95 | target/arm/translate.c | 2 + | 60 | MAINTAINERS: Include canfd tests under Xilinx CAN |
96 | target/arm/vec_helper.c | 24 + | 61 | tests/qtest: Introduce tests for Xilinx VERSAL CANFD controller |
97 | target/arm/meson.build | 3 + | 62 | |
98 | 28 files changed, 2821 insertions(+), 135 deletions(-) | 63 | Zhuojia Shen (3): |
99 | create mode 100644 target/arm/sme-fa64.decode | 64 | target/arm: allow DC CVA[D]P in user mode emulation |
100 | create mode 100644 target/arm/sme.decode | 65 | tests/tcg/aarch64: add DC CVA[D]P tests |
101 | create mode 100644 target/arm/translate-sme.c | 66 | target/arm: trap DCC access in user mode emulation |
67 | |||
68 | qianfan Zhao (11): | ||
69 | hw: arm: Add bananapi M2-Ultra and allwinner-r40 support | ||
70 | hw/arm/allwinner-r40: add Clock Control Unit | ||
71 | hw: allwinner-r40: Complete uart devices | ||
72 | hw: arm: allwinner-r40: Add i2c0 device | ||
73 | hw/misc: Rename axp209 to axp22x and add support AXP221 PMU | ||
74 | hw/arm/allwinner-r40: add SDRAM controller device | ||
75 | hw: sd: allwinner-sdhost: Add sun50i-a64 SoC support | ||
76 | hw: arm: allwinner-r40: Add emac and gmac support | ||
77 | hw: arm: allwinner-sramc: Add SRAM Controller support for R40 | ||
78 | tests: avocado: boot_linux_console: Add test case for bpim2u | ||
79 | docs: system: arm: Introduce bananapi_m2u | ||
80 | |||
81 | MAINTAINERS | 2 +- | ||
82 | docs/system/arm/bananapi_m2u.rst | 139 +++ | ||
83 | docs/system/arm/emulation.rst | 1 + | ||
84 | docs/system/arm/xlnx-versal-virt.rst | 31 + | ||
85 | docs/system/target-arm.rst | 1 + | ||
86 | include/hw/arm/allwinner-r40.h | 143 +++ | ||
87 | include/hw/arm/xlnx-versal.h | 12 + | ||
88 | include/hw/misc/allwinner-r40-ccu.h | 65 + | ||
89 | include/hw/misc/allwinner-r40-dramc.h | 108 ++ | ||
90 | include/hw/misc/allwinner-sramc.h | 69 ++ | ||
91 | include/hw/net/xlnx-versal-canfd.h | 87 ++ | ||
92 | include/hw/sd/allwinner-sdhost.h | 9 + | ||
93 | include/sysemu/hvf.h | 37 + | ||
94 | include/sysemu/hvf_int.h | 2 + | ||
95 | target/arm/cpu.h | 16 +- | ||
96 | target/arm/hvf_arm.h | 7 + | ||
97 | target/arm/internals.h | 53 +- | ||
98 | target/arm/tcg/helper-a64.h | 3 + | ||
99 | target/arm/tcg/translate-a64.h | 4 +- | ||
100 | target/arm/tcg/translate.h | 65 +- | ||
101 | accel/hvf/hvf-accel-ops.c | 119 ++ | ||
102 | accel/hvf/hvf-all.c | 23 + | ||
103 | hw/arm/allwinner-r40.c | 526 ++++++++ | ||
104 | hw/arm/bananapi_m2u.c | 145 +++ | ||
105 | hw/arm/xlnx-versal-virt.c | 53 + | ||
106 | hw/arm/xlnx-versal.c | 37 + | ||
107 | hw/misc/allwinner-r40-ccu.c | 209 ++++ | ||
108 | hw/misc/allwinner-r40-dramc.c | 513 ++++++++ | ||
109 | hw/misc/allwinner-sramc.c | 184 +++ | ||
110 | hw/misc/axp209.c | 238 ---- | ||
111 | hw/misc/axp2xx.c | 283 +++++ | ||
112 | hw/net/can/xlnx-versal-canfd.c | 2107 +++++++++++++++++++++++++++++++++ | ||
113 | hw/sd/allwinner-sdhost.c | 72 +- | ||
114 | target/arm/cpu.c | 2 + | ||
115 | target/arm/debug_helper.c | 5 + | ||
116 | target/arm/helper.c | 6 +- | ||
117 | target/arm/hvf/hvf.c | 750 +++++++++++- | ||
118 | target/arm/hyp_gdbstub.c | 253 ++++ | ||
119 | target/arm/kvm64.c | 276 ----- | ||
120 | target/arm/tcg/cpu64.c | 1 + | ||
121 | target/arm/tcg/helper-a64.c | 7 + | ||
122 | target/arm/tcg/hflags.c | 6 + | ||
123 | target/arm/tcg/mte_helper.c | 18 + | ||
124 | target/arm/tcg/translate-a64.c | 477 +++++--- | ||
125 | target/arm/tcg/translate-sve.c | 106 +- | ||
126 | target/arm/tcg/translate.c | 1 + | ||
127 | target/i386/hvf/hvf.c | 33 + | ||
128 | tests/qtest/xlnx-canfd-test.c | 423 +++++++ | ||
129 | tests/tcg/aarch64/dcpodp.c | 63 + | ||
130 | tests/tcg/aarch64/dcpop.c | 63 + | ||
131 | tests/tcg/aarch64/mte-7.c | 3 +- | ||
132 | tests/tcg/multiarch/sigbus.c | 13 +- | ||
133 | hw/arm/Kconfig | 14 +- | ||
134 | hw/arm/meson.build | 1 + | ||
135 | hw/misc/Kconfig | 5 +- | ||
136 | hw/misc/meson.build | 5 +- | ||
137 | hw/misc/trace-events | 26 +- | ||
138 | hw/net/can/meson.build | 1 + | ||
139 | hw/net/can/trace-events | 7 + | ||
140 | target/arm/meson.build | 3 +- | ||
141 | tests/avocado/boot_linux_console.py | 176 +++ | ||
142 | tests/qtest/meson.build | 1 + | ||
143 | tests/tcg/aarch64/Makefile.target | 11 + | ||
144 | 63 files changed, 7386 insertions(+), 733 deletions(-) | ||
145 | create mode 100644 docs/system/arm/bananapi_m2u.rst | ||
146 | create mode 100644 include/hw/arm/allwinner-r40.h | ||
147 | create mode 100644 include/hw/misc/allwinner-r40-ccu.h | ||
148 | create mode 100644 include/hw/misc/allwinner-r40-dramc.h | ||
149 | create mode 100644 include/hw/misc/allwinner-sramc.h | ||
150 | create mode 100644 include/hw/net/xlnx-versal-canfd.h | ||
151 | create mode 100644 hw/arm/allwinner-r40.c | ||
152 | create mode 100644 hw/arm/bananapi_m2u.c | ||
153 | create mode 100644 hw/misc/allwinner-r40-ccu.c | ||
154 | create mode 100644 hw/misc/allwinner-r40-dramc.c | ||
155 | create mode 100644 hw/misc/allwinner-sramc.c | ||
156 | delete mode 100644 hw/misc/axp209.c | ||
157 | create mode 100644 hw/misc/axp2xx.c | ||
158 | create mode 100644 hw/net/can/xlnx-versal-canfd.c | ||
159 | create mode 100644 target/arm/hyp_gdbstub.c | ||
160 | create mode 100644 tests/qtest/xlnx-canfd-test.c | ||
161 | create mode 100644 tests/tcg/aarch64/dcpodp.c | ||
162 | create mode 100644 tests/tcg/aarch64/dcpop.c | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Francesco Cagnin <fcagnin@quarkslab.com> |
---|---|---|---|
2 | 2 | ||
3 | These functions will be used to verify that the cpu | 3 | These helpers will be also used for HVF. Aside from reformatting a |
4 | is in the correct state for a given instruction. | 4 | couple of comments for 'checkpatch.pl' and updating meson to compile |
5 | 'hyp_gdbstub.c', this is just code motion. | ||
5 | 6 | ||
7 | Signed-off-by: Francesco Cagnin <fcagnin@quarkslab.com> | ||
8 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 10 | Message-id: 20230601153107.81955-2-fcagnin@quarkslab.com |
8 | Message-id: 20220708151540.18136-16-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 12 | --- |
11 | target/arm/translate-a64.h | 21 +++++++++++++++++++++ | 13 | target/arm/internals.h | 50 +++++++ |
12 | target/arm/translate-a64.c | 34 ++++++++++++++++++++++++++++++++++ | 14 | target/arm/hyp_gdbstub.c | 253 +++++++++++++++++++++++++++++++++++ |
13 | 2 files changed, 55 insertions(+) | 15 | target/arm/kvm64.c | 276 --------------------------------------- |
16 | target/arm/meson.build | 3 +- | ||
17 | 4 files changed, 305 insertions(+), 277 deletions(-) | ||
18 | create mode 100644 target/arm/hyp_gdbstub.c | ||
14 | 19 | ||
15 | diff --git a/target/arm/translate-a64.h b/target/arm/translate-a64.h | 20 | diff --git a/target/arm/internals.h b/target/arm/internals.h |
16 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate-a64.h | 22 | --- a/target/arm/internals.h |
18 | +++ b/target/arm/translate-a64.h | 23 | +++ b/target/arm/internals.h |
19 | @@ -XXX,XX +XXX,XX @@ void write_fp_dreg(DisasContext *s, int reg, TCGv_i64 v); | 24 | @@ -XXX,XX +XXX,XX @@ static inline bool arm_fgt_active(CPUARMState *env, int el) |
20 | bool logic_imm_decode_wmask(uint64_t *result, unsigned int immn, | 25 | } |
21 | unsigned int imms, unsigned int immr); | 26 | |
22 | bool sve_access_check(DisasContext *s); | 27 | void assert_hflags_rebuild_correctly(CPUARMState *env); |
23 | +bool sme_enabled_check(DisasContext *s); | 28 | + |
24 | +bool sme_enabled_check_with_svcr(DisasContext *s, unsigned); | 29 | +/* |
25 | + | 30 | + * Although the ARM implementation of hardware assisted debugging |
26 | +/* This function corresponds to CheckStreamingSVEEnabled. */ | 31 | + * allows for different breakpoints per-core, the current GDB |
27 | +static inline bool sme_sm_enabled_check(DisasContext *s) | 32 | + * interface treats them as a global pool of registers (which seems to |
33 | + * be the case for x86, ppc and s390). As a result we store one copy | ||
34 | + * of registers which is used for all active cores. | ||
35 | + * | ||
36 | + * Write access is serialised by virtue of the GDB protocol which | ||
37 | + * updates things. Read access (i.e. when the values are copied to the | ||
38 | + * vCPU) is also gated by GDB's run control. | ||
39 | + * | ||
40 | + * This is not unreasonable as most of the time debugging kernels you | ||
41 | + * never know which core will eventually execute your function. | ||
42 | + */ | ||
43 | + | ||
44 | +typedef struct { | ||
45 | + uint64_t bcr; | ||
46 | + uint64_t bvr; | ||
47 | +} HWBreakpoint; | ||
48 | + | ||
49 | +/* | ||
50 | + * The watchpoint registers can cover more area than the requested | ||
51 | + * watchpoint so we need to store the additional information | ||
52 | + * somewhere. We also need to supply a CPUWatchpoint to the GDB stub | ||
53 | + * when the watchpoint is hit. | ||
54 | + */ | ||
55 | +typedef struct { | ||
56 | + uint64_t wcr; | ||
57 | + uint64_t wvr; | ||
58 | + CPUWatchpoint details; | ||
59 | +} HWWatchpoint; | ||
60 | + | ||
61 | +/* Maximum and current break/watch point counts */ | ||
62 | +extern int max_hw_bps, max_hw_wps; | ||
63 | +extern GArray *hw_breakpoints, *hw_watchpoints; | ||
64 | + | ||
65 | +#define cur_hw_wps (hw_watchpoints->len) | ||
66 | +#define cur_hw_bps (hw_breakpoints->len) | ||
67 | +#define get_hw_bp(i) (&g_array_index(hw_breakpoints, HWBreakpoint, i)) | ||
68 | +#define get_hw_wp(i) (&g_array_index(hw_watchpoints, HWWatchpoint, i)) | ||
69 | + | ||
70 | +bool find_hw_breakpoint(CPUState *cpu, target_ulong pc); | ||
71 | +int insert_hw_breakpoint(target_ulong pc); | ||
72 | +int delete_hw_breakpoint(target_ulong pc); | ||
73 | + | ||
74 | +bool check_watchpoint_in_range(int i, target_ulong addr); | ||
75 | +CPUWatchpoint *find_hw_watchpoint(CPUState *cpu, target_ulong addr); | ||
76 | +int insert_hw_watchpoint(target_ulong addr, target_ulong len, int type); | ||
77 | +int delete_hw_watchpoint(target_ulong addr, target_ulong len, int type); | ||
78 | #endif | ||
79 | diff --git a/target/arm/hyp_gdbstub.c b/target/arm/hyp_gdbstub.c | ||
80 | new file mode 100644 | ||
81 | index XXXXXXX..XXXXXXX | ||
82 | --- /dev/null | ||
83 | +++ b/target/arm/hyp_gdbstub.c | ||
84 | @@ -XXX,XX +XXX,XX @@ | ||
85 | +/* | ||
86 | + * ARM implementation of KVM and HVF hooks, 64 bit specific code | ||
87 | + * | ||
88 | + * Copyright Mian-M. Hamayun 2013, Virtual Open Systems | ||
89 | + * Copyright Alex Bennée 2014, Linaro | ||
90 | + * | ||
91 | + * This work is licensed under the terms of the GNU GPL, version 2 or later. | ||
92 | + * See the COPYING file in the top-level directory. | ||
93 | + * | ||
94 | + */ | ||
95 | + | ||
96 | +#include "qemu/osdep.h" | ||
97 | +#include "cpu.h" | ||
98 | +#include "internals.h" | ||
99 | +#include "exec/gdbstub.h" | ||
100 | + | ||
101 | +/* Maximum and current break/watch point counts */ | ||
102 | +int max_hw_bps, max_hw_wps; | ||
103 | +GArray *hw_breakpoints, *hw_watchpoints; | ||
104 | + | ||
105 | +/** | ||
106 | + * insert_hw_breakpoint() | ||
107 | + * @addr: address of breakpoint | ||
108 | + * | ||
109 | + * See ARM ARM D2.9.1 for details but here we are only going to create | ||
110 | + * simple un-linked breakpoints (i.e. we don't chain breakpoints | ||
111 | + * together to match address and context or vmid). The hardware is | ||
112 | + * capable of fancier matching but that will require exposing that | ||
113 | + * fanciness to GDB's interface | ||
114 | + * | ||
115 | + * DBGBCR<n>_EL1, Debug Breakpoint Control Registers | ||
116 | + * | ||
117 | + * 31 24 23 20 19 16 15 14 13 12 9 8 5 4 3 2 1 0 | ||
118 | + * +------+------+-------+-----+----+------+-----+------+-----+---+ | ||
119 | + * | RES0 | BT | LBN | SSC | HMC| RES0 | BAS | RES0 | PMC | E | | ||
120 | + * +------+------+-------+-----+----+------+-----+------+-----+---+ | ||
121 | + * | ||
122 | + * BT: Breakpoint type (0 = unlinked address match) | ||
123 | + * LBN: Linked BP number (0 = unused) | ||
124 | + * SSC/HMC/PMC: Security, Higher and Priv access control (Table D-12) | ||
125 | + * BAS: Byte Address Select (RES1 for AArch64) | ||
126 | + * E: Enable bit | ||
127 | + * | ||
128 | + * DBGBVR<n>_EL1, Debug Breakpoint Value Registers | ||
129 | + * | ||
130 | + * 63 53 52 49 48 2 1 0 | ||
131 | + * +------+-----------+----------+-----+ | ||
132 | + * | RESS | VA[52:49] | VA[48:2] | 0 0 | | ||
133 | + * +------+-----------+----------+-----+ | ||
134 | + * | ||
135 | + * Depending on the addressing mode bits the top bits of the register | ||
136 | + * are a sign extension of the highest applicable VA bit. Some | ||
137 | + * versions of GDB don't do it correctly so we ensure they are correct | ||
138 | + * here so future PC comparisons will work properly. | ||
139 | + */ | ||
140 | + | ||
141 | +int insert_hw_breakpoint(target_ulong addr) | ||
28 | +{ | 142 | +{ |
29 | + return sme_enabled_check_with_svcr(s, R_SVCR_SM_MASK); | 143 | + HWBreakpoint brk = { |
144 | + .bcr = 0x1, /* BCR E=1, enable */ | ||
145 | + .bvr = sextract64(addr, 0, 53) | ||
146 | + }; | ||
147 | + | ||
148 | + if (cur_hw_bps >= max_hw_bps) { | ||
149 | + return -ENOBUFS; | ||
150 | + } | ||
151 | + | ||
152 | + brk.bcr = deposit32(brk.bcr, 1, 2, 0x3); /* PMC = 11 */ | ||
153 | + brk.bcr = deposit32(brk.bcr, 5, 4, 0xf); /* BAS = RES1 */ | ||
154 | + | ||
155 | + g_array_append_val(hw_breakpoints, brk); | ||
156 | + | ||
157 | + return 0; | ||
30 | +} | 158 | +} |
31 | + | 159 | + |
32 | +/* This function corresponds to CheckSMEAndZAEnabled. */ | 160 | +/** |
33 | +static inline bool sme_za_enabled_check(DisasContext *s) | 161 | + * delete_hw_breakpoint() |
162 | + * @pc: address of breakpoint | ||
163 | + * | ||
164 | + * Delete a breakpoint and shuffle any above down | ||
165 | + */ | ||
166 | + | ||
167 | +int delete_hw_breakpoint(target_ulong pc) | ||
34 | +{ | 168 | +{ |
35 | + return sme_enabled_check_with_svcr(s, R_SVCR_ZA_MASK); | 169 | + int i; |
170 | + for (i = 0; i < hw_breakpoints->len; i++) { | ||
171 | + HWBreakpoint *brk = get_hw_bp(i); | ||
172 | + if (brk->bvr == pc) { | ||
173 | + g_array_remove_index(hw_breakpoints, i); | ||
174 | + return 0; | ||
175 | + } | ||
176 | + } | ||
177 | + return -ENOENT; | ||
36 | +} | 178 | +} |
37 | + | 179 | + |
38 | +/* Note that this function corresponds to CheckStreamingSVEAndZAEnabled. */ | 180 | +/** |
39 | +static inline bool sme_smza_enabled_check(DisasContext *s) | 181 | + * insert_hw_watchpoint() |
182 | + * @addr: address of watch point | ||
183 | + * @len: size of area | ||
184 | + * @type: type of watch point | ||
185 | + * | ||
186 | + * See ARM ARM D2.10. As with the breakpoints we can do some advanced | ||
187 | + * stuff if we want to. The watch points can be linked with the break | ||
188 | + * points above to make them context aware. However for simplicity | ||
189 | + * currently we only deal with simple read/write watch points. | ||
190 | + * | ||
191 | + * D7.3.11 DBGWCR<n>_EL1, Debug Watchpoint Control Registers | ||
192 | + * | ||
193 | + * 31 29 28 24 23 21 20 19 16 15 14 13 12 5 4 3 2 1 0 | ||
194 | + * +------+-------+------+----+-----+-----+-----+-----+-----+-----+---+ | ||
195 | + * | RES0 | MASK | RES0 | WT | LBN | SSC | HMC | BAS | LSC | PAC | E | | ||
196 | + * +------+-------+------+----+-----+-----+-----+-----+-----+-----+---+ | ||
197 | + * | ||
198 | + * MASK: num bits addr mask (0=none,01/10=res,11=3 bits (8 bytes)) | ||
199 | + * WT: 0 - unlinked, 1 - linked (not currently used) | ||
200 | + * LBN: Linked BP number (not currently used) | ||
201 | + * SSC/HMC/PAC: Security, Higher and Priv access control (Table D2-11) | ||
202 | + * BAS: Byte Address Select | ||
203 | + * LSC: Load/Store control (01: load, 10: store, 11: both) | ||
204 | + * E: Enable | ||
205 | + * | ||
206 | + * The bottom 2 bits of the value register are masked. Therefore to | ||
207 | + * break on any sizes smaller than an unaligned word you need to set | ||
208 | + * MASK=0, BAS=bit per byte in question. For larger regions (^2) you | ||
209 | + * need to ensure you mask the address as required and set BAS=0xff | ||
210 | + */ | ||
211 | + | ||
212 | +int insert_hw_watchpoint(target_ulong addr, target_ulong len, int type) | ||
40 | +{ | 213 | +{ |
41 | + return sme_enabled_check_with_svcr(s, R_SVCR_SM_MASK | R_SVCR_ZA_MASK); | 214 | + HWWatchpoint wp = { |
215 | + .wcr = R_DBGWCR_E_MASK, /* E=1, enable */ | ||
216 | + .wvr = addr & (~0x7ULL), | ||
217 | + .details = { .vaddr = addr, .len = len } | ||
218 | + }; | ||
219 | + | ||
220 | + if (cur_hw_wps >= max_hw_wps) { | ||
221 | + return -ENOBUFS; | ||
222 | + } | ||
223 | + | ||
224 | + /* | ||
225 | + * HMC=0 SSC=0 PAC=3 will hit EL0 or EL1, any security state, | ||
226 | + * valid whether EL3 is implemented or not | ||
227 | + */ | ||
228 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, PAC, 3); | ||
229 | + | ||
230 | + switch (type) { | ||
231 | + case GDB_WATCHPOINT_READ: | ||
232 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 1); | ||
233 | + wp.details.flags = BP_MEM_READ; | ||
234 | + break; | ||
235 | + case GDB_WATCHPOINT_WRITE: | ||
236 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 2); | ||
237 | + wp.details.flags = BP_MEM_WRITE; | ||
238 | + break; | ||
239 | + case GDB_WATCHPOINT_ACCESS: | ||
240 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 3); | ||
241 | + wp.details.flags = BP_MEM_ACCESS; | ||
242 | + break; | ||
243 | + default: | ||
244 | + g_assert_not_reached(); | ||
245 | + break; | ||
246 | + } | ||
247 | + if (len <= 8) { | ||
248 | + /* we align the address and set the bits in BAS */ | ||
249 | + int off = addr & 0x7; | ||
250 | + int bas = (1 << len) - 1; | ||
251 | + | ||
252 | + wp.wcr = deposit32(wp.wcr, 5 + off, 8 - off, bas); | ||
253 | + } else { | ||
254 | + /* For ranges above 8 bytes we need to be a power of 2 */ | ||
255 | + if (is_power_of_2(len)) { | ||
256 | + int bits = ctz64(len); | ||
257 | + | ||
258 | + wp.wvr &= ~((1 << bits) - 1); | ||
259 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, MASK, bits); | ||
260 | + wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, BAS, 0xff); | ||
261 | + } else { | ||
262 | + return -ENOBUFS; | ||
263 | + } | ||
264 | + } | ||
265 | + | ||
266 | + g_array_append_val(hw_watchpoints, wp); | ||
267 | + return 0; | ||
42 | +} | 268 | +} |
43 | + | 269 | + |
44 | TCGv_i64 clean_data_tbi(DisasContext *s, TCGv_i64 addr); | 270 | +bool check_watchpoint_in_range(int i, target_ulong addr) |
45 | TCGv_i64 gen_mte_check1(DisasContext *s, TCGv_i64 addr, bool is_write, | 271 | +{ |
46 | bool tag_checked, int log2_size); | 272 | + HWWatchpoint *wp = get_hw_wp(i); |
47 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 273 | + uint64_t addr_top, addr_bottom = wp->wvr; |
274 | + int bas = extract32(wp->wcr, 5, 8); | ||
275 | + int mask = extract32(wp->wcr, 24, 4); | ||
276 | + | ||
277 | + if (mask) { | ||
278 | + addr_top = addr_bottom + (1 << mask); | ||
279 | + } else { | ||
280 | + /* | ||
281 | + * BAS must be contiguous but can offset against the base | ||
282 | + * address in DBGWVR | ||
283 | + */ | ||
284 | + addr_bottom = addr_bottom + ctz32(bas); | ||
285 | + addr_top = addr_bottom + clo32(bas); | ||
286 | + } | ||
287 | + | ||
288 | + if (addr >= addr_bottom && addr <= addr_top) { | ||
289 | + return true; | ||
290 | + } | ||
291 | + | ||
292 | + return false; | ||
293 | +} | ||
294 | + | ||
295 | +/** | ||
296 | + * delete_hw_watchpoint() | ||
297 | + * @addr: address of breakpoint | ||
298 | + * | ||
299 | + * Delete a breakpoint and shuffle any above down | ||
300 | + */ | ||
301 | + | ||
302 | +int delete_hw_watchpoint(target_ulong addr, target_ulong len, int type) | ||
303 | +{ | ||
304 | + int i; | ||
305 | + for (i = 0; i < cur_hw_wps; i++) { | ||
306 | + if (check_watchpoint_in_range(i, addr)) { | ||
307 | + g_array_remove_index(hw_watchpoints, i); | ||
308 | + return 0; | ||
309 | + } | ||
310 | + } | ||
311 | + return -ENOENT; | ||
312 | +} | ||
313 | + | ||
314 | +bool find_hw_breakpoint(CPUState *cpu, target_ulong pc) | ||
315 | +{ | ||
316 | + int i; | ||
317 | + | ||
318 | + for (i = 0; i < cur_hw_bps; i++) { | ||
319 | + HWBreakpoint *bp = get_hw_bp(i); | ||
320 | + if (bp->bvr == pc) { | ||
321 | + return true; | ||
322 | + } | ||
323 | + } | ||
324 | + return false; | ||
325 | +} | ||
326 | + | ||
327 | +CPUWatchpoint *find_hw_watchpoint(CPUState *cpu, target_ulong addr) | ||
328 | +{ | ||
329 | + int i; | ||
330 | + | ||
331 | + for (i = 0; i < cur_hw_wps; i++) { | ||
332 | + if (check_watchpoint_in_range(i, addr)) { | ||
333 | + return &get_hw_wp(i)->details; | ||
334 | + } | ||
335 | + } | ||
336 | + return NULL; | ||
337 | +} | ||
338 | diff --git a/target/arm/kvm64.c b/target/arm/kvm64.c | ||
48 | index XXXXXXX..XXXXXXX 100644 | 339 | index XXXXXXX..XXXXXXX 100644 |
49 | --- a/target/arm/translate-a64.c | 340 | --- a/target/arm/kvm64.c |
50 | +++ b/target/arm/translate-a64.c | 341 | +++ b/target/arm/kvm64.c |
51 | @@ -XXX,XX +XXX,XX @@ static bool sme_access_check(DisasContext *s) | 342 | @@ -XXX,XX +XXX,XX @@ |
52 | return true; | 343 | |
344 | static bool have_guest_debug; | ||
345 | |||
346 | -/* | ||
347 | - * Although the ARM implementation of hardware assisted debugging | ||
348 | - * allows for different breakpoints per-core, the current GDB | ||
349 | - * interface treats them as a global pool of registers (which seems to | ||
350 | - * be the case for x86, ppc and s390). As a result we store one copy | ||
351 | - * of registers which is used for all active cores. | ||
352 | - * | ||
353 | - * Write access is serialised by virtue of the GDB protocol which | ||
354 | - * updates things. Read access (i.e. when the values are copied to the | ||
355 | - * vCPU) is also gated by GDB's run control. | ||
356 | - * | ||
357 | - * This is not unreasonable as most of the time debugging kernels you | ||
358 | - * never know which core will eventually execute your function. | ||
359 | - */ | ||
360 | - | ||
361 | -typedef struct { | ||
362 | - uint64_t bcr; | ||
363 | - uint64_t bvr; | ||
364 | -} HWBreakpoint; | ||
365 | - | ||
366 | -/* The watchpoint registers can cover more area than the requested | ||
367 | - * watchpoint so we need to store the additional information | ||
368 | - * somewhere. We also need to supply a CPUWatchpoint to the GDB stub | ||
369 | - * when the watchpoint is hit. | ||
370 | - */ | ||
371 | -typedef struct { | ||
372 | - uint64_t wcr; | ||
373 | - uint64_t wvr; | ||
374 | - CPUWatchpoint details; | ||
375 | -} HWWatchpoint; | ||
376 | - | ||
377 | -/* Maximum and current break/watch point counts */ | ||
378 | -int max_hw_bps, max_hw_wps; | ||
379 | -GArray *hw_breakpoints, *hw_watchpoints; | ||
380 | - | ||
381 | -#define cur_hw_wps (hw_watchpoints->len) | ||
382 | -#define cur_hw_bps (hw_breakpoints->len) | ||
383 | -#define get_hw_bp(i) (&g_array_index(hw_breakpoints, HWBreakpoint, i)) | ||
384 | -#define get_hw_wp(i) (&g_array_index(hw_watchpoints, HWWatchpoint, i)) | ||
385 | - | ||
386 | void kvm_arm_init_debug(KVMState *s) | ||
387 | { | ||
388 | have_guest_debug = kvm_check_extension(s, | ||
389 | @@ -XXX,XX +XXX,XX @@ void kvm_arm_init_debug(KVMState *s) | ||
390 | return; | ||
53 | } | 391 | } |
54 | 392 | ||
55 | +/* This function corresponds to CheckSMEEnabled. */ | 393 | -/** |
56 | +bool sme_enabled_check(DisasContext *s) | 394 | - * insert_hw_breakpoint() |
57 | +{ | 395 | - * @addr: address of breakpoint |
58 | + /* | 396 | - * |
59 | + * Note that unlike sve_excp_el, we have not constrained sme_excp_el | 397 | - * See ARM ARM D2.9.1 for details but here we are only going to create |
60 | + * to be zero when fp_excp_el has priority. This is because we need | 398 | - * simple un-linked breakpoints (i.e. we don't chain breakpoints |
61 | + * sme_excp_el by itself for cpregs access checks. | 399 | - * together to match address and context or vmid). The hardware is |
62 | + */ | 400 | - * capable of fancier matching but that will require exposing that |
63 | + if (!s->fp_excp_el || s->sme_excp_el < s->fp_excp_el) { | 401 | - * fanciness to GDB's interface |
64 | + s->fp_access_checked = true; | 402 | - * |
65 | + return sme_access_check(s); | 403 | - * DBGBCR<n>_EL1, Debug Breakpoint Control Registers |
66 | + } | 404 | - * |
67 | + return fp_access_check_only(s); | 405 | - * 31 24 23 20 19 16 15 14 13 12 9 8 5 4 3 2 1 0 |
68 | +} | 406 | - * +------+------+-------+-----+----+------+-----+------+-----+---+ |
69 | + | 407 | - * | RES0 | BT | LBN | SSC | HMC| RES0 | BAS | RES0 | PMC | E | |
70 | +/* Common subroutine for CheckSMEAnd*Enabled. */ | 408 | - * +------+------+-------+-----+----+------+-----+------+-----+---+ |
71 | +bool sme_enabled_check_with_svcr(DisasContext *s, unsigned req) | 409 | - * |
72 | +{ | 410 | - * BT: Breakpoint type (0 = unlinked address match) |
73 | + if (!sme_enabled_check(s)) { | 411 | - * LBN: Linked BP number (0 = unused) |
74 | + return false; | 412 | - * SSC/HMC/PMC: Security, Higher and Priv access control (Table D-12) |
75 | + } | 413 | - * BAS: Byte Address Select (RES1 for AArch64) |
76 | + if (FIELD_EX64(req, SVCR, SM) && !s->pstate_sm) { | 414 | - * E: Enable bit |
77 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | 415 | - * |
78 | + syn_smetrap(SME_ET_NotStreaming, false)); | 416 | - * DBGBVR<n>_EL1, Debug Breakpoint Value Registers |
79 | + return false; | 417 | - * |
80 | + } | 418 | - * 63 53 52 49 48 2 1 0 |
81 | + if (FIELD_EX64(req, SVCR, ZA) && !s->pstate_za) { | 419 | - * +------+-----------+----------+-----+ |
82 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | 420 | - * | RESS | VA[52:49] | VA[48:2] | 0 0 | |
83 | + syn_smetrap(SME_ET_InactiveZA, false)); | 421 | - * +------+-----------+----------+-----+ |
84 | + return false; | 422 | - * |
85 | + } | 423 | - * Depending on the addressing mode bits the top bits of the register |
86 | + return true; | 424 | - * are a sign extension of the highest applicable VA bit. Some |
87 | +} | 425 | - * versions of GDB don't do it correctly so we ensure they are correct |
88 | + | 426 | - * here so future PC comparisons will work properly. |
89 | /* | 427 | - */ |
90 | * This utility function is for doing register extension with an | 428 | - |
91 | * optional shift. You will likely want to pass a temporary for the | 429 | -static int insert_hw_breakpoint(target_ulong addr) |
430 | -{ | ||
431 | - HWBreakpoint brk = { | ||
432 | - .bcr = 0x1, /* BCR E=1, enable */ | ||
433 | - .bvr = sextract64(addr, 0, 53) | ||
434 | - }; | ||
435 | - | ||
436 | - if (cur_hw_bps >= max_hw_bps) { | ||
437 | - return -ENOBUFS; | ||
438 | - } | ||
439 | - | ||
440 | - brk.bcr = deposit32(brk.bcr, 1, 2, 0x3); /* PMC = 11 */ | ||
441 | - brk.bcr = deposit32(brk.bcr, 5, 4, 0xf); /* BAS = RES1 */ | ||
442 | - | ||
443 | - g_array_append_val(hw_breakpoints, brk); | ||
444 | - | ||
445 | - return 0; | ||
446 | -} | ||
447 | - | ||
448 | -/** | ||
449 | - * delete_hw_breakpoint() | ||
450 | - * @pc: address of breakpoint | ||
451 | - * | ||
452 | - * Delete a breakpoint and shuffle any above down | ||
453 | - */ | ||
454 | - | ||
455 | -static int delete_hw_breakpoint(target_ulong pc) | ||
456 | -{ | ||
457 | - int i; | ||
458 | - for (i = 0; i < hw_breakpoints->len; i++) { | ||
459 | - HWBreakpoint *brk = get_hw_bp(i); | ||
460 | - if (brk->bvr == pc) { | ||
461 | - g_array_remove_index(hw_breakpoints, i); | ||
462 | - return 0; | ||
463 | - } | ||
464 | - } | ||
465 | - return -ENOENT; | ||
466 | -} | ||
467 | - | ||
468 | -/** | ||
469 | - * insert_hw_watchpoint() | ||
470 | - * @addr: address of watch point | ||
471 | - * @len: size of area | ||
472 | - * @type: type of watch point | ||
473 | - * | ||
474 | - * See ARM ARM D2.10. As with the breakpoints we can do some advanced | ||
475 | - * stuff if we want to. The watch points can be linked with the break | ||
476 | - * points above to make them context aware. However for simplicity | ||
477 | - * currently we only deal with simple read/write watch points. | ||
478 | - * | ||
479 | - * D7.3.11 DBGWCR<n>_EL1, Debug Watchpoint Control Registers | ||
480 | - * | ||
481 | - * 31 29 28 24 23 21 20 19 16 15 14 13 12 5 4 3 2 1 0 | ||
482 | - * +------+-------+------+----+-----+-----+-----+-----+-----+-----+---+ | ||
483 | - * | RES0 | MASK | RES0 | WT | LBN | SSC | HMC | BAS | LSC | PAC | E | | ||
484 | - * +------+-------+------+----+-----+-----+-----+-----+-----+-----+---+ | ||
485 | - * | ||
486 | - * MASK: num bits addr mask (0=none,01/10=res,11=3 bits (8 bytes)) | ||
487 | - * WT: 0 - unlinked, 1 - linked (not currently used) | ||
488 | - * LBN: Linked BP number (not currently used) | ||
489 | - * SSC/HMC/PAC: Security, Higher and Priv access control (Table D2-11) | ||
490 | - * BAS: Byte Address Select | ||
491 | - * LSC: Load/Store control (01: load, 10: store, 11: both) | ||
492 | - * E: Enable | ||
493 | - * | ||
494 | - * The bottom 2 bits of the value register are masked. Therefore to | ||
495 | - * break on any sizes smaller than an unaligned word you need to set | ||
496 | - * MASK=0, BAS=bit per byte in question. For larger regions (^2) you | ||
497 | - * need to ensure you mask the address as required and set BAS=0xff | ||
498 | - */ | ||
499 | - | ||
500 | -static int insert_hw_watchpoint(target_ulong addr, | ||
501 | - target_ulong len, int type) | ||
502 | -{ | ||
503 | - HWWatchpoint wp = { | ||
504 | - .wcr = R_DBGWCR_E_MASK, /* E=1, enable */ | ||
505 | - .wvr = addr & (~0x7ULL), | ||
506 | - .details = { .vaddr = addr, .len = len } | ||
507 | - }; | ||
508 | - | ||
509 | - if (cur_hw_wps >= max_hw_wps) { | ||
510 | - return -ENOBUFS; | ||
511 | - } | ||
512 | - | ||
513 | - /* | ||
514 | - * HMC=0 SSC=0 PAC=3 will hit EL0 or EL1, any security state, | ||
515 | - * valid whether EL3 is implemented or not | ||
516 | - */ | ||
517 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, PAC, 3); | ||
518 | - | ||
519 | - switch (type) { | ||
520 | - case GDB_WATCHPOINT_READ: | ||
521 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 1); | ||
522 | - wp.details.flags = BP_MEM_READ; | ||
523 | - break; | ||
524 | - case GDB_WATCHPOINT_WRITE: | ||
525 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 2); | ||
526 | - wp.details.flags = BP_MEM_WRITE; | ||
527 | - break; | ||
528 | - case GDB_WATCHPOINT_ACCESS: | ||
529 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, LSC, 3); | ||
530 | - wp.details.flags = BP_MEM_ACCESS; | ||
531 | - break; | ||
532 | - default: | ||
533 | - g_assert_not_reached(); | ||
534 | - break; | ||
535 | - } | ||
536 | - if (len <= 8) { | ||
537 | - /* we align the address and set the bits in BAS */ | ||
538 | - int off = addr & 0x7; | ||
539 | - int bas = (1 << len) - 1; | ||
540 | - | ||
541 | - wp.wcr = deposit32(wp.wcr, 5 + off, 8 - off, bas); | ||
542 | - } else { | ||
543 | - /* For ranges above 8 bytes we need to be a power of 2 */ | ||
544 | - if (is_power_of_2(len)) { | ||
545 | - int bits = ctz64(len); | ||
546 | - | ||
547 | - wp.wvr &= ~((1 << bits) - 1); | ||
548 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, MASK, bits); | ||
549 | - wp.wcr = FIELD_DP64(wp.wcr, DBGWCR, BAS, 0xff); | ||
550 | - } else { | ||
551 | - return -ENOBUFS; | ||
552 | - } | ||
553 | - } | ||
554 | - | ||
555 | - g_array_append_val(hw_watchpoints, wp); | ||
556 | - return 0; | ||
557 | -} | ||
558 | - | ||
559 | - | ||
560 | -static bool check_watchpoint_in_range(int i, target_ulong addr) | ||
561 | -{ | ||
562 | - HWWatchpoint *wp = get_hw_wp(i); | ||
563 | - uint64_t addr_top, addr_bottom = wp->wvr; | ||
564 | - int bas = extract32(wp->wcr, 5, 8); | ||
565 | - int mask = extract32(wp->wcr, 24, 4); | ||
566 | - | ||
567 | - if (mask) { | ||
568 | - addr_top = addr_bottom + (1 << mask); | ||
569 | - } else { | ||
570 | - /* BAS must be contiguous but can offset against the base | ||
571 | - * address in DBGWVR */ | ||
572 | - addr_bottom = addr_bottom + ctz32(bas); | ||
573 | - addr_top = addr_bottom + clo32(bas); | ||
574 | - } | ||
575 | - | ||
576 | - if (addr >= addr_bottom && addr <= addr_top) { | ||
577 | - return true; | ||
578 | - } | ||
579 | - | ||
580 | - return false; | ||
581 | -} | ||
582 | - | ||
583 | -/** | ||
584 | - * delete_hw_watchpoint() | ||
585 | - * @addr: address of breakpoint | ||
586 | - * | ||
587 | - * Delete a breakpoint and shuffle any above down | ||
588 | - */ | ||
589 | - | ||
590 | -static int delete_hw_watchpoint(target_ulong addr, | ||
591 | - target_ulong len, int type) | ||
592 | -{ | ||
593 | - int i; | ||
594 | - for (i = 0; i < cur_hw_wps; i++) { | ||
595 | - if (check_watchpoint_in_range(i, addr)) { | ||
596 | - g_array_remove_index(hw_watchpoints, i); | ||
597 | - return 0; | ||
598 | - } | ||
599 | - } | ||
600 | - return -ENOENT; | ||
601 | -} | ||
602 | - | ||
603 | - | ||
604 | int kvm_arch_insert_hw_breakpoint(target_ulong addr, | ||
605 | target_ulong len, int type) | ||
606 | { | ||
607 | @@ -XXX,XX +XXX,XX @@ bool kvm_arm_hw_debug_active(CPUState *cs) | ||
608 | return ((cur_hw_wps > 0) || (cur_hw_bps > 0)); | ||
609 | } | ||
610 | |||
611 | -static bool find_hw_breakpoint(CPUState *cpu, target_ulong pc) | ||
612 | -{ | ||
613 | - int i; | ||
614 | - | ||
615 | - for (i = 0; i < cur_hw_bps; i++) { | ||
616 | - HWBreakpoint *bp = get_hw_bp(i); | ||
617 | - if (bp->bvr == pc) { | ||
618 | - return true; | ||
619 | - } | ||
620 | - } | ||
621 | - return false; | ||
622 | -} | ||
623 | - | ||
624 | -static CPUWatchpoint *find_hw_watchpoint(CPUState *cpu, target_ulong addr) | ||
625 | -{ | ||
626 | - int i; | ||
627 | - | ||
628 | - for (i = 0; i < cur_hw_wps; i++) { | ||
629 | - if (check_watchpoint_in_range(i, addr)) { | ||
630 | - return &get_hw_wp(i)->details; | ||
631 | - } | ||
632 | - } | ||
633 | - return NULL; | ||
634 | -} | ||
635 | - | ||
636 | static bool kvm_arm_set_device_attr(CPUState *cs, struct kvm_device_attr *attr, | ||
637 | const char *name) | ||
638 | { | ||
639 | diff --git a/target/arm/meson.build b/target/arm/meson.build | ||
640 | index XXXXXXX..XXXXXXX 100644 | ||
641 | --- a/target/arm/meson.build | ||
642 | +++ b/target/arm/meson.build | ||
643 | @@ -XXX,XX +XXX,XX @@ arm_ss.add(files( | ||
644 | )) | ||
645 | arm_ss.add(zlib) | ||
646 | |||
647 | -arm_ss.add(when: 'CONFIG_KVM', if_true: files('kvm.c', 'kvm64.c'), if_false: files('kvm-stub.c')) | ||
648 | +arm_ss.add(when: 'CONFIG_KVM', if_true: files('hyp_gdbstub.c', 'kvm.c', 'kvm64.c'), if_false: files('kvm-stub.c')) | ||
649 | +arm_ss.add(when: 'CONFIG_HVF', if_true: files('hyp_gdbstub.c')) | ||
650 | |||
651 | arm_ss.add(when: 'TARGET_AARCH64', if_true: files( | ||
652 | 'cpu64.c', | ||
92 | -- | 653 | -- |
93 | 2.25.1 | 654 | 2.34.1 |
655 | |||
656 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Francesco Cagnin <fcagnin@quarkslab.com> |
---|---|---|---|
2 | 2 | ||
3 | Required for guest debugging. | ||
4 | |||
5 | Signed-off-by: Francesco Cagnin <fcagnin@quarkslab.com> | ||
6 | Message-id: 20230601153107.81955-3-fcagnin@quarkslab.com | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20220708151540.18136-46-richard.henderson@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 9 | --- |
8 | linux-user/elfload.c | 20 ++++++++++++++++++++ | 10 | target/arm/hvf/hvf.c | 213 +++++++++++++++++++++++++++++++++++++++++++ |
9 | 1 file changed, 20 insertions(+) | 11 | 1 file changed, 213 insertions(+) |
10 | 12 | ||
11 | diff --git a/linux-user/elfload.c b/linux-user/elfload.c | 13 | diff --git a/target/arm/hvf/hvf.c b/target/arm/hvf/hvf.c |
12 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/linux-user/elfload.c | 15 | --- a/target/arm/hvf/hvf.c |
14 | +++ b/linux-user/elfload.c | 16 | +++ b/target/arm/hvf/hvf.c |
15 | @@ -XXX,XX +XXX,XX @@ enum { | 17 | @@ -XXX,XX +XXX,XX @@ |
16 | ARM_HWCAP2_A64_RNG = 1 << 16, | 18 | #define SYSREG_ICC_SGI1R_EL1 SYSREG(3, 0, 12, 11, 5) |
17 | ARM_HWCAP2_A64_BTI = 1 << 17, | 19 | #define SYSREG_ICC_SRE_EL1 SYSREG(3, 0, 12, 12, 5) |
18 | ARM_HWCAP2_A64_MTE = 1 << 18, | 20 | |
19 | + ARM_HWCAP2_A64_ECV = 1 << 19, | 21 | +#define SYSREG_MDSCR_EL1 SYSREG(2, 0, 0, 2, 2) |
20 | + ARM_HWCAP2_A64_AFP = 1 << 20, | 22 | +#define SYSREG_DBGBVR0_EL1 SYSREG(2, 0, 0, 0, 4) |
21 | + ARM_HWCAP2_A64_RPRES = 1 << 21, | 23 | +#define SYSREG_DBGBCR0_EL1 SYSREG(2, 0, 0, 0, 5) |
22 | + ARM_HWCAP2_A64_MTE3 = 1 << 22, | 24 | +#define SYSREG_DBGWVR0_EL1 SYSREG(2, 0, 0, 0, 6) |
23 | + ARM_HWCAP2_A64_SME = 1 << 23, | 25 | +#define SYSREG_DBGWCR0_EL1 SYSREG(2, 0, 0, 0, 7) |
24 | + ARM_HWCAP2_A64_SME_I16I64 = 1 << 24, | 26 | +#define SYSREG_DBGBVR1_EL1 SYSREG(2, 0, 0, 1, 4) |
25 | + ARM_HWCAP2_A64_SME_F64F64 = 1 << 25, | 27 | +#define SYSREG_DBGBCR1_EL1 SYSREG(2, 0, 0, 1, 5) |
26 | + ARM_HWCAP2_A64_SME_I8I32 = 1 << 26, | 28 | +#define SYSREG_DBGWVR1_EL1 SYSREG(2, 0, 0, 1, 6) |
27 | + ARM_HWCAP2_A64_SME_F16F32 = 1 << 27, | 29 | +#define SYSREG_DBGWCR1_EL1 SYSREG(2, 0, 0, 1, 7) |
28 | + ARM_HWCAP2_A64_SME_B16F32 = 1 << 28, | 30 | +#define SYSREG_DBGBVR2_EL1 SYSREG(2, 0, 0, 2, 4) |
29 | + ARM_HWCAP2_A64_SME_F32F32 = 1 << 29, | 31 | +#define SYSREG_DBGBCR2_EL1 SYSREG(2, 0, 0, 2, 5) |
30 | + ARM_HWCAP2_A64_SME_FA64 = 1 << 30, | 32 | +#define SYSREG_DBGWVR2_EL1 SYSREG(2, 0, 0, 2, 6) |
31 | }; | 33 | +#define SYSREG_DBGWCR2_EL1 SYSREG(2, 0, 0, 2, 7) |
32 | 34 | +#define SYSREG_DBGBVR3_EL1 SYSREG(2, 0, 0, 3, 4) | |
33 | #define ELF_HWCAP get_elf_hwcap() | 35 | +#define SYSREG_DBGBCR3_EL1 SYSREG(2, 0, 0, 3, 5) |
34 | @@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap2(void) | 36 | +#define SYSREG_DBGWVR3_EL1 SYSREG(2, 0, 0, 3, 6) |
35 | GET_FEATURE_ID(aa64_rndr, ARM_HWCAP2_A64_RNG); | 37 | +#define SYSREG_DBGWCR3_EL1 SYSREG(2, 0, 0, 3, 7) |
36 | GET_FEATURE_ID(aa64_bti, ARM_HWCAP2_A64_BTI); | 38 | +#define SYSREG_DBGBVR4_EL1 SYSREG(2, 0, 0, 4, 4) |
37 | GET_FEATURE_ID(aa64_mte, ARM_HWCAP2_A64_MTE); | 39 | +#define SYSREG_DBGBCR4_EL1 SYSREG(2, 0, 0, 4, 5) |
38 | + GET_FEATURE_ID(aa64_sme, (ARM_HWCAP2_A64_SME | | 40 | +#define SYSREG_DBGWVR4_EL1 SYSREG(2, 0, 0, 4, 6) |
39 | + ARM_HWCAP2_A64_SME_F32F32 | | 41 | +#define SYSREG_DBGWCR4_EL1 SYSREG(2, 0, 0, 4, 7) |
40 | + ARM_HWCAP2_A64_SME_B16F32 | | 42 | +#define SYSREG_DBGBVR5_EL1 SYSREG(2, 0, 0, 5, 4) |
41 | + ARM_HWCAP2_A64_SME_F16F32 | | 43 | +#define SYSREG_DBGBCR5_EL1 SYSREG(2, 0, 0, 5, 5) |
42 | + ARM_HWCAP2_A64_SME_I8I32)); | 44 | +#define SYSREG_DBGWVR5_EL1 SYSREG(2, 0, 0, 5, 6) |
43 | + GET_FEATURE_ID(aa64_sme_f64f64, ARM_HWCAP2_A64_SME_F64F64); | 45 | +#define SYSREG_DBGWCR5_EL1 SYSREG(2, 0, 0, 5, 7) |
44 | + GET_FEATURE_ID(aa64_sme_i16i64, ARM_HWCAP2_A64_SME_I16I64); | 46 | +#define SYSREG_DBGBVR6_EL1 SYSREG(2, 0, 0, 6, 4) |
45 | + GET_FEATURE_ID(aa64_sme_fa64, ARM_HWCAP2_A64_SME_FA64); | 47 | +#define SYSREG_DBGBCR6_EL1 SYSREG(2, 0, 0, 6, 5) |
46 | 48 | +#define SYSREG_DBGWVR6_EL1 SYSREG(2, 0, 0, 6, 6) | |
47 | return hwcaps; | 49 | +#define SYSREG_DBGWCR6_EL1 SYSREG(2, 0, 0, 6, 7) |
48 | } | 50 | +#define SYSREG_DBGBVR7_EL1 SYSREG(2, 0, 0, 7, 4) |
51 | +#define SYSREG_DBGBCR7_EL1 SYSREG(2, 0, 0, 7, 5) | ||
52 | +#define SYSREG_DBGWVR7_EL1 SYSREG(2, 0, 0, 7, 6) | ||
53 | +#define SYSREG_DBGWCR7_EL1 SYSREG(2, 0, 0, 7, 7) | ||
54 | +#define SYSREG_DBGBVR8_EL1 SYSREG(2, 0, 0, 8, 4) | ||
55 | +#define SYSREG_DBGBCR8_EL1 SYSREG(2, 0, 0, 8, 5) | ||
56 | +#define SYSREG_DBGWVR8_EL1 SYSREG(2, 0, 0, 8, 6) | ||
57 | +#define SYSREG_DBGWCR8_EL1 SYSREG(2, 0, 0, 8, 7) | ||
58 | +#define SYSREG_DBGBVR9_EL1 SYSREG(2, 0, 0, 9, 4) | ||
59 | +#define SYSREG_DBGBCR9_EL1 SYSREG(2, 0, 0, 9, 5) | ||
60 | +#define SYSREG_DBGWVR9_EL1 SYSREG(2, 0, 0, 9, 6) | ||
61 | +#define SYSREG_DBGWCR9_EL1 SYSREG(2, 0, 0, 9, 7) | ||
62 | +#define SYSREG_DBGBVR10_EL1 SYSREG(2, 0, 0, 10, 4) | ||
63 | +#define SYSREG_DBGBCR10_EL1 SYSREG(2, 0, 0, 10, 5) | ||
64 | +#define SYSREG_DBGWVR10_EL1 SYSREG(2, 0, 0, 10, 6) | ||
65 | +#define SYSREG_DBGWCR10_EL1 SYSREG(2, 0, 0, 10, 7) | ||
66 | +#define SYSREG_DBGBVR11_EL1 SYSREG(2, 0, 0, 11, 4) | ||
67 | +#define SYSREG_DBGBCR11_EL1 SYSREG(2, 0, 0, 11, 5) | ||
68 | +#define SYSREG_DBGWVR11_EL1 SYSREG(2, 0, 0, 11, 6) | ||
69 | +#define SYSREG_DBGWCR11_EL1 SYSREG(2, 0, 0, 11, 7) | ||
70 | +#define SYSREG_DBGBVR12_EL1 SYSREG(2, 0, 0, 12, 4) | ||
71 | +#define SYSREG_DBGBCR12_EL1 SYSREG(2, 0, 0, 12, 5) | ||
72 | +#define SYSREG_DBGWVR12_EL1 SYSREG(2, 0, 0, 12, 6) | ||
73 | +#define SYSREG_DBGWCR12_EL1 SYSREG(2, 0, 0, 12, 7) | ||
74 | +#define SYSREG_DBGBVR13_EL1 SYSREG(2, 0, 0, 13, 4) | ||
75 | +#define SYSREG_DBGBCR13_EL1 SYSREG(2, 0, 0, 13, 5) | ||
76 | +#define SYSREG_DBGWVR13_EL1 SYSREG(2, 0, 0, 13, 6) | ||
77 | +#define SYSREG_DBGWCR13_EL1 SYSREG(2, 0, 0, 13, 7) | ||
78 | +#define SYSREG_DBGBVR14_EL1 SYSREG(2, 0, 0, 14, 4) | ||
79 | +#define SYSREG_DBGBCR14_EL1 SYSREG(2, 0, 0, 14, 5) | ||
80 | +#define SYSREG_DBGWVR14_EL1 SYSREG(2, 0, 0, 14, 6) | ||
81 | +#define SYSREG_DBGWCR14_EL1 SYSREG(2, 0, 0, 14, 7) | ||
82 | +#define SYSREG_DBGBVR15_EL1 SYSREG(2, 0, 0, 15, 4) | ||
83 | +#define SYSREG_DBGBCR15_EL1 SYSREG(2, 0, 0, 15, 5) | ||
84 | +#define SYSREG_DBGWVR15_EL1 SYSREG(2, 0, 0, 15, 6) | ||
85 | +#define SYSREG_DBGWCR15_EL1 SYSREG(2, 0, 0, 15, 7) | ||
86 | + | ||
87 | #define WFX_IS_WFE (1 << 0) | ||
88 | |||
89 | #define TMR_CTL_ENABLE (1 << 0) | ||
90 | @@ -XXX,XX +XXX,XX @@ static int hvf_sysreg_read(CPUState *cpu, uint32_t reg, uint32_t rt) | ||
91 | hvf_raise_exception(cpu, EXCP_UDEF, syn_uncategorized()); | ||
92 | } | ||
93 | break; | ||
94 | + case SYSREG_DBGBVR0_EL1: | ||
95 | + case SYSREG_DBGBVR1_EL1: | ||
96 | + case SYSREG_DBGBVR2_EL1: | ||
97 | + case SYSREG_DBGBVR3_EL1: | ||
98 | + case SYSREG_DBGBVR4_EL1: | ||
99 | + case SYSREG_DBGBVR5_EL1: | ||
100 | + case SYSREG_DBGBVR6_EL1: | ||
101 | + case SYSREG_DBGBVR7_EL1: | ||
102 | + case SYSREG_DBGBVR8_EL1: | ||
103 | + case SYSREG_DBGBVR9_EL1: | ||
104 | + case SYSREG_DBGBVR10_EL1: | ||
105 | + case SYSREG_DBGBVR11_EL1: | ||
106 | + case SYSREG_DBGBVR12_EL1: | ||
107 | + case SYSREG_DBGBVR13_EL1: | ||
108 | + case SYSREG_DBGBVR14_EL1: | ||
109 | + case SYSREG_DBGBVR15_EL1: | ||
110 | + val = env->cp15.dbgbvr[SYSREG_CRM(reg)]; | ||
111 | + break; | ||
112 | + case SYSREG_DBGBCR0_EL1: | ||
113 | + case SYSREG_DBGBCR1_EL1: | ||
114 | + case SYSREG_DBGBCR2_EL1: | ||
115 | + case SYSREG_DBGBCR3_EL1: | ||
116 | + case SYSREG_DBGBCR4_EL1: | ||
117 | + case SYSREG_DBGBCR5_EL1: | ||
118 | + case SYSREG_DBGBCR6_EL1: | ||
119 | + case SYSREG_DBGBCR7_EL1: | ||
120 | + case SYSREG_DBGBCR8_EL1: | ||
121 | + case SYSREG_DBGBCR9_EL1: | ||
122 | + case SYSREG_DBGBCR10_EL1: | ||
123 | + case SYSREG_DBGBCR11_EL1: | ||
124 | + case SYSREG_DBGBCR12_EL1: | ||
125 | + case SYSREG_DBGBCR13_EL1: | ||
126 | + case SYSREG_DBGBCR14_EL1: | ||
127 | + case SYSREG_DBGBCR15_EL1: | ||
128 | + val = env->cp15.dbgbcr[SYSREG_CRM(reg)]; | ||
129 | + break; | ||
130 | + case SYSREG_DBGWVR0_EL1: | ||
131 | + case SYSREG_DBGWVR1_EL1: | ||
132 | + case SYSREG_DBGWVR2_EL1: | ||
133 | + case SYSREG_DBGWVR3_EL1: | ||
134 | + case SYSREG_DBGWVR4_EL1: | ||
135 | + case SYSREG_DBGWVR5_EL1: | ||
136 | + case SYSREG_DBGWVR6_EL1: | ||
137 | + case SYSREG_DBGWVR7_EL1: | ||
138 | + case SYSREG_DBGWVR8_EL1: | ||
139 | + case SYSREG_DBGWVR9_EL1: | ||
140 | + case SYSREG_DBGWVR10_EL1: | ||
141 | + case SYSREG_DBGWVR11_EL1: | ||
142 | + case SYSREG_DBGWVR12_EL1: | ||
143 | + case SYSREG_DBGWVR13_EL1: | ||
144 | + case SYSREG_DBGWVR14_EL1: | ||
145 | + case SYSREG_DBGWVR15_EL1: | ||
146 | + val = env->cp15.dbgwvr[SYSREG_CRM(reg)]; | ||
147 | + break; | ||
148 | + case SYSREG_DBGWCR0_EL1: | ||
149 | + case SYSREG_DBGWCR1_EL1: | ||
150 | + case SYSREG_DBGWCR2_EL1: | ||
151 | + case SYSREG_DBGWCR3_EL1: | ||
152 | + case SYSREG_DBGWCR4_EL1: | ||
153 | + case SYSREG_DBGWCR5_EL1: | ||
154 | + case SYSREG_DBGWCR6_EL1: | ||
155 | + case SYSREG_DBGWCR7_EL1: | ||
156 | + case SYSREG_DBGWCR8_EL1: | ||
157 | + case SYSREG_DBGWCR9_EL1: | ||
158 | + case SYSREG_DBGWCR10_EL1: | ||
159 | + case SYSREG_DBGWCR11_EL1: | ||
160 | + case SYSREG_DBGWCR12_EL1: | ||
161 | + case SYSREG_DBGWCR13_EL1: | ||
162 | + case SYSREG_DBGWCR14_EL1: | ||
163 | + case SYSREG_DBGWCR15_EL1: | ||
164 | + val = env->cp15.dbgwcr[SYSREG_CRM(reg)]; | ||
165 | + break; | ||
166 | default: | ||
167 | if (is_id_sysreg(reg)) { | ||
168 | /* ID system registers read as RES0 */ | ||
169 | @@ -XXX,XX +XXX,XX @@ static int hvf_sysreg_write(CPUState *cpu, uint32_t reg, uint64_t val) | ||
170 | hvf_raise_exception(cpu, EXCP_UDEF, syn_uncategorized()); | ||
171 | } | ||
172 | break; | ||
173 | + case SYSREG_MDSCR_EL1: | ||
174 | + env->cp15.mdscr_el1 = val; | ||
175 | + break; | ||
176 | + case SYSREG_DBGBVR0_EL1: | ||
177 | + case SYSREG_DBGBVR1_EL1: | ||
178 | + case SYSREG_DBGBVR2_EL1: | ||
179 | + case SYSREG_DBGBVR3_EL1: | ||
180 | + case SYSREG_DBGBVR4_EL1: | ||
181 | + case SYSREG_DBGBVR5_EL1: | ||
182 | + case SYSREG_DBGBVR6_EL1: | ||
183 | + case SYSREG_DBGBVR7_EL1: | ||
184 | + case SYSREG_DBGBVR8_EL1: | ||
185 | + case SYSREG_DBGBVR9_EL1: | ||
186 | + case SYSREG_DBGBVR10_EL1: | ||
187 | + case SYSREG_DBGBVR11_EL1: | ||
188 | + case SYSREG_DBGBVR12_EL1: | ||
189 | + case SYSREG_DBGBVR13_EL1: | ||
190 | + case SYSREG_DBGBVR14_EL1: | ||
191 | + case SYSREG_DBGBVR15_EL1: | ||
192 | + env->cp15.dbgbvr[SYSREG_CRM(reg)] = val; | ||
193 | + break; | ||
194 | + case SYSREG_DBGBCR0_EL1: | ||
195 | + case SYSREG_DBGBCR1_EL1: | ||
196 | + case SYSREG_DBGBCR2_EL1: | ||
197 | + case SYSREG_DBGBCR3_EL1: | ||
198 | + case SYSREG_DBGBCR4_EL1: | ||
199 | + case SYSREG_DBGBCR5_EL1: | ||
200 | + case SYSREG_DBGBCR6_EL1: | ||
201 | + case SYSREG_DBGBCR7_EL1: | ||
202 | + case SYSREG_DBGBCR8_EL1: | ||
203 | + case SYSREG_DBGBCR9_EL1: | ||
204 | + case SYSREG_DBGBCR10_EL1: | ||
205 | + case SYSREG_DBGBCR11_EL1: | ||
206 | + case SYSREG_DBGBCR12_EL1: | ||
207 | + case SYSREG_DBGBCR13_EL1: | ||
208 | + case SYSREG_DBGBCR14_EL1: | ||
209 | + case SYSREG_DBGBCR15_EL1: | ||
210 | + env->cp15.dbgbcr[SYSREG_CRM(reg)] = val; | ||
211 | + break; | ||
212 | + case SYSREG_DBGWVR0_EL1: | ||
213 | + case SYSREG_DBGWVR1_EL1: | ||
214 | + case SYSREG_DBGWVR2_EL1: | ||
215 | + case SYSREG_DBGWVR3_EL1: | ||
216 | + case SYSREG_DBGWVR4_EL1: | ||
217 | + case SYSREG_DBGWVR5_EL1: | ||
218 | + case SYSREG_DBGWVR6_EL1: | ||
219 | + case SYSREG_DBGWVR7_EL1: | ||
220 | + case SYSREG_DBGWVR8_EL1: | ||
221 | + case SYSREG_DBGWVR9_EL1: | ||
222 | + case SYSREG_DBGWVR10_EL1: | ||
223 | + case SYSREG_DBGWVR11_EL1: | ||
224 | + case SYSREG_DBGWVR12_EL1: | ||
225 | + case SYSREG_DBGWVR13_EL1: | ||
226 | + case SYSREG_DBGWVR14_EL1: | ||
227 | + case SYSREG_DBGWVR15_EL1: | ||
228 | + env->cp15.dbgwvr[SYSREG_CRM(reg)] = val; | ||
229 | + break; | ||
230 | + case SYSREG_DBGWCR0_EL1: | ||
231 | + case SYSREG_DBGWCR1_EL1: | ||
232 | + case SYSREG_DBGWCR2_EL1: | ||
233 | + case SYSREG_DBGWCR3_EL1: | ||
234 | + case SYSREG_DBGWCR4_EL1: | ||
235 | + case SYSREG_DBGWCR5_EL1: | ||
236 | + case SYSREG_DBGWCR6_EL1: | ||
237 | + case SYSREG_DBGWCR7_EL1: | ||
238 | + case SYSREG_DBGWCR8_EL1: | ||
239 | + case SYSREG_DBGWCR9_EL1: | ||
240 | + case SYSREG_DBGWCR10_EL1: | ||
241 | + case SYSREG_DBGWCR11_EL1: | ||
242 | + case SYSREG_DBGWCR12_EL1: | ||
243 | + case SYSREG_DBGWCR13_EL1: | ||
244 | + case SYSREG_DBGWCR14_EL1: | ||
245 | + case SYSREG_DBGWCR15_EL1: | ||
246 | + env->cp15.dbgwcr[SYSREG_CRM(reg)] = val; | ||
247 | + break; | ||
248 | default: | ||
249 | cpu_synchronize_state(cpu); | ||
250 | trace_hvf_unhandled_sysreg_write(env->pc, reg, | ||
49 | -- | 251 | -- |
50 | 2.25.1 | 252 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Francesco Cagnin <fcagnin@quarkslab.com> |
---|---|---|---|
2 | 2 | ||
3 | Enable SME, TPIDR2_EL0, and FA64 if supported by the cpu. | 3 | Required for guest debugging. The code has been structured like the KVM |
4 | counterpart. | ||
4 | 5 | ||
6 | Signed-off-by: Francesco Cagnin <fcagnin@quarkslab.com> | ||
7 | Message-id: 20230601153107.81955-4-fcagnin@quarkslab.com | ||
5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20220708151540.18136-45-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 10 | --- |
10 | target/arm/cpu.c | 11 +++++++++++ | 11 | include/sysemu/hvf.h | 22 ++++++++ |
11 | 1 file changed, 11 insertions(+) | 12 | include/sysemu/hvf_int.h | 1 + |
13 | accel/hvf/hvf-accel-ops.c | 109 ++++++++++++++++++++++++++++++++++++++ | ||
14 | accel/hvf/hvf-all.c | 17 ++++++ | ||
15 | target/arm/hvf/hvf.c | 63 ++++++++++++++++++++++ | ||
16 | target/i386/hvf/hvf.c | 24 +++++++++ | ||
17 | 6 files changed, 236 insertions(+) | ||
12 | 18 | ||
13 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | 19 | diff --git a/include/sysemu/hvf.h b/include/sysemu/hvf.h |
14 | index XXXXXXX..XXXXXXX 100644 | 20 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/cpu.c | 21 | --- a/include/sysemu/hvf.h |
16 | +++ b/target/arm/cpu.c | 22 | +++ b/include/sysemu/hvf.h |
17 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(DeviceState *dev) | 23 | @@ -XXX,XX +XXX,XX @@ |
18 | CPACR_EL1, ZEN, 3); | 24 | #include "qom/object.h" |
19 | env->vfp.zcr_el[1] = cpu->sve_default_vq - 1; | 25 | |
20 | } | 26 | #ifdef NEED_CPU_H |
21 | + /* and for SME instructions, with default vector length, and TPIDR2 */ | 27 | +#include "cpu.h" |
22 | + if (cpu_isar_feature(aa64_sme, cpu)) { | 28 | |
23 | + env->cp15.sctlr_el[1] |= SCTLR_EnTP2; | 29 | #ifdef CONFIG_HVF |
24 | + env->cp15.cpacr_el1 = FIELD_DP64(env->cp15.cpacr_el1, | 30 | uint32_t hvf_get_supported_cpuid(uint32_t func, uint32_t idx, |
25 | + CPACR_EL1, SMEN, 3); | 31 | @@ -XXX,XX +XXX,XX @@ typedef struct HVFState HVFState; |
26 | + env->vfp.smcr_el[1] = cpu->sme_default_vq - 1; | 32 | DECLARE_INSTANCE_CHECKER(HVFState, HVF_STATE, |
27 | + if (cpu_isar_feature(aa64_sme_fa64, cpu)) { | 33 | TYPE_HVF_ACCEL) |
28 | + env->vfp.smcr_el[1] = FIELD_DP64(env->vfp.smcr_el[1], | 34 | |
29 | + SMCR, FA64, 1); | 35 | +#ifdef NEED_CPU_H |
36 | +struct hvf_sw_breakpoint { | ||
37 | + target_ulong pc; | ||
38 | + target_ulong saved_insn; | ||
39 | + int use_count; | ||
40 | + QTAILQ_ENTRY(hvf_sw_breakpoint) entry; | ||
41 | +}; | ||
42 | + | ||
43 | +struct hvf_sw_breakpoint *hvf_find_sw_breakpoint(CPUState *cpu, | ||
44 | + target_ulong pc); | ||
45 | +int hvf_sw_breakpoints_active(CPUState *cpu); | ||
46 | + | ||
47 | +int hvf_arch_insert_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp); | ||
48 | +int hvf_arch_remove_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp); | ||
49 | +int hvf_arch_insert_hw_breakpoint(target_ulong addr, target_ulong len, | ||
50 | + int type); | ||
51 | +int hvf_arch_remove_hw_breakpoint(target_ulong addr, target_ulong len, | ||
52 | + int type); | ||
53 | +void hvf_arch_remove_all_hw_breakpoints(void); | ||
54 | +#endif /* NEED_CPU_H */ | ||
55 | + | ||
56 | #endif | ||
57 | diff --git a/include/sysemu/hvf_int.h b/include/sysemu/hvf_int.h | ||
58 | index XXXXXXX..XXXXXXX 100644 | ||
59 | --- a/include/sysemu/hvf_int.h | ||
60 | +++ b/include/sysemu/hvf_int.h | ||
61 | @@ -XXX,XX +XXX,XX @@ struct HVFState { | ||
62 | |||
63 | hvf_vcpu_caps *hvf_caps; | ||
64 | uint64_t vtimer_offset; | ||
65 | + QTAILQ_HEAD(, hvf_sw_breakpoint) hvf_sw_breakpoints; | ||
66 | }; | ||
67 | extern HVFState *hvf_state; | ||
68 | |||
69 | diff --git a/accel/hvf/hvf-accel-ops.c b/accel/hvf/hvf-accel-ops.c | ||
70 | index XXXXXXX..XXXXXXX 100644 | ||
71 | --- a/accel/hvf/hvf-accel-ops.c | ||
72 | +++ b/accel/hvf/hvf-accel-ops.c | ||
73 | @@ -XXX,XX +XXX,XX @@ | ||
74 | #include "qemu/main-loop.h" | ||
75 | #include "exec/address-spaces.h" | ||
76 | #include "exec/exec-all.h" | ||
77 | +#include "exec/gdbstub.h" | ||
78 | #include "sysemu/cpus.h" | ||
79 | #include "sysemu/hvf.h" | ||
80 | #include "sysemu/hvf_int.h" | ||
81 | @@ -XXX,XX +XXX,XX @@ static int hvf_accel_init(MachineState *ms) | ||
82 | s->slots[x].slot_id = x; | ||
83 | } | ||
84 | |||
85 | + QTAILQ_INIT(&s->hvf_sw_breakpoints); | ||
86 | + | ||
87 | hvf_state = s; | ||
88 | memory_listener_register(&hvf_memory_listener, &address_space_memory); | ||
89 | |||
90 | @@ -XXX,XX +XXX,XX @@ static void hvf_start_vcpu_thread(CPUState *cpu) | ||
91 | cpu, QEMU_THREAD_JOINABLE); | ||
92 | } | ||
93 | |||
94 | +static int hvf_insert_breakpoint(CPUState *cpu, int type, hwaddr addr, hwaddr len) | ||
95 | +{ | ||
96 | + struct hvf_sw_breakpoint *bp; | ||
97 | + int err; | ||
98 | + | ||
99 | + if (type == GDB_BREAKPOINT_SW) { | ||
100 | + bp = hvf_find_sw_breakpoint(cpu, addr); | ||
101 | + if (bp) { | ||
102 | + bp->use_count++; | ||
103 | + return 0; | ||
104 | + } | ||
105 | + | ||
106 | + bp = g_new(struct hvf_sw_breakpoint, 1); | ||
107 | + bp->pc = addr; | ||
108 | + bp->use_count = 1; | ||
109 | + err = hvf_arch_insert_sw_breakpoint(cpu, bp); | ||
110 | + if (err) { | ||
111 | + g_free(bp); | ||
112 | + return err; | ||
113 | + } | ||
114 | + | ||
115 | + QTAILQ_INSERT_HEAD(&hvf_state->hvf_sw_breakpoints, bp, entry); | ||
116 | + } else { | ||
117 | + err = hvf_arch_insert_hw_breakpoint(addr, len, type); | ||
118 | + if (err) { | ||
119 | + return err; | ||
120 | + } | ||
121 | + } | ||
122 | + | ||
123 | + CPU_FOREACH(cpu) { | ||
124 | + err = hvf_update_guest_debug(cpu); | ||
125 | + if (err) { | ||
126 | + return err; | ||
127 | + } | ||
128 | + } | ||
129 | + return 0; | ||
130 | +} | ||
131 | + | ||
132 | +static int hvf_remove_breakpoint(CPUState *cpu, int type, hwaddr addr, hwaddr len) | ||
133 | +{ | ||
134 | + struct hvf_sw_breakpoint *bp; | ||
135 | + int err; | ||
136 | + | ||
137 | + if (type == GDB_BREAKPOINT_SW) { | ||
138 | + bp = hvf_find_sw_breakpoint(cpu, addr); | ||
139 | + if (!bp) { | ||
140 | + return -ENOENT; | ||
141 | + } | ||
142 | + | ||
143 | + if (bp->use_count > 1) { | ||
144 | + bp->use_count--; | ||
145 | + return 0; | ||
146 | + } | ||
147 | + | ||
148 | + err = hvf_arch_remove_sw_breakpoint(cpu, bp); | ||
149 | + if (err) { | ||
150 | + return err; | ||
151 | + } | ||
152 | + | ||
153 | + QTAILQ_REMOVE(&hvf_state->hvf_sw_breakpoints, bp, entry); | ||
154 | + g_free(bp); | ||
155 | + } else { | ||
156 | + err = hvf_arch_remove_hw_breakpoint(addr, len, type); | ||
157 | + if (err) { | ||
158 | + return err; | ||
159 | + } | ||
160 | + } | ||
161 | + | ||
162 | + CPU_FOREACH(cpu) { | ||
163 | + err = hvf_update_guest_debug(cpu); | ||
164 | + if (err) { | ||
165 | + return err; | ||
166 | + } | ||
167 | + } | ||
168 | + return 0; | ||
169 | +} | ||
170 | + | ||
171 | +static void hvf_remove_all_breakpoints(CPUState *cpu) | ||
172 | +{ | ||
173 | + struct hvf_sw_breakpoint *bp, *next; | ||
174 | + CPUState *tmpcpu; | ||
175 | + | ||
176 | + QTAILQ_FOREACH_SAFE(bp, &hvf_state->hvf_sw_breakpoints, entry, next) { | ||
177 | + if (hvf_arch_remove_sw_breakpoint(cpu, bp) != 0) { | ||
178 | + /* Try harder to find a CPU that currently sees the breakpoint. */ | ||
179 | + CPU_FOREACH(tmpcpu) | ||
180 | + { | ||
181 | + if (hvf_arch_remove_sw_breakpoint(tmpcpu, bp) == 0) { | ||
182 | + break; | ||
183 | + } | ||
30 | + } | 184 | + } |
31 | + } | 185 | + } |
32 | /* | 186 | + QTAILQ_REMOVE(&hvf_state->hvf_sw_breakpoints, bp, entry); |
33 | * Enable 48-bit address space (TODO: take reserved_va into account). | 187 | + g_free(bp); |
34 | * Enable TBI0 but not TBI1. | 188 | + } |
189 | + hvf_arch_remove_all_hw_breakpoints(); | ||
190 | + | ||
191 | + CPU_FOREACH(cpu) { | ||
192 | + hvf_update_guest_debug(cpu); | ||
193 | + } | ||
194 | +} | ||
195 | + | ||
196 | static void hvf_accel_ops_class_init(ObjectClass *oc, void *data) | ||
197 | { | ||
198 | AccelOpsClass *ops = ACCEL_OPS_CLASS(oc); | ||
199 | @@ -XXX,XX +XXX,XX @@ static void hvf_accel_ops_class_init(ObjectClass *oc, void *data) | ||
200 | ops->synchronize_post_init = hvf_cpu_synchronize_post_init; | ||
201 | ops->synchronize_state = hvf_cpu_synchronize_state; | ||
202 | ops->synchronize_pre_loadvm = hvf_cpu_synchronize_pre_loadvm; | ||
203 | + | ||
204 | + ops->insert_breakpoint = hvf_insert_breakpoint; | ||
205 | + ops->remove_breakpoint = hvf_remove_breakpoint; | ||
206 | + ops->remove_all_breakpoints = hvf_remove_all_breakpoints; | ||
207 | }; | ||
208 | static const TypeInfo hvf_accel_ops_type = { | ||
209 | .name = ACCEL_OPS_NAME("hvf"), | ||
210 | diff --git a/accel/hvf/hvf-all.c b/accel/hvf/hvf-all.c | ||
211 | index XXXXXXX..XXXXXXX 100644 | ||
212 | --- a/accel/hvf/hvf-all.c | ||
213 | +++ b/accel/hvf/hvf-all.c | ||
214 | @@ -XXX,XX +XXX,XX @@ void assert_hvf_ok(hv_return_t ret) | ||
215 | |||
216 | abort(); | ||
217 | } | ||
218 | + | ||
219 | +struct hvf_sw_breakpoint *hvf_find_sw_breakpoint(CPUState *cpu, target_ulong pc) | ||
220 | +{ | ||
221 | + struct hvf_sw_breakpoint *bp; | ||
222 | + | ||
223 | + QTAILQ_FOREACH(bp, &hvf_state->hvf_sw_breakpoints, entry) { | ||
224 | + if (bp->pc == pc) { | ||
225 | + return bp; | ||
226 | + } | ||
227 | + } | ||
228 | + return NULL; | ||
229 | +} | ||
230 | + | ||
231 | +int hvf_sw_breakpoints_active(CPUState *cpu) | ||
232 | +{ | ||
233 | + return !QTAILQ_EMPTY(&hvf_state->hvf_sw_breakpoints); | ||
234 | +} | ||
235 | diff --git a/target/arm/hvf/hvf.c b/target/arm/hvf/hvf.c | ||
236 | index XXXXXXX..XXXXXXX 100644 | ||
237 | --- a/target/arm/hvf/hvf.c | ||
238 | +++ b/target/arm/hvf/hvf.c | ||
239 | @@ -XXX,XX +XXX,XX @@ | ||
240 | #include "trace/trace-target_arm_hvf.h" | ||
241 | #include "migration/vmstate.h" | ||
242 | |||
243 | +#include "exec/gdbstub.h" | ||
244 | + | ||
245 | #define HVF_SYSREG(crn, crm, op0, op1, op2) \ | ||
246 | ENCODE_AA64_CP_REG(CP_REG_ARM64_SYSREG_CP, crn, crm, op0, op1, op2) | ||
247 | #define PL1_WRITE_MASK 0x4 | ||
248 | @@ -XXX,XX +XXX,XX @@ int hvf_arch_init(void) | ||
249 | qemu_add_vm_change_state_handler(hvf_vm_state_change, &vtimer); | ||
250 | return 0; | ||
251 | } | ||
252 | + | ||
253 | +static const uint32_t brk_insn = 0xd4200000; | ||
254 | + | ||
255 | +int hvf_arch_insert_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp) | ||
256 | +{ | ||
257 | + if (cpu_memory_rw_debug(cpu, bp->pc, (uint8_t *)&bp->saved_insn, 4, 0) || | ||
258 | + cpu_memory_rw_debug(cpu, bp->pc, (uint8_t *)&brk_insn, 4, 1)) { | ||
259 | + return -EINVAL; | ||
260 | + } | ||
261 | + return 0; | ||
262 | +} | ||
263 | + | ||
264 | +int hvf_arch_remove_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp) | ||
265 | +{ | ||
266 | + static uint32_t brk; | ||
267 | + | ||
268 | + if (cpu_memory_rw_debug(cpu, bp->pc, (uint8_t *)&brk, 4, 0) || | ||
269 | + brk != brk_insn || | ||
270 | + cpu_memory_rw_debug(cpu, bp->pc, (uint8_t *)&bp->saved_insn, 4, 1)) { | ||
271 | + return -EINVAL; | ||
272 | + } | ||
273 | + return 0; | ||
274 | +} | ||
275 | + | ||
276 | +int hvf_arch_insert_hw_breakpoint(target_ulong addr, target_ulong len, int type) | ||
277 | +{ | ||
278 | + switch (type) { | ||
279 | + case GDB_BREAKPOINT_HW: | ||
280 | + return insert_hw_breakpoint(addr); | ||
281 | + case GDB_WATCHPOINT_READ: | ||
282 | + case GDB_WATCHPOINT_WRITE: | ||
283 | + case GDB_WATCHPOINT_ACCESS: | ||
284 | + return insert_hw_watchpoint(addr, len, type); | ||
285 | + default: | ||
286 | + return -ENOSYS; | ||
287 | + } | ||
288 | +} | ||
289 | + | ||
290 | +int hvf_arch_remove_hw_breakpoint(target_ulong addr, target_ulong len, int type) | ||
291 | +{ | ||
292 | + switch (type) { | ||
293 | + case GDB_BREAKPOINT_HW: | ||
294 | + return delete_hw_breakpoint(addr); | ||
295 | + case GDB_WATCHPOINT_READ: | ||
296 | + case GDB_WATCHPOINT_WRITE: | ||
297 | + case GDB_WATCHPOINT_ACCESS: | ||
298 | + return delete_hw_watchpoint(addr, len, type); | ||
299 | + default: | ||
300 | + return -ENOSYS; | ||
301 | + } | ||
302 | +} | ||
303 | + | ||
304 | +void hvf_arch_remove_all_hw_breakpoints(void) | ||
305 | +{ | ||
306 | + if (cur_hw_wps > 0) { | ||
307 | + g_array_remove_range(hw_watchpoints, 0, cur_hw_wps); | ||
308 | + } | ||
309 | + if (cur_hw_bps > 0) { | ||
310 | + g_array_remove_range(hw_breakpoints, 0, cur_hw_bps); | ||
311 | + } | ||
312 | +} | ||
313 | diff --git a/target/i386/hvf/hvf.c b/target/i386/hvf/hvf.c | ||
314 | index XXXXXXX..XXXXXXX 100644 | ||
315 | --- a/target/i386/hvf/hvf.c | ||
316 | +++ b/target/i386/hvf/hvf.c | ||
317 | @@ -XXX,XX +XXX,XX @@ int hvf_vcpu_exec(CPUState *cpu) | ||
318 | |||
319 | return ret; | ||
320 | } | ||
321 | + | ||
322 | +int hvf_arch_insert_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp) | ||
323 | +{ | ||
324 | + return -ENOSYS; | ||
325 | +} | ||
326 | + | ||
327 | +int hvf_arch_remove_sw_breakpoint(CPUState *cpu, struct hvf_sw_breakpoint *bp) | ||
328 | +{ | ||
329 | + return -ENOSYS; | ||
330 | +} | ||
331 | + | ||
332 | +int hvf_arch_insert_hw_breakpoint(target_ulong addr, target_ulong len, int type) | ||
333 | +{ | ||
334 | + return -ENOSYS; | ||
335 | +} | ||
336 | + | ||
337 | +int hvf_arch_remove_hw_breakpoint(target_ulong addr, target_ulong len, int type) | ||
338 | +{ | ||
339 | + return -ENOSYS; | ||
340 | +} | ||
341 | + | ||
342 | +void hvf_arch_remove_all_hw_breakpoints(void) | ||
343 | +{ | ||
344 | +} | ||
35 | -- | 345 | -- |
36 | 2.25.1 | 346 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Francesco Cagnin <fcagnin@quarkslab.com> |
---|---|---|---|
2 | 2 | ||
3 | We cannot reuse the SVE functions for LD[1-4] and ST[1-4], | 3 | Guests can now be debugged through the gdbstub. Support is added for |
4 | because those functions accept only a Zreg register number. | 4 | single-stepping, software breakpoints, hardware breakpoints and |
5 | For SME, we want to pass a pointer into ZA storage. | 5 | watchpoints. The code has been structured like the KVM counterpart. |
6 | 6 | ||
7 | While guest debugging is enabled, the guest can still read and write the | ||
8 | DBG*_EL1 registers but they don't have any effect. | ||
9 | |||
10 | Signed-off-by: Francesco Cagnin <fcagnin@quarkslab.com> | ||
11 | Message-id: 20230601153107.81955-5-fcagnin@quarkslab.com | ||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20220708151540.18136-21-richard.henderson@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 14 | --- |
12 | target/arm/helper-sme.h | 82 +++++ | 15 | include/sysemu/hvf.h | 15 ++ |
13 | target/arm/sme.decode | 9 + | 16 | include/sysemu/hvf_int.h | 1 + |
14 | target/arm/sme_helper.c | 595 +++++++++++++++++++++++++++++++++++++ | 17 | target/arm/hvf_arm.h | 7 + |
15 | target/arm/translate-sme.c | 70 +++++ | 18 | accel/hvf/hvf-accel-ops.c | 10 + |
16 | 4 files changed, 756 insertions(+) | 19 | accel/hvf/hvf-all.c | 6 + |
20 | target/arm/hvf/hvf.c | 474 +++++++++++++++++++++++++++++++++++++- | ||
21 | target/i386/hvf/hvf.c | 9 + | ||
22 | 7 files changed, 520 insertions(+), 2 deletions(-) | ||
17 | 23 | ||
18 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 24 | diff --git a/include/sysemu/hvf.h b/include/sysemu/hvf.h |
19 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/helper-sme.h | 26 | --- a/include/sysemu/hvf.h |
21 | +++ b/target/arm/helper-sme.h | 27 | +++ b/include/sysemu/hvf.h |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(sme_mova_cz_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 28 | @@ -XXX,XX +XXX,XX @@ int hvf_arch_insert_hw_breakpoint(target_ulong addr, target_ulong len, |
23 | DEF_HELPER_FLAGS_4(sme_mova_zc_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 29 | int hvf_arch_remove_hw_breakpoint(target_ulong addr, target_ulong len, |
24 | DEF_HELPER_FLAGS_4(sme_mova_cz_q, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 30 | int type); |
25 | DEF_HELPER_FLAGS_4(sme_mova_zc_q, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 31 | void hvf_arch_remove_all_hw_breakpoints(void); |
26 | + | 32 | + |
27 | +DEF_HELPER_FLAGS_5(sme_ld1b_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 33 | +/* |
28 | +DEF_HELPER_FLAGS_5(sme_ld1b_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 34 | + * hvf_update_guest_debug: |
29 | +DEF_HELPER_FLAGS_5(sme_ld1b_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 35 | + * @cs: CPUState for the CPU to update |
30 | +DEF_HELPER_FLAGS_5(sme_ld1b_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 36 | + * |
31 | + | 37 | + * Update guest to enable or disable debugging. Per-arch specifics will be |
32 | +DEF_HELPER_FLAGS_5(sme_ld1h_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 38 | + * handled by calling down to hvf_arch_update_guest_debug. |
33 | +DEF_HELPER_FLAGS_5(sme_ld1h_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 39 | + */ |
34 | +DEF_HELPER_FLAGS_5(sme_ld1h_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 40 | +int hvf_update_guest_debug(CPUState *cpu); |
35 | +DEF_HELPER_FLAGS_5(sme_ld1h_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 41 | +void hvf_arch_update_guest_debug(CPUState *cpu); |
36 | +DEF_HELPER_FLAGS_5(sme_ld1h_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 42 | + |
37 | +DEF_HELPER_FLAGS_5(sme_ld1h_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 43 | +/* |
38 | +DEF_HELPER_FLAGS_5(sme_ld1h_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 44 | + * Return whether the guest supports debugging. |
39 | +DEF_HELPER_FLAGS_5(sme_ld1h_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 45 | + */ |
40 | + | 46 | +bool hvf_arch_supports_guest_debug(void); |
41 | +DEF_HELPER_FLAGS_5(sme_ld1s_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 47 | #endif /* NEED_CPU_H */ |
42 | +DEF_HELPER_FLAGS_5(sme_ld1s_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 48 | |
43 | +DEF_HELPER_FLAGS_5(sme_ld1s_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 49 | #endif |
44 | +DEF_HELPER_FLAGS_5(sme_ld1s_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 50 | diff --git a/include/sysemu/hvf_int.h b/include/sysemu/hvf_int.h |
45 | +DEF_HELPER_FLAGS_5(sme_ld1s_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
46 | +DEF_HELPER_FLAGS_5(sme_ld1s_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
47 | +DEF_HELPER_FLAGS_5(sme_ld1s_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
48 | +DEF_HELPER_FLAGS_5(sme_ld1s_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
49 | + | ||
50 | +DEF_HELPER_FLAGS_5(sme_ld1d_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
51 | +DEF_HELPER_FLAGS_5(sme_ld1d_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
52 | +DEF_HELPER_FLAGS_5(sme_ld1d_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
53 | +DEF_HELPER_FLAGS_5(sme_ld1d_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
54 | +DEF_HELPER_FLAGS_5(sme_ld1d_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
55 | +DEF_HELPER_FLAGS_5(sme_ld1d_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
56 | +DEF_HELPER_FLAGS_5(sme_ld1d_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
57 | +DEF_HELPER_FLAGS_5(sme_ld1d_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
58 | + | ||
59 | +DEF_HELPER_FLAGS_5(sme_ld1q_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
60 | +DEF_HELPER_FLAGS_5(sme_ld1q_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
61 | +DEF_HELPER_FLAGS_5(sme_ld1q_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
62 | +DEF_HELPER_FLAGS_5(sme_ld1q_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
63 | +DEF_HELPER_FLAGS_5(sme_ld1q_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
64 | +DEF_HELPER_FLAGS_5(sme_ld1q_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
65 | +DEF_HELPER_FLAGS_5(sme_ld1q_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
66 | +DEF_HELPER_FLAGS_5(sme_ld1q_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
67 | + | ||
68 | +DEF_HELPER_FLAGS_5(sme_st1b_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
69 | +DEF_HELPER_FLAGS_5(sme_st1b_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
70 | +DEF_HELPER_FLAGS_5(sme_st1b_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
71 | +DEF_HELPER_FLAGS_5(sme_st1b_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
72 | + | ||
73 | +DEF_HELPER_FLAGS_5(sme_st1h_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
74 | +DEF_HELPER_FLAGS_5(sme_st1h_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
75 | +DEF_HELPER_FLAGS_5(sme_st1h_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
76 | +DEF_HELPER_FLAGS_5(sme_st1h_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
77 | +DEF_HELPER_FLAGS_5(sme_st1h_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
78 | +DEF_HELPER_FLAGS_5(sme_st1h_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
79 | +DEF_HELPER_FLAGS_5(sme_st1h_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
80 | +DEF_HELPER_FLAGS_5(sme_st1h_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
81 | + | ||
82 | +DEF_HELPER_FLAGS_5(sme_st1s_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
83 | +DEF_HELPER_FLAGS_5(sme_st1s_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
84 | +DEF_HELPER_FLAGS_5(sme_st1s_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
85 | +DEF_HELPER_FLAGS_5(sme_st1s_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
86 | +DEF_HELPER_FLAGS_5(sme_st1s_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
87 | +DEF_HELPER_FLAGS_5(sme_st1s_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
88 | +DEF_HELPER_FLAGS_5(sme_st1s_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
89 | +DEF_HELPER_FLAGS_5(sme_st1s_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
90 | + | ||
91 | +DEF_HELPER_FLAGS_5(sme_st1d_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
92 | +DEF_HELPER_FLAGS_5(sme_st1d_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
93 | +DEF_HELPER_FLAGS_5(sme_st1d_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
94 | +DEF_HELPER_FLAGS_5(sme_st1d_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
95 | +DEF_HELPER_FLAGS_5(sme_st1d_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
96 | +DEF_HELPER_FLAGS_5(sme_st1d_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
97 | +DEF_HELPER_FLAGS_5(sme_st1d_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
98 | +DEF_HELPER_FLAGS_5(sme_st1d_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
99 | + | ||
100 | +DEF_HELPER_FLAGS_5(sme_st1q_be_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
101 | +DEF_HELPER_FLAGS_5(sme_st1q_le_h, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
102 | +DEF_HELPER_FLAGS_5(sme_st1q_be_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
103 | +DEF_HELPER_FLAGS_5(sme_st1q_le_v, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
104 | +DEF_HELPER_FLAGS_5(sme_st1q_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
105 | +DEF_HELPER_FLAGS_5(sme_st1q_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
106 | +DEF_HELPER_FLAGS_5(sme_st1q_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
107 | +DEF_HELPER_FLAGS_5(sme_st1q_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | ||
108 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | ||
109 | index XXXXXXX..XXXXXXX 100644 | 51 | index XXXXXXX..XXXXXXX 100644 |
110 | --- a/target/arm/sme.decode | 52 | --- a/include/sysemu/hvf_int.h |
111 | +++ b/target/arm/sme.decode | 53 | +++ b/include/sysemu/hvf_int.h |
112 | @@ -XXX,XX +XXX,XX @@ MOVA 11000000 esz:2 00001 0 v:1 .. pg:3 0 za_imm:4 zr:5 \ | 54 | @@ -XXX,XX +XXX,XX @@ struct hvf_vcpu_state { |
113 | &mova to_vec=1 rs=%mova_rs | 55 | void *exit; |
114 | MOVA 11000000 11 00001 1 v:1 .. pg:3 0 za_imm:4 zr:5 \ | 56 | bool vtimer_masked; |
115 | &mova to_vec=1 rs=%mova_rs esz=4 | 57 | sigset_t unblock_ipi_mask; |
116 | + | 58 | + bool guest_debug_enabled; |
117 | +### SME Memory | 59 | }; |
118 | + | 60 | |
119 | +&ldst esz rs pg rn rm za_imm v:bool st:bool | 61 | void assert_hvf_ok(hv_return_t ret); |
120 | + | 62 | diff --git a/target/arm/hvf_arm.h b/target/arm/hvf_arm.h |
121 | +LDST1 1110000 0 esz:2 st:1 rm:5 v:1 .. pg:3 rn:5 0 za_imm:4 \ | ||
122 | + &ldst rs=%mova_rs | ||
123 | +LDST1 1110000 111 st:1 rm:5 v:1 .. pg:3 rn:5 0 za_imm:4 \ | ||
124 | + &ldst esz=4 rs=%mova_rs | ||
125 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | ||
126 | index XXXXXXX..XXXXXXX 100644 | 63 | index XXXXXXX..XXXXXXX 100644 |
127 | --- a/target/arm/sme_helper.c | 64 | --- a/target/arm/hvf_arm.h |
128 | +++ b/target/arm/sme_helper.c | 65 | +++ b/target/arm/hvf_arm.h |
129 | @@ -XXX,XX +XXX,XX @@ | 66 | @@ -XXX,XX +XXX,XX @@ |
130 | 67 | ||
131 | #include "qemu/osdep.h" | ||
132 | #include "cpu.h" | 68 | #include "cpu.h" |
133 | +#include "internals.h" | 69 | |
134 | #include "tcg/tcg-gvec-desc.h" | 70 | +/** |
135 | #include "exec/helper-proto.h" | 71 | + * hvf_arm_init_debug() - initialize guest debug capabilities |
136 | +#include "exec/cpu_ldst.h" | 72 | + * |
137 | +#include "exec/exec-all.h" | 73 | + * Should be called only once before using guest debug capabilities. |
138 | #include "qemu/int128.h" | ||
139 | #include "vec_internal.h" | ||
140 | +#include "sve_ldst_internal.h" | ||
141 | |||
142 | /* ResetSVEState */ | ||
143 | void arm_reset_sve_state(CPUARMState *env) | ||
144 | @@ -XXX,XX +XXX,XX @@ void HELPER(sme_mova_zc_q)(void *vd, void *za, void *vg, uint32_t desc) | ||
145 | } | ||
146 | |||
147 | #undef DO_MOVA_Z | ||
148 | + | ||
149 | +/* | ||
150 | + * Clear elements in a tile slice comprising len bytes. | ||
151 | + */ | 74 | + */ |
152 | + | 75 | +void hvf_arm_init_debug(void); |
153 | +typedef void ClearFn(void *ptr, size_t off, size_t len); | 76 | + |
154 | + | 77 | void hvf_arm_set_cpu_features_from_host(ARMCPU *cpu); |
155 | +static void clear_horizontal(void *ptr, size_t off, size_t len) | 78 | |
156 | +{ | 79 | #endif |
157 | + memset(ptr + off, 0, len); | 80 | diff --git a/accel/hvf/hvf-accel-ops.c b/accel/hvf/hvf-accel-ops.c |
158 | +} | 81 | index XXXXXXX..XXXXXXX 100644 |
159 | + | 82 | --- a/accel/hvf/hvf-accel-ops.c |
160 | +static void clear_vertical_b(void *vptr, size_t off, size_t len) | 83 | +++ b/accel/hvf/hvf-accel-ops.c |
161 | +{ | 84 | @@ -XXX,XX +XXX,XX @@ static int hvf_accel_init(MachineState *ms) |
162 | + for (size_t i = 0; i < len; ++i) { | 85 | return hvf_arch_init(); |
163 | + *(uint8_t *)(vptr + tile_vslice_offset(i + off)) = 0; | 86 | } |
164 | + } | 87 | |
165 | +} | 88 | +static inline int hvf_gdbstub_sstep_flags(void) |
166 | + | 89 | +{ |
167 | +static void clear_vertical_h(void *vptr, size_t off, size_t len) | 90 | + return SSTEP_ENABLE | SSTEP_NOIRQ; |
168 | +{ | 91 | +} |
169 | + for (size_t i = 0; i < len; i += 2) { | 92 | + |
170 | + *(uint16_t *)(vptr + tile_vslice_offset(i + off)) = 0; | 93 | static void hvf_accel_class_init(ObjectClass *oc, void *data) |
171 | + } | 94 | { |
172 | +} | 95 | AccelClass *ac = ACCEL_CLASS(oc); |
173 | + | 96 | ac->name = "HVF"; |
174 | +static void clear_vertical_s(void *vptr, size_t off, size_t len) | 97 | ac->init_machine = hvf_accel_init; |
175 | +{ | 98 | ac->allowed = &hvf_allowed; |
176 | + for (size_t i = 0; i < len; i += 4) { | 99 | + ac->gdbstub_supported_sstep_flags = hvf_gdbstub_sstep_flags; |
177 | + *(uint32_t *)(vptr + tile_vslice_offset(i + off)) = 0; | 100 | } |
178 | + } | 101 | |
179 | +} | 102 | static const TypeInfo hvf_accel_type = { |
180 | + | 103 | @@ -XXX,XX +XXX,XX @@ static int hvf_init_vcpu(CPUState *cpu) |
181 | +static void clear_vertical_d(void *vptr, size_t off, size_t len) | 104 | cpu->vcpu_dirty = 1; |
182 | +{ | 105 | assert_hvf_ok(r); |
183 | + for (size_t i = 0; i < len; i += 8) { | 106 | |
184 | + *(uint64_t *)(vptr + tile_vslice_offset(i + off)) = 0; | 107 | + cpu->hvf->guest_debug_enabled = false; |
185 | + } | 108 | + |
186 | +} | 109 | return hvf_arch_init_vcpu(cpu); |
187 | + | 110 | } |
188 | +static void clear_vertical_q(void *vptr, size_t off, size_t len) | 111 | |
189 | +{ | 112 | @@ -XXX,XX +XXX,XX @@ static void hvf_accel_ops_class_init(ObjectClass *oc, void *data) |
190 | + for (size_t i = 0; i < len; i += 16) { | 113 | ops->insert_breakpoint = hvf_insert_breakpoint; |
191 | + memset(vptr + tile_vslice_offset(i + off), 0, 16); | 114 | ops->remove_breakpoint = hvf_remove_breakpoint; |
192 | + } | 115 | ops->remove_all_breakpoints = hvf_remove_all_breakpoints; |
193 | +} | 116 | + ops->update_guest_debug = hvf_update_guest_debug; |
194 | + | 117 | + ops->supports_guest_debug = hvf_arch_supports_guest_debug; |
195 | +/* | 118 | }; |
196 | + * Copy elements from an array into a tile slice comprising len bytes. | 119 | static const TypeInfo hvf_accel_ops_type = { |
197 | + */ | 120 | .name = ACCEL_OPS_NAME("hvf"), |
198 | + | 121 | diff --git a/accel/hvf/hvf-all.c b/accel/hvf/hvf-all.c |
199 | +typedef void CopyFn(void *dst, const void *src, size_t len); | 122 | index XXXXXXX..XXXXXXX 100644 |
200 | + | 123 | --- a/accel/hvf/hvf-all.c |
201 | +static void copy_horizontal(void *dst, const void *src, size_t len) | 124 | +++ b/accel/hvf/hvf-all.c |
202 | +{ | 125 | @@ -XXX,XX +XXX,XX @@ int hvf_sw_breakpoints_active(CPUState *cpu) |
203 | + memcpy(dst, src, len); | 126 | { |
204 | +} | 127 | return !QTAILQ_EMPTY(&hvf_state->hvf_sw_breakpoints); |
205 | + | 128 | } |
206 | +static void copy_vertical_b(void *vdst, const void *vsrc, size_t len) | 129 | + |
207 | +{ | 130 | +int hvf_update_guest_debug(CPUState *cpu) |
208 | + const uint8_t *src = vsrc; | 131 | +{ |
209 | + uint8_t *dst = vdst; | 132 | + hvf_arch_update_guest_debug(cpu); |
210 | + size_t i; | 133 | + return 0; |
211 | + | 134 | +} |
212 | + for (i = 0; i < len; ++i) { | 135 | diff --git a/target/arm/hvf/hvf.c b/target/arm/hvf/hvf.c |
213 | + dst[tile_vslice_index(i)] = src[i]; | 136 | index XXXXXXX..XXXXXXX 100644 |
214 | + } | 137 | --- a/target/arm/hvf/hvf.c |
215 | +} | 138 | +++ b/target/arm/hvf/hvf.c |
216 | + | 139 | @@ -XXX,XX +XXX,XX @@ |
217 | +static void copy_vertical_h(void *vdst, const void *vsrc, size_t len) | 140 | |
218 | +{ | 141 | #include "exec/gdbstub.h" |
219 | + const uint16_t *src = vsrc; | 142 | |
220 | + uint16_t *dst = vdst; | 143 | +#define MDSCR_EL1_SS_SHIFT 0 |
221 | + size_t i; | 144 | +#define MDSCR_EL1_MDE_SHIFT 15 |
222 | + | 145 | + |
223 | + for (i = 0; i < len / 2; ++i) { | 146 | +static uint16_t dbgbcr_regs[] = { |
224 | + dst[tile_vslice_index(i)] = src[i]; | 147 | + HV_SYS_REG_DBGBCR0_EL1, |
225 | + } | 148 | + HV_SYS_REG_DBGBCR1_EL1, |
226 | +} | 149 | + HV_SYS_REG_DBGBCR2_EL1, |
227 | + | 150 | + HV_SYS_REG_DBGBCR3_EL1, |
228 | +static void copy_vertical_s(void *vdst, const void *vsrc, size_t len) | 151 | + HV_SYS_REG_DBGBCR4_EL1, |
229 | +{ | 152 | + HV_SYS_REG_DBGBCR5_EL1, |
230 | + const uint32_t *src = vsrc; | 153 | + HV_SYS_REG_DBGBCR6_EL1, |
231 | + uint32_t *dst = vdst; | 154 | + HV_SYS_REG_DBGBCR7_EL1, |
232 | + size_t i; | 155 | + HV_SYS_REG_DBGBCR8_EL1, |
233 | + | 156 | + HV_SYS_REG_DBGBCR9_EL1, |
234 | + for (i = 0; i < len / 4; ++i) { | 157 | + HV_SYS_REG_DBGBCR10_EL1, |
235 | + dst[tile_vslice_index(i)] = src[i]; | 158 | + HV_SYS_REG_DBGBCR11_EL1, |
236 | + } | 159 | + HV_SYS_REG_DBGBCR12_EL1, |
237 | +} | 160 | + HV_SYS_REG_DBGBCR13_EL1, |
238 | + | 161 | + HV_SYS_REG_DBGBCR14_EL1, |
239 | +static void copy_vertical_d(void *vdst, const void *vsrc, size_t len) | 162 | + HV_SYS_REG_DBGBCR15_EL1, |
240 | +{ | 163 | +}; |
241 | + const uint64_t *src = vsrc; | 164 | +static uint16_t dbgbvr_regs[] = { |
242 | + uint64_t *dst = vdst; | 165 | + HV_SYS_REG_DBGBVR0_EL1, |
243 | + size_t i; | 166 | + HV_SYS_REG_DBGBVR1_EL1, |
244 | + | 167 | + HV_SYS_REG_DBGBVR2_EL1, |
245 | + for (i = 0; i < len / 8; ++i) { | 168 | + HV_SYS_REG_DBGBVR3_EL1, |
246 | + dst[tile_vslice_index(i)] = src[i]; | 169 | + HV_SYS_REG_DBGBVR4_EL1, |
247 | + } | 170 | + HV_SYS_REG_DBGBVR5_EL1, |
248 | +} | 171 | + HV_SYS_REG_DBGBVR6_EL1, |
249 | + | 172 | + HV_SYS_REG_DBGBVR7_EL1, |
250 | +static void copy_vertical_q(void *vdst, const void *vsrc, size_t len) | 173 | + HV_SYS_REG_DBGBVR8_EL1, |
251 | +{ | 174 | + HV_SYS_REG_DBGBVR9_EL1, |
252 | + for (size_t i = 0; i < len; i += 16) { | 175 | + HV_SYS_REG_DBGBVR10_EL1, |
253 | + memcpy(vdst + tile_vslice_offset(i), vsrc + i, 16); | 176 | + HV_SYS_REG_DBGBVR11_EL1, |
254 | + } | 177 | + HV_SYS_REG_DBGBVR12_EL1, |
255 | +} | 178 | + HV_SYS_REG_DBGBVR13_EL1, |
256 | + | 179 | + HV_SYS_REG_DBGBVR14_EL1, |
257 | +/* | 180 | + HV_SYS_REG_DBGBVR15_EL1, |
258 | + * Host and TLB primitives for vertical tile slice addressing. | 181 | +}; |
259 | + */ | 182 | +static uint16_t dbgwcr_regs[] = { |
260 | + | 183 | + HV_SYS_REG_DBGWCR0_EL1, |
261 | +#define DO_LD(NAME, TYPE, HOST, TLB) \ | 184 | + HV_SYS_REG_DBGWCR1_EL1, |
262 | +static inline void sme_##NAME##_v_host(void *za, intptr_t off, void *host) \ | 185 | + HV_SYS_REG_DBGWCR2_EL1, |
263 | +{ \ | 186 | + HV_SYS_REG_DBGWCR3_EL1, |
264 | + TYPE val = HOST(host); \ | 187 | + HV_SYS_REG_DBGWCR4_EL1, |
265 | + *(TYPE *)(za + tile_vslice_offset(off)) = val; \ | 188 | + HV_SYS_REG_DBGWCR5_EL1, |
266 | +} \ | 189 | + HV_SYS_REG_DBGWCR6_EL1, |
267 | +static inline void sme_##NAME##_v_tlb(CPUARMState *env, void *za, \ | 190 | + HV_SYS_REG_DBGWCR7_EL1, |
268 | + intptr_t off, target_ulong addr, uintptr_t ra) \ | 191 | + HV_SYS_REG_DBGWCR8_EL1, |
269 | +{ \ | 192 | + HV_SYS_REG_DBGWCR9_EL1, |
270 | + TYPE val = TLB(env, useronly_clean_ptr(addr), ra); \ | 193 | + HV_SYS_REG_DBGWCR10_EL1, |
271 | + *(TYPE *)(za + tile_vslice_offset(off)) = val; \ | 194 | + HV_SYS_REG_DBGWCR11_EL1, |
272 | +} | 195 | + HV_SYS_REG_DBGWCR12_EL1, |
273 | + | 196 | + HV_SYS_REG_DBGWCR13_EL1, |
274 | +#define DO_ST(NAME, TYPE, HOST, TLB) \ | 197 | + HV_SYS_REG_DBGWCR14_EL1, |
275 | +static inline void sme_##NAME##_v_host(void *za, intptr_t off, void *host) \ | 198 | + HV_SYS_REG_DBGWCR15_EL1, |
276 | +{ \ | 199 | +}; |
277 | + TYPE val = *(TYPE *)(za + tile_vslice_offset(off)); \ | 200 | +static uint16_t dbgwvr_regs[] = { |
278 | + HOST(host, val); \ | 201 | + HV_SYS_REG_DBGWVR0_EL1, |
279 | +} \ | 202 | + HV_SYS_REG_DBGWVR1_EL1, |
280 | +static inline void sme_##NAME##_v_tlb(CPUARMState *env, void *za, \ | 203 | + HV_SYS_REG_DBGWVR2_EL1, |
281 | + intptr_t off, target_ulong addr, uintptr_t ra) \ | 204 | + HV_SYS_REG_DBGWVR3_EL1, |
282 | +{ \ | 205 | + HV_SYS_REG_DBGWVR4_EL1, |
283 | + TYPE val = *(TYPE *)(za + tile_vslice_offset(off)); \ | 206 | + HV_SYS_REG_DBGWVR5_EL1, |
284 | + TLB(env, useronly_clean_ptr(addr), val, ra); \ | 207 | + HV_SYS_REG_DBGWVR6_EL1, |
285 | +} | 208 | + HV_SYS_REG_DBGWVR7_EL1, |
286 | + | 209 | + HV_SYS_REG_DBGWVR8_EL1, |
287 | +/* | 210 | + HV_SYS_REG_DBGWVR9_EL1, |
288 | + * The ARMVectorReg elements are stored in host-endian 64-bit units. | 211 | + HV_SYS_REG_DBGWVR10_EL1, |
289 | + * For 128-bit quantities, the sequence defined by the Elem[] pseudocode | 212 | + HV_SYS_REG_DBGWVR11_EL1, |
290 | + * corresponds to storing the two 64-bit pieces in little-endian order. | 213 | + HV_SYS_REG_DBGWVR12_EL1, |
291 | + */ | 214 | + HV_SYS_REG_DBGWVR13_EL1, |
292 | +#define DO_LDQ(HNAME, VNAME, BE, HOST, TLB) \ | 215 | + HV_SYS_REG_DBGWVR14_EL1, |
293 | +static inline void HNAME##_host(void *za, intptr_t off, void *host) \ | 216 | + HV_SYS_REG_DBGWVR15_EL1, |
294 | +{ \ | 217 | +}; |
295 | + uint64_t val0 = HOST(host), val1 = HOST(host + 8); \ | 218 | + |
296 | + uint64_t *ptr = za + off; \ | 219 | +static inline int hvf_arm_num_brps(hv_vcpu_config_t config) |
297 | + ptr[0] = BE ? val1 : val0, ptr[1] = BE ? val0 : val1; \ | 220 | +{ |
298 | +} \ | 221 | + uint64_t val; |
299 | +static inline void VNAME##_v_host(void *za, intptr_t off, void *host) \ | 222 | + hv_return_t ret; |
300 | +{ \ | 223 | + ret = hv_vcpu_config_get_feature_reg(config, HV_FEATURE_REG_ID_AA64DFR0_EL1, |
301 | + HNAME##_host(za, tile_vslice_offset(off), host); \ | 224 | + &val); |
302 | +} \ | 225 | + assert_hvf_ok(ret); |
303 | +static inline void HNAME##_tlb(CPUARMState *env, void *za, intptr_t off, \ | 226 | + return FIELD_EX64(val, ID_AA64DFR0, BRPS) + 1; |
304 | + target_ulong addr, uintptr_t ra) \ | 227 | +} |
305 | +{ \ | 228 | + |
306 | + uint64_t val0 = TLB(env, useronly_clean_ptr(addr), ra); \ | 229 | +static inline int hvf_arm_num_wrps(hv_vcpu_config_t config) |
307 | + uint64_t val1 = TLB(env, useronly_clean_ptr(addr + 8), ra); \ | 230 | +{ |
308 | + uint64_t *ptr = za + off; \ | 231 | + uint64_t val; |
309 | + ptr[0] = BE ? val1 : val0, ptr[1] = BE ? val0 : val1; \ | 232 | + hv_return_t ret; |
310 | +} \ | 233 | + ret = hv_vcpu_config_get_feature_reg(config, HV_FEATURE_REG_ID_AA64DFR0_EL1, |
311 | +static inline void VNAME##_v_tlb(CPUARMState *env, void *za, intptr_t off, \ | 234 | + &val); |
312 | + target_ulong addr, uintptr_t ra) \ | 235 | + assert_hvf_ok(ret); |
313 | +{ \ | 236 | + return FIELD_EX64(val, ID_AA64DFR0, WRPS) + 1; |
314 | + HNAME##_tlb(env, za, tile_vslice_offset(off), addr, ra); \ | 237 | +} |
315 | +} | 238 | + |
316 | + | 239 | +void hvf_arm_init_debug(void) |
317 | +#define DO_STQ(HNAME, VNAME, BE, HOST, TLB) \ | 240 | +{ |
318 | +static inline void HNAME##_host(void *za, intptr_t off, void *host) \ | 241 | + hv_vcpu_config_t config; |
319 | +{ \ | 242 | + config = hv_vcpu_config_create(); |
320 | + uint64_t *ptr = za + off; \ | 243 | + |
321 | + HOST(host, ptr[BE]); \ | 244 | + max_hw_bps = hvf_arm_num_brps(config); |
322 | + HOST(host + 1, ptr[!BE]); \ | 245 | + hw_breakpoints = |
323 | +} \ | 246 | + g_array_sized_new(true, true, sizeof(HWBreakpoint), max_hw_bps); |
324 | +static inline void VNAME##_v_host(void *za, intptr_t off, void *host) \ | 247 | + |
325 | +{ \ | 248 | + max_hw_wps = hvf_arm_num_wrps(config); |
326 | + HNAME##_host(za, tile_vslice_offset(off), host); \ | 249 | + hw_watchpoints = |
327 | +} \ | 250 | + g_array_sized_new(true, true, sizeof(HWWatchpoint), max_hw_wps); |
328 | +static inline void HNAME##_tlb(CPUARMState *env, void *za, intptr_t off, \ | 251 | +} |
329 | + target_ulong addr, uintptr_t ra) \ | 252 | + |
330 | +{ \ | 253 | #define HVF_SYSREG(crn, crm, op0, op1, op2) \ |
331 | + uint64_t *ptr = za + off; \ | 254 | ENCODE_AA64_CP_REG(CP_REG_ARM64_SYSREG_CP, crn, crm, op0, op1, op2) |
332 | + TLB(env, useronly_clean_ptr(addr), ptr[BE], ra); \ | 255 | #define PL1_WRITE_MASK 0x4 |
333 | + TLB(env, useronly_clean_ptr(addr + 8), ptr[!BE], ra); \ | 256 | @@ -XXX,XX +XXX,XX @@ int hvf_get_registers(CPUState *cpu) |
334 | +} \ | 257 | continue; |
335 | +static inline void VNAME##_v_tlb(CPUARMState *env, void *za, intptr_t off, \ | 258 | } |
336 | + target_ulong addr, uintptr_t ra) \ | 259 | |
337 | +{ \ | 260 | + if (cpu->hvf->guest_debug_enabled) { |
338 | + HNAME##_tlb(env, za, tile_vslice_offset(off), addr, ra); \ | 261 | + /* Handle debug registers */ |
339 | +} | 262 | + switch (hvf_sreg_match[i].reg) { |
340 | + | 263 | + case HV_SYS_REG_DBGBVR0_EL1: |
341 | +DO_LD(ld1b, uint8_t, ldub_p, cpu_ldub_data_ra) | 264 | + case HV_SYS_REG_DBGBCR0_EL1: |
342 | +DO_LD(ld1h_be, uint16_t, lduw_be_p, cpu_lduw_be_data_ra) | 265 | + case HV_SYS_REG_DBGWVR0_EL1: |
343 | +DO_LD(ld1h_le, uint16_t, lduw_le_p, cpu_lduw_le_data_ra) | 266 | + case HV_SYS_REG_DBGWCR0_EL1: |
344 | +DO_LD(ld1s_be, uint32_t, ldl_be_p, cpu_ldl_be_data_ra) | 267 | + case HV_SYS_REG_DBGBVR1_EL1: |
345 | +DO_LD(ld1s_le, uint32_t, ldl_le_p, cpu_ldl_le_data_ra) | 268 | + case HV_SYS_REG_DBGBCR1_EL1: |
346 | +DO_LD(ld1d_be, uint64_t, ldq_be_p, cpu_ldq_be_data_ra) | 269 | + case HV_SYS_REG_DBGWVR1_EL1: |
347 | +DO_LD(ld1d_le, uint64_t, ldq_le_p, cpu_ldq_le_data_ra) | 270 | + case HV_SYS_REG_DBGWCR1_EL1: |
348 | + | 271 | + case HV_SYS_REG_DBGBVR2_EL1: |
349 | +DO_LDQ(sve_ld1qq_be, sme_ld1q_be, 1, ldq_be_p, cpu_ldq_be_data_ra) | 272 | + case HV_SYS_REG_DBGBCR2_EL1: |
350 | +DO_LDQ(sve_ld1qq_le, sme_ld1q_le, 0, ldq_le_p, cpu_ldq_le_data_ra) | 273 | + case HV_SYS_REG_DBGWVR2_EL1: |
351 | + | 274 | + case HV_SYS_REG_DBGWCR2_EL1: |
352 | +DO_ST(st1b, uint8_t, stb_p, cpu_stb_data_ra) | 275 | + case HV_SYS_REG_DBGBVR3_EL1: |
353 | +DO_ST(st1h_be, uint16_t, stw_be_p, cpu_stw_be_data_ra) | 276 | + case HV_SYS_REG_DBGBCR3_EL1: |
354 | +DO_ST(st1h_le, uint16_t, stw_le_p, cpu_stw_le_data_ra) | 277 | + case HV_SYS_REG_DBGWVR3_EL1: |
355 | +DO_ST(st1s_be, uint32_t, stl_be_p, cpu_stl_be_data_ra) | 278 | + case HV_SYS_REG_DBGWCR3_EL1: |
356 | +DO_ST(st1s_le, uint32_t, stl_le_p, cpu_stl_le_data_ra) | 279 | + case HV_SYS_REG_DBGBVR4_EL1: |
357 | +DO_ST(st1d_be, uint64_t, stq_be_p, cpu_stq_be_data_ra) | 280 | + case HV_SYS_REG_DBGBCR4_EL1: |
358 | +DO_ST(st1d_le, uint64_t, stq_le_p, cpu_stq_le_data_ra) | 281 | + case HV_SYS_REG_DBGWVR4_EL1: |
359 | + | 282 | + case HV_SYS_REG_DBGWCR4_EL1: |
360 | +DO_STQ(sve_st1qq_be, sme_st1q_be, 1, stq_be_p, cpu_stq_be_data_ra) | 283 | + case HV_SYS_REG_DBGBVR5_EL1: |
361 | +DO_STQ(sve_st1qq_le, sme_st1q_le, 0, stq_le_p, cpu_stq_le_data_ra) | 284 | + case HV_SYS_REG_DBGBCR5_EL1: |
362 | + | 285 | + case HV_SYS_REG_DBGWVR5_EL1: |
363 | +#undef DO_LD | 286 | + case HV_SYS_REG_DBGWCR5_EL1: |
364 | +#undef DO_ST | 287 | + case HV_SYS_REG_DBGBVR6_EL1: |
365 | +#undef DO_LDQ | 288 | + case HV_SYS_REG_DBGBCR6_EL1: |
366 | +#undef DO_STQ | 289 | + case HV_SYS_REG_DBGWVR6_EL1: |
367 | + | 290 | + case HV_SYS_REG_DBGWCR6_EL1: |
368 | +/* | 291 | + case HV_SYS_REG_DBGBVR7_EL1: |
369 | + * Common helper for all contiguous predicated loads. | 292 | + case HV_SYS_REG_DBGBCR7_EL1: |
370 | + */ | 293 | + case HV_SYS_REG_DBGWVR7_EL1: |
371 | + | 294 | + case HV_SYS_REG_DBGWCR7_EL1: |
372 | +static inline QEMU_ALWAYS_INLINE | 295 | + case HV_SYS_REG_DBGBVR8_EL1: |
373 | +void sme_ld1(CPUARMState *env, void *za, uint64_t *vg, | 296 | + case HV_SYS_REG_DBGBCR8_EL1: |
374 | + const target_ulong addr, uint32_t desc, const uintptr_t ra, | 297 | + case HV_SYS_REG_DBGWVR8_EL1: |
375 | + const int esz, uint32_t mtedesc, bool vertical, | 298 | + case HV_SYS_REG_DBGWCR8_EL1: |
376 | + sve_ldst1_host_fn *host_fn, | 299 | + case HV_SYS_REG_DBGBVR9_EL1: |
377 | + sve_ldst1_tlb_fn *tlb_fn, | 300 | + case HV_SYS_REG_DBGBCR9_EL1: |
378 | + ClearFn *clr_fn, | 301 | + case HV_SYS_REG_DBGWVR9_EL1: |
379 | + CopyFn *cpy_fn) | 302 | + case HV_SYS_REG_DBGWCR9_EL1: |
380 | +{ | 303 | + case HV_SYS_REG_DBGBVR10_EL1: |
381 | + const intptr_t reg_max = simd_oprsz(desc); | 304 | + case HV_SYS_REG_DBGBCR10_EL1: |
382 | + const intptr_t esize = 1 << esz; | 305 | + case HV_SYS_REG_DBGWVR10_EL1: |
383 | + intptr_t reg_off, reg_last; | 306 | + case HV_SYS_REG_DBGWCR10_EL1: |
384 | + SVEContLdSt info; | 307 | + case HV_SYS_REG_DBGBVR11_EL1: |
385 | + void *host; | 308 | + case HV_SYS_REG_DBGBCR11_EL1: |
386 | + int flags; | 309 | + case HV_SYS_REG_DBGWVR11_EL1: |
387 | + | 310 | + case HV_SYS_REG_DBGWCR11_EL1: |
388 | + /* Find the active elements. */ | 311 | + case HV_SYS_REG_DBGBVR12_EL1: |
389 | + if (!sve_cont_ldst_elements(&info, addr, vg, reg_max, esz, esize)) { | 312 | + case HV_SYS_REG_DBGBCR12_EL1: |
390 | + /* The entire predicate was false; no load occurs. */ | 313 | + case HV_SYS_REG_DBGWVR12_EL1: |
391 | + clr_fn(za, 0, reg_max); | 314 | + case HV_SYS_REG_DBGWCR12_EL1: |
392 | + return; | 315 | + case HV_SYS_REG_DBGBVR13_EL1: |
393 | + } | 316 | + case HV_SYS_REG_DBGBCR13_EL1: |
394 | + | 317 | + case HV_SYS_REG_DBGWVR13_EL1: |
395 | + /* Probe the page(s). Exit with exception for any invalid page. */ | 318 | + case HV_SYS_REG_DBGWCR13_EL1: |
396 | + sve_cont_ldst_pages(&info, FAULT_ALL, env, addr, MMU_DATA_LOAD, ra); | 319 | + case HV_SYS_REG_DBGBVR14_EL1: |
397 | + | 320 | + case HV_SYS_REG_DBGBCR14_EL1: |
398 | + /* Handle watchpoints for all active elements. */ | 321 | + case HV_SYS_REG_DBGWVR14_EL1: |
399 | + sve_cont_ldst_watchpoints(&info, env, vg, addr, esize, esize, | 322 | + case HV_SYS_REG_DBGWCR14_EL1: |
400 | + BP_MEM_READ, ra); | 323 | + case HV_SYS_REG_DBGBVR15_EL1: |
401 | + | 324 | + case HV_SYS_REG_DBGBCR15_EL1: |
402 | + /* | 325 | + case HV_SYS_REG_DBGWVR15_EL1: |
403 | + * Handle mte checks for all active elements. | 326 | + case HV_SYS_REG_DBGWCR15_EL1: { |
404 | + * Since TBI must be set for MTE, !mtedesc => !mte_active. | 327 | + /* |
405 | + */ | 328 | + * If the guest is being debugged, the vCPU's debug registers |
406 | + if (mtedesc) { | 329 | + * are holding the gdbstub's view of the registers (set in |
407 | + sve_cont_ldst_mte_check(&info, env, vg, addr, esize, esize, | 330 | + * hvf_arch_update_guest_debug()). |
408 | + mtedesc, ra); | 331 | + * Since the environment is used to store only the guest's view |
409 | + } | 332 | + * of the registers, don't update it with the values from the |
410 | + | 333 | + * vCPU but simply keep the values from the previous |
411 | + flags = info.page[0].flags | info.page[1].flags; | 334 | + * environment. |
412 | + if (unlikely(flags != 0)) { | 335 | + */ |
413 | +#ifdef CONFIG_USER_ONLY | 336 | + const ARMCPRegInfo *ri; |
414 | + g_assert_not_reached(); | 337 | + ri = get_arm_cp_reginfo(arm_cpu->cp_regs, hvf_sreg_match[i].key); |
415 | +#else | 338 | + val = read_raw_cp_reg(env, ri); |
416 | + /* | 339 | + |
417 | + * At least one page includes MMIO. | 340 | + arm_cpu->cpreg_values[hvf_sreg_match[i].cp_idx] = val; |
418 | + * Any bus operation can fail with cpu_transaction_failed, | 341 | + continue; |
419 | + * which for ARM will raise SyncExternal. Perform the load | 342 | + } |
420 | + * into scratch memory to preserve register state until the end. | ||
421 | + */ | ||
422 | + ARMVectorReg scratch = { }; | ||
423 | + | ||
424 | + reg_off = info.reg_off_first[0]; | ||
425 | + reg_last = info.reg_off_last[1]; | ||
426 | + if (reg_last < 0) { | ||
427 | + reg_last = info.reg_off_split; | ||
428 | + if (reg_last < 0) { | ||
429 | + reg_last = info.reg_off_last[0]; | ||
430 | + } | 343 | + } |
431 | + } | 344 | + } |
432 | + | 345 | + |
433 | + do { | 346 | ret = hv_vcpu_get_sys_reg(cpu->hvf->fd, hvf_sreg_match[i].reg, &val); |
434 | + uint64_t pg = vg[reg_off >> 6]; | 347 | assert_hvf_ok(ret); |
435 | + do { | 348 | |
436 | + if ((pg >> (reg_off & 63)) & 1) { | 349 | @@ -XXX,XX +XXX,XX @@ int hvf_put_registers(CPUState *cpu) |
437 | + tlb_fn(env, &scratch, reg_off, addr + reg_off, ra); | 350 | continue; |
438 | + } | 351 | } |
439 | + reg_off += esize; | 352 | |
440 | + } while (reg_off & 63); | 353 | + if (cpu->hvf->guest_debug_enabled) { |
441 | + } while (reg_off <= reg_last); | 354 | + /* Handle debug registers */ |
442 | + | 355 | + switch (hvf_sreg_match[i].reg) { |
443 | + cpy_fn(za, &scratch, reg_max); | 356 | + case HV_SYS_REG_DBGBVR0_EL1: |
444 | + return; | 357 | + case HV_SYS_REG_DBGBCR0_EL1: |
445 | +#endif | 358 | + case HV_SYS_REG_DBGWVR0_EL1: |
446 | + } | 359 | + case HV_SYS_REG_DBGWCR0_EL1: |
447 | + | 360 | + case HV_SYS_REG_DBGBVR1_EL1: |
448 | + /* The entire operation is in RAM, on valid pages. */ | 361 | + case HV_SYS_REG_DBGBCR1_EL1: |
449 | + | 362 | + case HV_SYS_REG_DBGWVR1_EL1: |
450 | + reg_off = info.reg_off_first[0]; | 363 | + case HV_SYS_REG_DBGWCR1_EL1: |
451 | + reg_last = info.reg_off_last[0]; | 364 | + case HV_SYS_REG_DBGBVR2_EL1: |
452 | + host = info.page[0].host; | 365 | + case HV_SYS_REG_DBGBCR2_EL1: |
453 | + | 366 | + case HV_SYS_REG_DBGWVR2_EL1: |
454 | + if (!vertical) { | 367 | + case HV_SYS_REG_DBGWCR2_EL1: |
455 | + memset(za, 0, reg_max); | 368 | + case HV_SYS_REG_DBGBVR3_EL1: |
456 | + } else if (reg_off) { | 369 | + case HV_SYS_REG_DBGBCR3_EL1: |
457 | + clr_fn(za, 0, reg_off); | 370 | + case HV_SYS_REG_DBGWVR3_EL1: |
458 | + } | 371 | + case HV_SYS_REG_DBGWCR3_EL1: |
459 | + | 372 | + case HV_SYS_REG_DBGBVR4_EL1: |
460 | + while (reg_off <= reg_last) { | 373 | + case HV_SYS_REG_DBGBCR4_EL1: |
461 | + uint64_t pg = vg[reg_off >> 6]; | 374 | + case HV_SYS_REG_DBGWVR4_EL1: |
462 | + do { | 375 | + case HV_SYS_REG_DBGWCR4_EL1: |
463 | + if ((pg >> (reg_off & 63)) & 1) { | 376 | + case HV_SYS_REG_DBGBVR5_EL1: |
464 | + host_fn(za, reg_off, host + reg_off); | 377 | + case HV_SYS_REG_DBGBCR5_EL1: |
465 | + } else if (vertical) { | 378 | + case HV_SYS_REG_DBGWVR5_EL1: |
466 | + clr_fn(za, reg_off, esize); | 379 | + case HV_SYS_REG_DBGWCR5_EL1: |
467 | + } | 380 | + case HV_SYS_REG_DBGBVR6_EL1: |
468 | + reg_off += esize; | 381 | + case HV_SYS_REG_DBGBCR6_EL1: |
469 | + } while (reg_off <= reg_last && (reg_off & 63)); | 382 | + case HV_SYS_REG_DBGWVR6_EL1: |
470 | + } | 383 | + case HV_SYS_REG_DBGWCR6_EL1: |
471 | + | 384 | + case HV_SYS_REG_DBGBVR7_EL1: |
472 | + /* | 385 | + case HV_SYS_REG_DBGBCR7_EL1: |
473 | + * Use the slow path to manage the cross-page misalignment. | 386 | + case HV_SYS_REG_DBGWVR7_EL1: |
474 | + * But we know this is RAM and cannot trap. | 387 | + case HV_SYS_REG_DBGWCR7_EL1: |
475 | + */ | 388 | + case HV_SYS_REG_DBGBVR8_EL1: |
476 | + reg_off = info.reg_off_split; | 389 | + case HV_SYS_REG_DBGBCR8_EL1: |
477 | + if (unlikely(reg_off >= 0)) { | 390 | + case HV_SYS_REG_DBGWVR8_EL1: |
478 | + tlb_fn(env, za, reg_off, addr + reg_off, ra); | 391 | + case HV_SYS_REG_DBGWCR8_EL1: |
479 | + } | 392 | + case HV_SYS_REG_DBGBVR9_EL1: |
480 | + | 393 | + case HV_SYS_REG_DBGBCR9_EL1: |
481 | + reg_off = info.reg_off_first[1]; | 394 | + case HV_SYS_REG_DBGWVR9_EL1: |
482 | + if (unlikely(reg_off >= 0)) { | 395 | + case HV_SYS_REG_DBGWCR9_EL1: |
483 | + reg_last = info.reg_off_last[1]; | 396 | + case HV_SYS_REG_DBGBVR10_EL1: |
484 | + host = info.page[1].host; | 397 | + case HV_SYS_REG_DBGBCR10_EL1: |
485 | + | 398 | + case HV_SYS_REG_DBGWVR10_EL1: |
486 | + do { | 399 | + case HV_SYS_REG_DBGWCR10_EL1: |
487 | + uint64_t pg = vg[reg_off >> 6]; | 400 | + case HV_SYS_REG_DBGBVR11_EL1: |
488 | + do { | 401 | + case HV_SYS_REG_DBGBCR11_EL1: |
489 | + if ((pg >> (reg_off & 63)) & 1) { | 402 | + case HV_SYS_REG_DBGWVR11_EL1: |
490 | + host_fn(za, reg_off, host + reg_off); | 403 | + case HV_SYS_REG_DBGWCR11_EL1: |
491 | + } else if (vertical) { | 404 | + case HV_SYS_REG_DBGBVR12_EL1: |
492 | + clr_fn(za, reg_off, esize); | 405 | + case HV_SYS_REG_DBGBCR12_EL1: |
493 | + } | 406 | + case HV_SYS_REG_DBGWVR12_EL1: |
494 | + reg_off += esize; | 407 | + case HV_SYS_REG_DBGWCR12_EL1: |
495 | + } while (reg_off & 63); | 408 | + case HV_SYS_REG_DBGBVR13_EL1: |
496 | + } while (reg_off <= reg_last); | 409 | + case HV_SYS_REG_DBGBCR13_EL1: |
497 | + } | 410 | + case HV_SYS_REG_DBGWVR13_EL1: |
498 | +} | 411 | + case HV_SYS_REG_DBGWCR13_EL1: |
499 | + | 412 | + case HV_SYS_REG_DBGBVR14_EL1: |
500 | +static inline QEMU_ALWAYS_INLINE | 413 | + case HV_SYS_REG_DBGBCR14_EL1: |
501 | +void sme_ld1_mte(CPUARMState *env, void *za, uint64_t *vg, | 414 | + case HV_SYS_REG_DBGWVR14_EL1: |
502 | + target_ulong addr, uint32_t desc, uintptr_t ra, | 415 | + case HV_SYS_REG_DBGWCR14_EL1: |
503 | + const int esz, bool vertical, | 416 | + case HV_SYS_REG_DBGBVR15_EL1: |
504 | + sve_ldst1_host_fn *host_fn, | 417 | + case HV_SYS_REG_DBGBCR15_EL1: |
505 | + sve_ldst1_tlb_fn *tlb_fn, | 418 | + case HV_SYS_REG_DBGWVR15_EL1: |
506 | + ClearFn *clr_fn, | 419 | + case HV_SYS_REG_DBGWCR15_EL1: |
507 | + CopyFn *cpy_fn) | 420 | + /* |
508 | +{ | 421 | + * If the guest is being debugged, the vCPU's debug registers |
509 | + uint32_t mtedesc = desc >> (SIMD_DATA_SHIFT + SVE_MTEDESC_SHIFT); | 422 | + * are already holding the gdbstub's view of the registers (set |
510 | + int bit55 = extract64(addr, 55, 1); | 423 | + * in hvf_arch_update_guest_debug()). |
511 | + | 424 | + */ |
512 | + /* Remove mtedesc from the normal sve descriptor. */ | 425 | + continue; |
513 | + desc = extract32(desc, 0, SIMD_DATA_SHIFT + SVE_MTEDESC_SHIFT); | ||
514 | + | ||
515 | + /* Perform gross MTE suppression early. */ | ||
516 | + if (!tbi_check(desc, bit55) || | ||
517 | + tcma_check(desc, bit55, allocation_tag_from_addr(addr))) { | ||
518 | + mtedesc = 0; | ||
519 | + } | ||
520 | + | ||
521 | + sme_ld1(env, za, vg, addr, desc, ra, esz, mtedesc, vertical, | ||
522 | + host_fn, tlb_fn, clr_fn, cpy_fn); | ||
523 | +} | ||
524 | + | ||
525 | +#define DO_LD(L, END, ESZ) \ | ||
526 | +void HELPER(sme_ld1##L##END##_h)(CPUARMState *env, void *za, void *vg, \ | ||
527 | + target_ulong addr, uint32_t desc) \ | ||
528 | +{ \ | ||
529 | + sme_ld1(env, za, vg, addr, desc, GETPC(), ESZ, 0, false, \ | ||
530 | + sve_ld1##L##L##END##_host, sve_ld1##L##L##END##_tlb, \ | ||
531 | + clear_horizontal, copy_horizontal); \ | ||
532 | +} \ | ||
533 | +void HELPER(sme_ld1##L##END##_v)(CPUARMState *env, void *za, void *vg, \ | ||
534 | + target_ulong addr, uint32_t desc) \ | ||
535 | +{ \ | ||
536 | + sme_ld1(env, za, vg, addr, desc, GETPC(), ESZ, 0, true, \ | ||
537 | + sme_ld1##L##END##_v_host, sme_ld1##L##END##_v_tlb, \ | ||
538 | + clear_vertical_##L, copy_vertical_##L); \ | ||
539 | +} \ | ||
540 | +void HELPER(sme_ld1##L##END##_h_mte)(CPUARMState *env, void *za, void *vg, \ | ||
541 | + target_ulong addr, uint32_t desc) \ | ||
542 | +{ \ | ||
543 | + sme_ld1_mte(env, za, vg, addr, desc, GETPC(), ESZ, false, \ | ||
544 | + sve_ld1##L##L##END##_host, sve_ld1##L##L##END##_tlb, \ | ||
545 | + clear_horizontal, copy_horizontal); \ | ||
546 | +} \ | ||
547 | +void HELPER(sme_ld1##L##END##_v_mte)(CPUARMState *env, void *za, void *vg, \ | ||
548 | + target_ulong addr, uint32_t desc) \ | ||
549 | +{ \ | ||
550 | + sme_ld1_mte(env, za, vg, addr, desc, GETPC(), ESZ, true, \ | ||
551 | + sme_ld1##L##END##_v_host, sme_ld1##L##END##_v_tlb, \ | ||
552 | + clear_vertical_##L, copy_vertical_##L); \ | ||
553 | +} | ||
554 | + | ||
555 | +DO_LD(b, , MO_8) | ||
556 | +DO_LD(h, _be, MO_16) | ||
557 | +DO_LD(h, _le, MO_16) | ||
558 | +DO_LD(s, _be, MO_32) | ||
559 | +DO_LD(s, _le, MO_32) | ||
560 | +DO_LD(d, _be, MO_64) | ||
561 | +DO_LD(d, _le, MO_64) | ||
562 | +DO_LD(q, _be, MO_128) | ||
563 | +DO_LD(q, _le, MO_128) | ||
564 | + | ||
565 | +#undef DO_LD | ||
566 | + | ||
567 | +/* | ||
568 | + * Common helper for all contiguous predicated stores. | ||
569 | + */ | ||
570 | + | ||
571 | +static inline QEMU_ALWAYS_INLINE | ||
572 | +void sme_st1(CPUARMState *env, void *za, uint64_t *vg, | ||
573 | + const target_ulong addr, uint32_t desc, const uintptr_t ra, | ||
574 | + const int esz, uint32_t mtedesc, bool vertical, | ||
575 | + sve_ldst1_host_fn *host_fn, | ||
576 | + sve_ldst1_tlb_fn *tlb_fn) | ||
577 | +{ | ||
578 | + const intptr_t reg_max = simd_oprsz(desc); | ||
579 | + const intptr_t esize = 1 << esz; | ||
580 | + intptr_t reg_off, reg_last; | ||
581 | + SVEContLdSt info; | ||
582 | + void *host; | ||
583 | + int flags; | ||
584 | + | ||
585 | + /* Find the active elements. */ | ||
586 | + if (!sve_cont_ldst_elements(&info, addr, vg, reg_max, esz, esize)) { | ||
587 | + /* The entire predicate was false; no store occurs. */ | ||
588 | + return; | ||
589 | + } | ||
590 | + | ||
591 | + /* Probe the page(s). Exit with exception for any invalid page. */ | ||
592 | + sve_cont_ldst_pages(&info, FAULT_ALL, env, addr, MMU_DATA_STORE, ra); | ||
593 | + | ||
594 | + /* Handle watchpoints for all active elements. */ | ||
595 | + sve_cont_ldst_watchpoints(&info, env, vg, addr, esize, esize, | ||
596 | + BP_MEM_WRITE, ra); | ||
597 | + | ||
598 | + /* | ||
599 | + * Handle mte checks for all active elements. | ||
600 | + * Since TBI must be set for MTE, !mtedesc => !mte_active. | ||
601 | + */ | ||
602 | + if (mtedesc) { | ||
603 | + sve_cont_ldst_mte_check(&info, env, vg, addr, esize, esize, | ||
604 | + mtedesc, ra); | ||
605 | + } | ||
606 | + | ||
607 | + flags = info.page[0].flags | info.page[1].flags; | ||
608 | + if (unlikely(flags != 0)) { | ||
609 | +#ifdef CONFIG_USER_ONLY | ||
610 | + g_assert_not_reached(); | ||
611 | +#else | ||
612 | + /* | ||
613 | + * At least one page includes MMIO. | ||
614 | + * Any bus operation can fail with cpu_transaction_failed, | ||
615 | + * which for ARM will raise SyncExternal. We cannot avoid | ||
616 | + * this fault and will leave with the store incomplete. | ||
617 | + */ | ||
618 | + reg_off = info.reg_off_first[0]; | ||
619 | + reg_last = info.reg_off_last[1]; | ||
620 | + if (reg_last < 0) { | ||
621 | + reg_last = info.reg_off_split; | ||
622 | + if (reg_last < 0) { | ||
623 | + reg_last = info.reg_off_last[0]; | ||
624 | + } | 426 | + } |
625 | + } | 427 | + } |
626 | + | 428 | + |
627 | + do { | 429 | val = arm_cpu->cpreg_values[hvf_sreg_match[i].cp_idx]; |
628 | + uint64_t pg = vg[reg_off >> 6]; | 430 | ret = hv_vcpu_set_sys_reg(cpu->hvf->fd, hvf_sreg_match[i].reg, val); |
629 | + do { | 431 | assert_hvf_ok(ret); |
630 | + if ((pg >> (reg_off & 63)) & 1) { | 432 | @@ -XXX,XX +XXX,XX @@ int hvf_vcpu_exec(CPUState *cpu) |
631 | + tlb_fn(env, za, reg_off, addr + reg_off, ra); | 433 | { |
632 | + } | 434 | ARMCPU *arm_cpu = ARM_CPU(cpu); |
633 | + reg_off += esize; | 435 | CPUARMState *env = &arm_cpu->env; |
634 | + } while (reg_off & 63); | 436 | + int ret; |
635 | + } while (reg_off <= reg_last); | 437 | hv_vcpu_exit_t *hvf_exit = cpu->hvf->exit; |
636 | + return; | 438 | hv_return_t r; |
637 | +#endif | 439 | bool advance_pc = false; |
638 | + } | 440 | |
639 | + | 441 | - if (hvf_inject_interrupts(cpu)) { |
640 | + reg_off = info.reg_off_first[0]; | 442 | + if (!(cpu->singlestep_enabled & SSTEP_NOIRQ) && |
641 | + reg_last = info.reg_off_last[0]; | 443 | + hvf_inject_interrupts(cpu)) { |
642 | + host = info.page[0].host; | 444 | return EXCP_INTERRUPT; |
643 | + | 445 | } |
644 | + while (reg_off <= reg_last) { | 446 | |
645 | + uint64_t pg = vg[reg_off >> 6]; | 447 | @@ -XXX,XX +XXX,XX @@ int hvf_vcpu_exec(CPUState *cpu) |
646 | + do { | 448 | uint64_t syndrome = hvf_exit->exception.syndrome; |
647 | + if ((pg >> (reg_off & 63)) & 1) { | 449 | uint32_t ec = syn_get_ec(syndrome); |
648 | + host_fn(za, reg_off, host + reg_off); | 450 | |
649 | + } | 451 | + ret = 0; |
650 | + reg_off += 1 << esz; | 452 | qemu_mutex_lock_iothread(); |
651 | + } while (reg_off <= reg_last && (reg_off & 63)); | 453 | switch (exit_reason) { |
652 | + } | 454 | case HV_EXIT_REASON_EXCEPTION: |
653 | + | 455 | @@ -XXX,XX +XXX,XX @@ int hvf_vcpu_exec(CPUState *cpu) |
654 | + /* | 456 | hvf_sync_vtimer(cpu); |
655 | + * Use the slow path to manage the cross-page misalignment. | 457 | |
656 | + * But we know this is RAM and cannot trap. | 458 | switch (ec) { |
657 | + */ | 459 | + case EC_SOFTWARESTEP: { |
658 | + reg_off = info.reg_off_split; | 460 | + ret = EXCP_DEBUG; |
659 | + if (unlikely(reg_off >= 0)) { | 461 | + |
660 | + tlb_fn(env, za, reg_off, addr + reg_off, ra); | 462 | + if (!cpu->singlestep_enabled) { |
661 | + } | 463 | + error_report("EC_SOFTWARESTEP but single-stepping not enabled"); |
662 | + | 464 | + } |
663 | + reg_off = info.reg_off_first[1]; | 465 | + break; |
664 | + if (unlikely(reg_off >= 0)) { | 466 | + } |
665 | + reg_last = info.reg_off_last[1]; | 467 | + case EC_AA64_BKPT: { |
666 | + host = info.page[1].host; | 468 | + ret = EXCP_DEBUG; |
667 | + | 469 | + |
668 | + do { | 470 | + cpu_synchronize_state(cpu); |
669 | + uint64_t pg = vg[reg_off >> 6]; | 471 | + |
670 | + do { | 472 | + if (!hvf_find_sw_breakpoint(cpu, env->pc)) { |
671 | + if ((pg >> (reg_off & 63)) & 1) { | 473 | + /* Re-inject into the guest */ |
672 | + host_fn(za, reg_off, host + reg_off); | 474 | + ret = 0; |
673 | + } | 475 | + hvf_raise_exception(cpu, EXCP_BKPT, syn_aa64_bkpt(0)); |
674 | + reg_off += 1 << esz; | 476 | + } |
675 | + } while (reg_off & 63); | 477 | + break; |
676 | + } while (reg_off <= reg_last); | 478 | + } |
677 | + } | 479 | + case EC_BREAKPOINT: { |
678 | +} | 480 | + ret = EXCP_DEBUG; |
679 | + | 481 | + |
680 | +static inline QEMU_ALWAYS_INLINE | 482 | + cpu_synchronize_state(cpu); |
681 | +void sme_st1_mte(CPUARMState *env, void *za, uint64_t *vg, target_ulong addr, | 483 | + |
682 | + uint32_t desc, uintptr_t ra, int esz, bool vertical, | 484 | + if (!find_hw_breakpoint(cpu, env->pc)) { |
683 | + sve_ldst1_host_fn *host_fn, | 485 | + error_report("EC_BREAKPOINT but unknown hw breakpoint"); |
684 | + sve_ldst1_tlb_fn *tlb_fn) | 486 | + } |
685 | +{ | 487 | + break; |
686 | + uint32_t mtedesc = desc >> (SIMD_DATA_SHIFT + SVE_MTEDESC_SHIFT); | 488 | + } |
687 | + int bit55 = extract64(addr, 55, 1); | 489 | + case EC_WATCHPOINT: { |
688 | + | 490 | + ret = EXCP_DEBUG; |
689 | + /* Remove mtedesc from the normal sve descriptor. */ | 491 | + |
690 | + desc = extract32(desc, 0, SIMD_DATA_SHIFT + SVE_MTEDESC_SHIFT); | 492 | + cpu_synchronize_state(cpu); |
691 | + | 493 | + |
692 | + /* Perform gross MTE suppression early. */ | 494 | + CPUWatchpoint *wp = |
693 | + if (!tbi_check(desc, bit55) || | 495 | + find_hw_watchpoint(cpu, hvf_exit->exception.virtual_address); |
694 | + tcma_check(desc, bit55, allocation_tag_from_addr(addr))) { | 496 | + if (!wp) { |
695 | + mtedesc = 0; | 497 | + error_report("EXCP_DEBUG but unknown hw watchpoint"); |
696 | + } | 498 | + } |
697 | + | 499 | + cpu->watchpoint_hit = wp; |
698 | + sme_st1(env, za, vg, addr, desc, ra, esz, mtedesc, | 500 | + break; |
699 | + vertical, host_fn, tlb_fn); | 501 | + } |
700 | +} | 502 | case EC_DATAABORT: { |
701 | + | 503 | bool isv = syndrome & ARM_EL_ISV; |
702 | +#define DO_ST(L, END, ESZ) \ | 504 | bool iswrite = (syndrome >> 6) & 1; |
703 | +void HELPER(sme_st1##L##END##_h)(CPUARMState *env, void *za, void *vg, \ | 505 | @@ -XXX,XX +XXX,XX @@ int hvf_vcpu_exec(CPUState *cpu) |
704 | + target_ulong addr, uint32_t desc) \ | 506 | pc += 4; |
705 | +{ \ | 507 | r = hv_vcpu_set_reg(cpu->hvf->fd, HV_REG_PC, pc); |
706 | + sme_st1(env, za, vg, addr, desc, GETPC(), ESZ, 0, false, \ | 508 | assert_hvf_ok(r); |
707 | + sve_st1##L##L##END##_host, sve_st1##L##L##END##_tlb); \ | 509 | + |
708 | +} \ | 510 | + /* Handle single-stepping over instructions which trigger a VM exit */ |
709 | +void HELPER(sme_st1##L##END##_v)(CPUARMState *env, void *za, void *vg, \ | 511 | + if (cpu->singlestep_enabled) { |
710 | + target_ulong addr, uint32_t desc) \ | 512 | + ret = EXCP_DEBUG; |
711 | +{ \ | 513 | + } |
712 | + sme_st1(env, za, vg, addr, desc, GETPC(), ESZ, 0, true, \ | 514 | } |
713 | + sme_st1##L##END##_v_host, sme_st1##L##END##_v_tlb); \ | 515 | |
714 | +} \ | 516 | - return 0; |
715 | +void HELPER(sme_st1##L##END##_h_mte)(CPUARMState *env, void *za, void *vg, \ | 517 | + return ret; |
716 | + target_ulong addr, uint32_t desc) \ | 518 | } |
717 | +{ \ | 519 | |
718 | + sme_st1_mte(env, za, vg, addr, desc, GETPC(), ESZ, false, \ | 520 | static const VMStateDescription vmstate_hvf_vtimer = { |
719 | + sve_st1##L##L##END##_host, sve_st1##L##L##END##_tlb); \ | 521 | @@ -XXX,XX +XXX,XX @@ int hvf_arch_init(void) |
720 | +} \ | 522 | hvf_state->vtimer_offset = mach_absolute_time(); |
721 | +void HELPER(sme_st1##L##END##_v_mte)(CPUARMState *env, void *za, void *vg, \ | 523 | vmstate_register(NULL, 0, &vmstate_hvf_vtimer, &vtimer); |
722 | + target_ulong addr, uint32_t desc) \ | 524 | qemu_add_vm_change_state_handler(hvf_vm_state_change, &vtimer); |
723 | +{ \ | 525 | + |
724 | + sme_st1_mte(env, za, vg, addr, desc, GETPC(), ESZ, true, \ | 526 | + hvf_arm_init_debug(); |
725 | + sme_st1##L##END##_v_host, sme_st1##L##END##_v_tlb); \ | 527 | + |
726 | +} | 528 | return 0; |
727 | + | 529 | } |
728 | +DO_ST(b, , MO_8) | 530 | |
729 | +DO_ST(h, _be, MO_16) | 531 | @@ -XXX,XX +XXX,XX @@ void hvf_arch_remove_all_hw_breakpoints(void) |
730 | +DO_ST(h, _le, MO_16) | 532 | g_array_remove_range(hw_breakpoints, 0, cur_hw_bps); |
731 | +DO_ST(s, _be, MO_32) | 533 | } |
732 | +DO_ST(s, _le, MO_32) | 534 | } |
733 | +DO_ST(d, _be, MO_64) | 535 | + |
734 | +DO_ST(d, _le, MO_64) | 536 | +/* |
735 | +DO_ST(q, _be, MO_128) | 537 | + * Update the vCPU with the gdbstub's view of debug registers. This view |
736 | +DO_ST(q, _le, MO_128) | 538 | + * consists of all hardware breakpoints and watchpoints inserted so far while |
737 | + | 539 | + * debugging the guest. |
738 | +#undef DO_ST | 540 | + */ |
739 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 541 | +static void hvf_put_gdbstub_debug_registers(CPUState *cpu) |
542 | +{ | ||
543 | + hv_return_t r = HV_SUCCESS; | ||
544 | + int i; | ||
545 | + | ||
546 | + for (i = 0; i < cur_hw_bps; i++) { | ||
547 | + HWBreakpoint *bp = get_hw_bp(i); | ||
548 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbcr_regs[i], bp->bcr); | ||
549 | + assert_hvf_ok(r); | ||
550 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbvr_regs[i], bp->bvr); | ||
551 | + assert_hvf_ok(r); | ||
552 | + } | ||
553 | + for (i = cur_hw_bps; i < max_hw_bps; i++) { | ||
554 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbcr_regs[i], 0); | ||
555 | + assert_hvf_ok(r); | ||
556 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbvr_regs[i], 0); | ||
557 | + assert_hvf_ok(r); | ||
558 | + } | ||
559 | + | ||
560 | + for (i = 0; i < cur_hw_wps; i++) { | ||
561 | + HWWatchpoint *wp = get_hw_wp(i); | ||
562 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwcr_regs[i], wp->wcr); | ||
563 | + assert_hvf_ok(r); | ||
564 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwvr_regs[i], wp->wvr); | ||
565 | + assert_hvf_ok(r); | ||
566 | + } | ||
567 | + for (i = cur_hw_wps; i < max_hw_wps; i++) { | ||
568 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwcr_regs[i], 0); | ||
569 | + assert_hvf_ok(r); | ||
570 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwvr_regs[i], 0); | ||
571 | + assert_hvf_ok(r); | ||
572 | + } | ||
573 | +} | ||
574 | + | ||
575 | +/* | ||
576 | + * Update the vCPU with the guest's view of debug registers. This view is kept | ||
577 | + * in the environment at all times. | ||
578 | + */ | ||
579 | +static void hvf_put_guest_debug_registers(CPUState *cpu) | ||
580 | +{ | ||
581 | + ARMCPU *arm_cpu = ARM_CPU(cpu); | ||
582 | + CPUARMState *env = &arm_cpu->env; | ||
583 | + hv_return_t r = HV_SUCCESS; | ||
584 | + int i; | ||
585 | + | ||
586 | + for (i = 0; i < max_hw_bps; i++) { | ||
587 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbcr_regs[i], | ||
588 | + env->cp15.dbgbcr[i]); | ||
589 | + assert_hvf_ok(r); | ||
590 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgbvr_regs[i], | ||
591 | + env->cp15.dbgbvr[i]); | ||
592 | + assert_hvf_ok(r); | ||
593 | + } | ||
594 | + | ||
595 | + for (i = 0; i < max_hw_wps; i++) { | ||
596 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwcr_regs[i], | ||
597 | + env->cp15.dbgwcr[i]); | ||
598 | + assert_hvf_ok(r); | ||
599 | + r = hv_vcpu_set_sys_reg(cpu->hvf->fd, dbgwvr_regs[i], | ||
600 | + env->cp15.dbgwvr[i]); | ||
601 | + assert_hvf_ok(r); | ||
602 | + } | ||
603 | +} | ||
604 | + | ||
605 | +static inline bool hvf_arm_hw_debug_active(CPUState *cpu) | ||
606 | +{ | ||
607 | + return ((cur_hw_wps > 0) || (cur_hw_bps > 0)); | ||
608 | +} | ||
609 | + | ||
610 | +static void hvf_arch_set_traps(void) | ||
611 | +{ | ||
612 | + CPUState *cpu; | ||
613 | + bool should_enable_traps = false; | ||
614 | + hv_return_t r = HV_SUCCESS; | ||
615 | + | ||
616 | + /* Check whether guest debugging is enabled for at least one vCPU; if it | ||
617 | + * is, enable exiting the guest on all vCPUs */ | ||
618 | + CPU_FOREACH(cpu) { | ||
619 | + should_enable_traps |= cpu->hvf->guest_debug_enabled; | ||
620 | + } | ||
621 | + CPU_FOREACH(cpu) { | ||
622 | + /* Set whether debug exceptions exit the guest */ | ||
623 | + r = hv_vcpu_set_trap_debug_exceptions(cpu->hvf->fd, | ||
624 | + should_enable_traps); | ||
625 | + assert_hvf_ok(r); | ||
626 | + | ||
627 | + /* Set whether accesses to debug registers exit the guest */ | ||
628 | + r = hv_vcpu_set_trap_debug_reg_accesses(cpu->hvf->fd, | ||
629 | + should_enable_traps); | ||
630 | + assert_hvf_ok(r); | ||
631 | + } | ||
632 | +} | ||
633 | + | ||
634 | +void hvf_arch_update_guest_debug(CPUState *cpu) | ||
635 | +{ | ||
636 | + ARMCPU *arm_cpu = ARM_CPU(cpu); | ||
637 | + CPUARMState *env = &arm_cpu->env; | ||
638 | + | ||
639 | + /* Check whether guest debugging is enabled */ | ||
640 | + cpu->hvf->guest_debug_enabled = cpu->singlestep_enabled || | ||
641 | + hvf_sw_breakpoints_active(cpu) || | ||
642 | + hvf_arm_hw_debug_active(cpu); | ||
643 | + | ||
644 | + /* Update debug registers */ | ||
645 | + if (cpu->hvf->guest_debug_enabled) { | ||
646 | + hvf_put_gdbstub_debug_registers(cpu); | ||
647 | + } else { | ||
648 | + hvf_put_guest_debug_registers(cpu); | ||
649 | + } | ||
650 | + | ||
651 | + cpu_synchronize_state(cpu); | ||
652 | + | ||
653 | + /* Enable/disable single-stepping */ | ||
654 | + if (cpu->singlestep_enabled) { | ||
655 | + env->cp15.mdscr_el1 = | ||
656 | + deposit64(env->cp15.mdscr_el1, MDSCR_EL1_SS_SHIFT, 1, 1); | ||
657 | + pstate_write(env, pstate_read(env) | PSTATE_SS); | ||
658 | + } else { | ||
659 | + env->cp15.mdscr_el1 = | ||
660 | + deposit64(env->cp15.mdscr_el1, MDSCR_EL1_SS_SHIFT, 1, 0); | ||
661 | + } | ||
662 | + | ||
663 | + /* Enable/disable Breakpoint exceptions */ | ||
664 | + if (hvf_arm_hw_debug_active(cpu)) { | ||
665 | + env->cp15.mdscr_el1 = | ||
666 | + deposit64(env->cp15.mdscr_el1, MDSCR_EL1_MDE_SHIFT, 1, 1); | ||
667 | + } else { | ||
668 | + env->cp15.mdscr_el1 = | ||
669 | + deposit64(env->cp15.mdscr_el1, MDSCR_EL1_MDE_SHIFT, 1, 0); | ||
670 | + } | ||
671 | + | ||
672 | + hvf_arch_set_traps(); | ||
673 | +} | ||
674 | + | ||
675 | +inline bool hvf_arch_supports_guest_debug(void) | ||
676 | +{ | ||
677 | + return true; | ||
678 | +} | ||
679 | diff --git a/target/i386/hvf/hvf.c b/target/i386/hvf/hvf.c | ||
740 | index XXXXXXX..XXXXXXX 100644 | 680 | index XXXXXXX..XXXXXXX 100644 |
741 | --- a/target/arm/translate-sme.c | 681 | --- a/target/i386/hvf/hvf.c |
742 | +++ b/target/arm/translate-sme.c | 682 | +++ b/target/i386/hvf/hvf.c |
743 | @@ -XXX,XX +XXX,XX @@ static bool trans_MOVA(DisasContext *s, arg_MOVA *a) | 683 | @@ -XXX,XX +XXX,XX @@ int hvf_arch_remove_hw_breakpoint(target_ulong addr, target_ulong len, int type) |
744 | 684 | void hvf_arch_remove_all_hw_breakpoints(void) | |
745 | return true; | 685 | { |
746 | } | 686 | } |
747 | + | 687 | + |
748 | +static bool trans_LDST1(DisasContext *s, arg_LDST1 *a) | 688 | +void hvf_arch_update_guest_debug(CPUState *cpu) |
749 | +{ | 689 | +{ |
750 | + typedef void GenLdSt1(TCGv_env, TCGv_ptr, TCGv_ptr, TCGv, TCGv_i32); | 690 | +} |
751 | + | 691 | + |
752 | + /* | 692 | +inline bool hvf_arch_supports_guest_debug(void) |
753 | + * Indexed by [esz][be][v][mte][st], which is (except for load/store) | 693 | +{ |
754 | + * also the order in which the elements appear in the function names, | 694 | + return false; |
755 | + * and so how we must concatenate the pieces. | ||
756 | + */ | ||
757 | + | ||
758 | +#define FN_LS(F) { gen_helper_sme_ld1##F, gen_helper_sme_st1##F } | ||
759 | +#define FN_MTE(F) { FN_LS(F), FN_LS(F##_mte) } | ||
760 | +#define FN_HV(F) { FN_MTE(F##_h), FN_MTE(F##_v) } | ||
761 | +#define FN_END(L, B) { FN_HV(L), FN_HV(B) } | ||
762 | + | ||
763 | + static GenLdSt1 * const fns[5][2][2][2][2] = { | ||
764 | + FN_END(b, b), | ||
765 | + FN_END(h_le, h_be), | ||
766 | + FN_END(s_le, s_be), | ||
767 | + FN_END(d_le, d_be), | ||
768 | + FN_END(q_le, q_be), | ||
769 | + }; | ||
770 | + | ||
771 | +#undef FN_LS | ||
772 | +#undef FN_MTE | ||
773 | +#undef FN_HV | ||
774 | +#undef FN_END | ||
775 | + | ||
776 | + TCGv_ptr t_za, t_pg; | ||
777 | + TCGv_i64 addr; | ||
778 | + int svl, desc = 0; | ||
779 | + bool be = s->be_data == MO_BE; | ||
780 | + bool mte = s->mte_active[0]; | ||
781 | + | ||
782 | + if (!dc_isar_feature(aa64_sme, s)) { | ||
783 | + return false; | ||
784 | + } | ||
785 | + if (!sme_smza_enabled_check(s)) { | ||
786 | + return true; | ||
787 | + } | ||
788 | + | ||
789 | + t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v); | ||
790 | + t_pg = pred_full_reg_ptr(s, a->pg); | ||
791 | + addr = tcg_temp_new_i64(); | ||
792 | + | ||
793 | + tcg_gen_shli_i64(addr, cpu_reg(s, a->rm), a->esz); | ||
794 | + tcg_gen_add_i64(addr, addr, cpu_reg_sp(s, a->rn)); | ||
795 | + | ||
796 | + if (mte) { | ||
797 | + desc = FIELD_DP32(desc, MTEDESC, MIDX, get_mem_index(s)); | ||
798 | + desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); | ||
799 | + desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); | ||
800 | + desc = FIELD_DP32(desc, MTEDESC, WRITE, a->st); | ||
801 | + desc = FIELD_DP32(desc, MTEDESC, SIZEM1, (1 << a->esz) - 1); | ||
802 | + desc <<= SVE_MTEDESC_SHIFT; | ||
803 | + } else { | ||
804 | + addr = clean_data_tbi(s, addr); | ||
805 | + } | ||
806 | + svl = streaming_vec_reg_size(s); | ||
807 | + desc = simd_desc(svl, svl, desc); | ||
808 | + | ||
809 | + fns[a->esz][be][a->v][mte][a->st](cpu_env, t_za, t_pg, addr, | ||
810 | + tcg_constant_i32(desc)); | ||
811 | + | ||
812 | + tcg_temp_free_ptr(t_za); | ||
813 | + tcg_temp_free_ptr(t_pg); | ||
814 | + tcg_temp_free_i64(addr); | ||
815 | + return true; | ||
816 | +} | 695 | +} |
817 | -- | 696 | -- |
818 | 2.25.1 | 697 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Vikram Garhwal <vikram.garhwal@amd.com> |
---|---|---|---|
2 | 2 | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 3 | The Xilinx Versal CANFD controller is developed based on SocketCAN, QEMU CAN bus |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 4 | implementation. Bus connection and socketCAN connection for each CAN module |
5 | Message-id: 20220708151540.18136-24-richard.henderson@linaro.org | 5 | can be set through command lines. |
6 | |||
7 | Signed-off-by: Vikram Garhwal <vikram.garhwal@amd.com> | ||
8 | Reviewed-by: Francisco Iglesias <frasse.iglesias@gmail.com> | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 10 | --- |
8 | target/arm/helper-sme.h | 5 +++ | 11 | include/hw/net/xlnx-versal-canfd.h | 87 ++ |
9 | target/arm/sme.decode | 11 +++++ | 12 | hw/net/can/xlnx-versal-canfd.c | 2107 ++++++++++++++++++++++++++++ |
10 | target/arm/sme_helper.c | 90 ++++++++++++++++++++++++++++++++++++++ | 13 | hw/net/can/meson.build | 1 + |
11 | target/arm/translate-sme.c | 31 +++++++++++++ | 14 | hw/net/can/trace-events | 7 + |
12 | 4 files changed, 137 insertions(+) | 15 | 4 files changed, 2202 insertions(+) |
16 | create mode 100644 include/hw/net/xlnx-versal-canfd.h | ||
17 | create mode 100644 hw/net/can/xlnx-versal-canfd.c | ||
13 | 18 | ||
14 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 19 | diff --git a/include/hw/net/xlnx-versal-canfd.h b/include/hw/net/xlnx-versal-canfd.h |
15 | index XXXXXXX..XXXXXXX 100644 | 20 | new file mode 100644 |
16 | --- a/target/arm/helper-sme.h | 21 | index XXXXXXX..XXXXXXX |
17 | +++ b/target/arm/helper-sme.h | 22 | --- /dev/null |
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(sme_st1q_be_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i | 23 | +++ b/include/hw/net/xlnx-versal-canfd.h |
19 | DEF_HELPER_FLAGS_5(sme_st1q_le_h_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 24 | @@ -XXX,XX +XXX,XX @@ |
20 | DEF_HELPER_FLAGS_5(sme_st1q_be_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 25 | +/* |
21 | DEF_HELPER_FLAGS_5(sme_st1q_le_v_mte, TCG_CALL_NO_WG, void, env, ptr, ptr, tl, i32) | 26 | + * QEMU model of the Xilinx Versal CANFD Controller. |
22 | + | 27 | + * |
23 | +DEF_HELPER_FLAGS_5(sme_addha_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 28 | + * Copyright (c) 2023 Advanced Micro Devices, Inc. |
24 | +DEF_HELPER_FLAGS_5(sme_addva_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 29 | + * |
25 | +DEF_HELPER_FLAGS_5(sme_addha_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 30 | + * Written-by: Vikram Garhwal<vikram.garhwal@amd.com> |
26 | +DEF_HELPER_FLAGS_5(sme_addva_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 31 | + * Based on QEMU CANFD Device emulation implemented by Jin Yang, Deniz Eren and |
27 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | 32 | + * Pavel Pisa. |
28 | index XXXXXXX..XXXXXXX 100644 | 33 | + * Permission is hereby granted, free of charge, to any person obtaining a copy |
29 | --- a/target/arm/sme.decode | 34 | + * of this software and associated documentation files (the "Software"), to deal |
30 | +++ b/target/arm/sme.decode | 35 | + * in the Software without restriction, including without limitation the rights |
31 | @@ -XXX,XX +XXX,XX @@ LDST1 1110000 111 st:1 rm:5 v:1 .. pg:3 rn:5 0 za_imm:4 \ | 36 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell |
32 | 37 | + * copies of the Software, and to permit persons to whom the Software is | |
33 | LDR 1110000 100 0 000000 .. 000 ..... 0 .... @ldstr | 38 | + * furnished to do so, subject to the following conditions: |
34 | STR 1110000 100 1 000000 .. 000 ..... 0 .... @ldstr | 39 | + * |
35 | + | 40 | + * The above copyright notice and this permission notice shall be included in |
36 | +### SME Add Vector to Array | 41 | + * all copies or substantial portions of the Software. |
37 | + | 42 | + * |
38 | +&adda zad zn pm pn | 43 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
39 | +@adda_32 ........ .. ..... . pm:3 pn:3 zn:5 ... zad:2 &adda | 44 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
40 | +@adda_64 ........ .. ..... . pm:3 pn:3 zn:5 .. zad:3 &adda | 45 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
41 | + | 46 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
42 | +ADDHA_s 11000000 10 01000 0 ... ... ..... 000 .. @adda_32 | 47 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
43 | +ADDVA_s 11000000 10 01000 1 ... ... ..... 000 .. @adda_32 | 48 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN |
44 | +ADDHA_d 11000000 11 01000 0 ... ... ..... 00 ... @adda_64 | 49 | + * THE SOFTWARE. |
45 | +ADDVA_d 11000000 11 01000 1 ... ... ..... 00 ... @adda_64 | 50 | + */ |
46 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | 51 | + |
47 | index XXXXXXX..XXXXXXX 100644 | 52 | +#ifndef HW_CANFD_XILINX_H |
48 | --- a/target/arm/sme_helper.c | 53 | +#define HW_CANFD_XILINX_H |
49 | +++ b/target/arm/sme_helper.c | 54 | + |
50 | @@ -XXX,XX +XXX,XX @@ DO_ST(q, _be, MO_128) | 55 | +#include "hw/register.h" |
51 | DO_ST(q, _le, MO_128) | 56 | +#include "hw/ptimer.h" |
52 | 57 | +#include "net/can_emu.h" | |
53 | #undef DO_ST | 58 | +#include "hw/qdev-clock.h" |
54 | + | 59 | + |
55 | +void HELPER(sme_addha_s)(void *vzda, void *vzn, void *vpn, | 60 | +#define TYPE_XILINX_CANFD "xlnx.versal-canfd" |
56 | + void *vpm, uint32_t desc) | 61 | + |
57 | +{ | 62 | +OBJECT_DECLARE_SIMPLE_TYPE(XlnxVersalCANFDState, XILINX_CANFD) |
58 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 4; | 63 | + |
59 | + uint64_t *pn = vpn, *pm = vpm; | 64 | +#define NUM_REGS_PER_MSG_SPACE 18 /* 1 ID + 1 DLC + 16 Data(DW0 - DW15) regs. */ |
60 | + uint32_t *zda = vzda, *zn = vzn; | 65 | +#define MAX_NUM_RX 64 |
61 | + | 66 | +#define OFFSET_RX1_DW15 (0x4144 / 4) |
62 | + for (row = 0; row < oprsz; ) { | 67 | +#define CANFD_TIMER_MAX 0xFFFFUL |
63 | + uint64_t pa = pn[row >> 4]; | 68 | +#define CANFD_DEFAULT_CLOCK (25 * 1000 * 1000) |
64 | + do { | 69 | + |
65 | + if (pa & 1) { | 70 | +#define XLNX_VERSAL_CANFD_R_MAX (OFFSET_RX1_DW15 + \ |
66 | + for (col = 0; col < oprsz; ) { | 71 | + ((MAX_NUM_RX - 1) * NUM_REGS_PER_MSG_SPACE) + 1) |
67 | + uint64_t pb = pm[col >> 4]; | 72 | + |
68 | + do { | 73 | +typedef struct XlnxVersalCANFDState { |
69 | + if (pb & 1) { | 74 | + SysBusDevice parent_obj; |
70 | + zda[tile_vslice_index(row) + H4(col)] += zn[H4(col)]; | 75 | + MemoryRegion iomem; |
71 | + } | 76 | + |
72 | + pb >>= 4; | 77 | + qemu_irq irq_canfd_int; |
73 | + } while (++col & 15); | 78 | + qemu_irq irq_addr_err; |
79 | + | ||
80 | + RegisterInfo reg_info[XLNX_VERSAL_CANFD_R_MAX]; | ||
81 | + RegisterAccessInfo *tx_regs; | ||
82 | + RegisterAccessInfo *rx0_regs; | ||
83 | + RegisterAccessInfo *rx1_regs; | ||
84 | + RegisterAccessInfo *af_regs; | ||
85 | + RegisterAccessInfo *txe_regs; | ||
86 | + RegisterAccessInfo *rx_mailbox_regs; | ||
87 | + RegisterAccessInfo *af_mask_regs_mailbox; | ||
88 | + | ||
89 | + uint32_t regs[XLNX_VERSAL_CANFD_R_MAX]; | ||
90 | + | ||
91 | + ptimer_state *canfd_timer; | ||
92 | + | ||
93 | + CanBusClientState bus_client; | ||
94 | + CanBusState *canfdbus; | ||
95 | + | ||
96 | + struct { | ||
97 | + uint8_t rx0_fifo; | ||
98 | + uint8_t rx1_fifo; | ||
99 | + uint8_t tx_fifo; | ||
100 | + bool enable_rx_fifo1; | ||
101 | + uint32_t ext_clk_freq; | ||
102 | + } cfg; | ||
103 | + | ||
104 | +} XlnxVersalCANFDState; | ||
105 | + | ||
106 | +typedef struct tx_ready_reg_info { | ||
107 | + uint32_t can_id; | ||
108 | + uint32_t reg_num; | ||
109 | +} tx_ready_reg_info; | ||
110 | + | ||
111 | +#endif | ||
112 | diff --git a/hw/net/can/xlnx-versal-canfd.c b/hw/net/can/xlnx-versal-canfd.c | ||
113 | new file mode 100644 | ||
114 | index XXXXXXX..XXXXXXX | ||
115 | --- /dev/null | ||
116 | +++ b/hw/net/can/xlnx-versal-canfd.c | ||
117 | @@ -XXX,XX +XXX,XX @@ | ||
118 | +/* | ||
119 | + * QEMU model of the Xilinx Versal CANFD device. | ||
120 | + * | ||
121 | + * This implementation is based on the following datasheet: | ||
122 | + * https://docs.xilinx.com/v/u/2.0-English/pg223-canfd | ||
123 | + * | ||
124 | + * Copyright (c) 2023 Advanced Micro Devices, Inc. | ||
125 | + * | ||
126 | + * Written-by: Vikram Garhwal <vikram.garhwal@amd.com> | ||
127 | + * | ||
128 | + * Based on QEMU CANFD Device emulation implemented by Jin Yang, Deniz Eren and | ||
129 | + * Pavel Pisa | ||
130 | + * | ||
131 | + * Permission is hereby granted, free of charge, to any person obtaining a copy | ||
132 | + * of this software and associated documentation files (the "Software"), to deal | ||
133 | + * in the Software without restriction, including without limitation the rights | ||
134 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
135 | + * copies of the Software, and to permit persons to whom the Software is | ||
136 | + * furnished to do so, subject to the following conditions: | ||
137 | + * | ||
138 | + * The above copyright notice and this permission notice shall be included in | ||
139 | + * all copies or substantial portions of the Software. | ||
140 | + * | ||
141 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
142 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
143 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | ||
144 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
145 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
146 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
147 | + * THE SOFTWARE. | ||
148 | + */ | ||
149 | + | ||
150 | +#include "qemu/osdep.h" | ||
151 | +#include "hw/sysbus.h" | ||
152 | +#include "hw/irq.h" | ||
153 | +#include "hw/register.h" | ||
154 | +#include "qapi/error.h" | ||
155 | +#include "qemu/bitops.h" | ||
156 | +#include "qemu/log.h" | ||
157 | +#include "qemu/cutils.h" | ||
158 | +#include "qemu/event_notifier.h" | ||
159 | +#include "hw/qdev-properties.h" | ||
160 | +#include "qom/object_interfaces.h" | ||
161 | +#include "migration/vmstate.h" | ||
162 | +#include "hw/net/xlnx-versal-canfd.h" | ||
163 | +#include "trace.h" | ||
164 | + | ||
165 | +REG32(SOFTWARE_RESET_REGISTER, 0x0) | ||
166 | + FIELD(SOFTWARE_RESET_REGISTER, CEN, 1, 1) | ||
167 | + FIELD(SOFTWARE_RESET_REGISTER, SRST, 0, 1) | ||
168 | +REG32(MODE_SELECT_REGISTER, 0x4) | ||
169 | + FIELD(MODE_SELECT_REGISTER, ITO, 8, 8) | ||
170 | + FIELD(MODE_SELECT_REGISTER, ABR, 7, 1) | ||
171 | + FIELD(MODE_SELECT_REGISTER, SBR, 6, 1) | ||
172 | + FIELD(MODE_SELECT_REGISTER, DPEE, 5, 1) | ||
173 | + FIELD(MODE_SELECT_REGISTER, DAR, 4, 1) | ||
174 | + FIELD(MODE_SELECT_REGISTER, BRSD, 3, 1) | ||
175 | + FIELD(MODE_SELECT_REGISTER, SNOOP, 2, 1) | ||
176 | + FIELD(MODE_SELECT_REGISTER, LBACK, 1, 1) | ||
177 | + FIELD(MODE_SELECT_REGISTER, SLEEP, 0, 1) | ||
178 | +REG32(ARBITRATION_PHASE_BAUD_RATE_PRESCALER_REGISTER, 0x8) | ||
179 | + FIELD(ARBITRATION_PHASE_BAUD_RATE_PRESCALER_REGISTER, BRP, 0, 8) | ||
180 | +REG32(ARBITRATION_PHASE_BIT_TIMING_REGISTER, 0xc) | ||
181 | + FIELD(ARBITRATION_PHASE_BIT_TIMING_REGISTER, SJW, 16, 7) | ||
182 | + FIELD(ARBITRATION_PHASE_BIT_TIMING_REGISTER, TS2, 8, 7) | ||
183 | + FIELD(ARBITRATION_PHASE_BIT_TIMING_REGISTER, TS1, 0, 8) | ||
184 | +REG32(ERROR_COUNTER_REGISTER, 0x10) | ||
185 | + FIELD(ERROR_COUNTER_REGISTER, REC, 8, 8) | ||
186 | + FIELD(ERROR_COUNTER_REGISTER, TEC, 0, 8) | ||
187 | +REG32(ERROR_STATUS_REGISTER, 0x14) | ||
188 | + FIELD(ERROR_STATUS_REGISTER, F_BERR, 11, 1) | ||
189 | + FIELD(ERROR_STATUS_REGISTER, F_STER, 10, 1) | ||
190 | + FIELD(ERROR_STATUS_REGISTER, F_FMER, 9, 1) | ||
191 | + FIELD(ERROR_STATUS_REGISTER, F_CRCER, 8, 1) | ||
192 | + FIELD(ERROR_STATUS_REGISTER, ACKER, 4, 1) | ||
193 | + FIELD(ERROR_STATUS_REGISTER, BERR, 3, 1) | ||
194 | + FIELD(ERROR_STATUS_REGISTER, STER, 2, 1) | ||
195 | + FIELD(ERROR_STATUS_REGISTER, FMER, 1, 1) | ||
196 | + FIELD(ERROR_STATUS_REGISTER, CRCER, 0, 1) | ||
197 | +REG32(STATUS_REGISTER, 0x18) | ||
198 | + FIELD(STATUS_REGISTER, TDCV, 16, 7) | ||
199 | + FIELD(STATUS_REGISTER, SNOOP, 12, 1) | ||
200 | + FIELD(STATUS_REGISTER, BSFR_CONFIG, 10, 1) | ||
201 | + FIELD(STATUS_REGISTER, PEE_CONFIG, 9, 1) | ||
202 | + FIELD(STATUS_REGISTER, ESTAT, 7, 2) | ||
203 | + FIELD(STATUS_REGISTER, ERRWRN, 6, 1) | ||
204 | + FIELD(STATUS_REGISTER, BBSY, 5, 1) | ||
205 | + FIELD(STATUS_REGISTER, BIDLE, 4, 1) | ||
206 | + FIELD(STATUS_REGISTER, NORMAL, 3, 1) | ||
207 | + FIELD(STATUS_REGISTER, SLEEP, 2, 1) | ||
208 | + FIELD(STATUS_REGISTER, LBACK, 1, 1) | ||
209 | + FIELD(STATUS_REGISTER, CONFIG, 0, 1) | ||
210 | +REG32(INTERRUPT_STATUS_REGISTER, 0x1c) | ||
211 | + FIELD(INTERRUPT_STATUS_REGISTER, TXEWMFLL, 31, 1) | ||
212 | + FIELD(INTERRUPT_STATUS_REGISTER, TXEOFLW, 30, 1) | ||
213 | + FIELD(INTERRUPT_STATUS_REGISTER, RXBOFLW_BI, 24, 6) | ||
214 | + FIELD(INTERRUPT_STATUS_REGISTER, RXLRM_BI, 18, 6) | ||
215 | + FIELD(INTERRUPT_STATUS_REGISTER, RXMNF, 17, 1) | ||
216 | + FIELD(INTERRUPT_STATUS_REGISTER, RXFWMFLL_1, 16, 1) | ||
217 | + FIELD(INTERRUPT_STATUS_REGISTER, RXFOFLW_1, 15, 1) | ||
218 | + FIELD(INTERRUPT_STATUS_REGISTER, TXCRS, 14, 1) | ||
219 | + FIELD(INTERRUPT_STATUS_REGISTER, TXRRS, 13, 1) | ||
220 | + FIELD(INTERRUPT_STATUS_REGISTER, RXFWMFLL, 12, 1) | ||
221 | + FIELD(INTERRUPT_STATUS_REGISTER, WKUP, 11, 1) | ||
222 | + FIELD(INTERRUPT_STATUS_REGISTER, SLP, 10, 1) | ||
223 | + FIELD(INTERRUPT_STATUS_REGISTER, BSOFF, 9, 1) | ||
224 | + /* | ||
225 | + * In the original HW description below bit is named as ERROR but an ERROR | ||
226 | + * field name collides with a macro in Windows build. To avoid Windows build | ||
227 | + * failures, the bit is renamed to ERROR_BIT. | ||
228 | + */ | ||
229 | + FIELD(INTERRUPT_STATUS_REGISTER, ERROR_BIT, 8, 1) | ||
230 | + FIELD(INTERRUPT_STATUS_REGISTER, RXFOFLW, 6, 1) | ||
231 | + FIELD(INTERRUPT_STATUS_REGISTER, TSCNT_OFLW, 5, 1) | ||
232 | + FIELD(INTERRUPT_STATUS_REGISTER, RXOK, 4, 1) | ||
233 | + FIELD(INTERRUPT_STATUS_REGISTER, BSFRD, 3, 1) | ||
234 | + FIELD(INTERRUPT_STATUS_REGISTER, PEE, 2, 1) | ||
235 | + FIELD(INTERRUPT_STATUS_REGISTER, TXOK, 1, 1) | ||
236 | + FIELD(INTERRUPT_STATUS_REGISTER, ARBLST, 0, 1) | ||
237 | +REG32(INTERRUPT_ENABLE_REGISTER, 0x20) | ||
238 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETXEWMFLL, 31, 1) | ||
239 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETXEOFLW, 30, 1) | ||
240 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERXMNF, 17, 1) | ||
241 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERXFWMFLL_1, 16, 1) | ||
242 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERXFOFLW_1, 15, 1) | ||
243 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETXCRS, 14, 1) | ||
244 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETXRRS, 13, 1) | ||
245 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERXFWMFLL, 12, 1) | ||
246 | + FIELD(INTERRUPT_ENABLE_REGISTER, EWKUP, 11, 1) | ||
247 | + FIELD(INTERRUPT_ENABLE_REGISTER, ESLP, 10, 1) | ||
248 | + FIELD(INTERRUPT_ENABLE_REGISTER, EBSOFF, 9, 1) | ||
249 | + FIELD(INTERRUPT_ENABLE_REGISTER, EERROR, 8, 1) | ||
250 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERFXOFLW, 6, 1) | ||
251 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETSCNT_OFLW, 5, 1) | ||
252 | + FIELD(INTERRUPT_ENABLE_REGISTER, ERXOK, 4, 1) | ||
253 | + FIELD(INTERRUPT_ENABLE_REGISTER, EBSFRD, 3, 1) | ||
254 | + FIELD(INTERRUPT_ENABLE_REGISTER, EPEE, 2, 1) | ||
255 | + FIELD(INTERRUPT_ENABLE_REGISTER, ETXOK, 1, 1) | ||
256 | + FIELD(INTERRUPT_ENABLE_REGISTER, EARBLOST, 0, 1) | ||
257 | +REG32(INTERRUPT_CLEAR_REGISTER, 0x24) | ||
258 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTXEWMFLL, 31, 1) | ||
259 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTXEOFLW, 30, 1) | ||
260 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRXMNF, 17, 1) | ||
261 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRXFWMFLL_1, 16, 1) | ||
262 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRXFOFLW_1, 15, 1) | ||
263 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTXCRS, 14, 1) | ||
264 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTXRRS, 13, 1) | ||
265 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRXFWMFLL, 12, 1) | ||
266 | + FIELD(INTERRUPT_CLEAR_REGISTER, CWKUP, 11, 1) | ||
267 | + FIELD(INTERRUPT_CLEAR_REGISTER, CSLP, 10, 1) | ||
268 | + FIELD(INTERRUPT_CLEAR_REGISTER, CBSOFF, 9, 1) | ||
269 | + FIELD(INTERRUPT_CLEAR_REGISTER, CERROR, 8, 1) | ||
270 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRFXOFLW, 6, 1) | ||
271 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTSCNT_OFLW, 5, 1) | ||
272 | + FIELD(INTERRUPT_CLEAR_REGISTER, CRXOK, 4, 1) | ||
273 | + FIELD(INTERRUPT_CLEAR_REGISTER, CBSFRD, 3, 1) | ||
274 | + FIELD(INTERRUPT_CLEAR_REGISTER, CPEE, 2, 1) | ||
275 | + FIELD(INTERRUPT_CLEAR_REGISTER, CTXOK, 1, 1) | ||
276 | + FIELD(INTERRUPT_CLEAR_REGISTER, CARBLOST, 0, 1) | ||
277 | +REG32(TIMESTAMP_REGISTER, 0x28) | ||
278 | + FIELD(TIMESTAMP_REGISTER, TIMESTAMP_CNT, 16, 16) | ||
279 | + FIELD(TIMESTAMP_REGISTER, CTS, 0, 1) | ||
280 | +REG32(DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER, 0x88) | ||
281 | + FIELD(DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER, TDC, 16, 1) | ||
282 | + FIELD(DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER, TDCOFF, 8, 6) | ||
283 | + FIELD(DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER, DP_BRP, 0, 8) | ||
284 | +REG32(DATA_PHASE_BIT_TIMING_REGISTER, 0x8c) | ||
285 | + FIELD(DATA_PHASE_BIT_TIMING_REGISTER, DP_SJW, 16, 4) | ||
286 | + FIELD(DATA_PHASE_BIT_TIMING_REGISTER, DP_TS2, 8, 4) | ||
287 | + FIELD(DATA_PHASE_BIT_TIMING_REGISTER, DP_TS1, 0, 5) | ||
288 | +REG32(TX_BUFFER_READY_REQUEST_REGISTER, 0x90) | ||
289 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR31, 31, 1) | ||
290 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR30, 30, 1) | ||
291 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR29, 29, 1) | ||
292 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR28, 28, 1) | ||
293 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR27, 27, 1) | ||
294 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR26, 26, 1) | ||
295 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR25, 25, 1) | ||
296 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR24, 24, 1) | ||
297 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR23, 23, 1) | ||
298 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR22, 22, 1) | ||
299 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR21, 21, 1) | ||
300 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR20, 20, 1) | ||
301 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR19, 19, 1) | ||
302 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR18, 18, 1) | ||
303 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR17, 17, 1) | ||
304 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR16, 16, 1) | ||
305 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR15, 15, 1) | ||
306 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR14, 14, 1) | ||
307 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR13, 13, 1) | ||
308 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR12, 12, 1) | ||
309 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR11, 11, 1) | ||
310 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR10, 10, 1) | ||
311 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR9, 9, 1) | ||
312 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR8, 8, 1) | ||
313 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR7, 7, 1) | ||
314 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR6, 6, 1) | ||
315 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR5, 5, 1) | ||
316 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR4, 4, 1) | ||
317 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR3, 3, 1) | ||
318 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR2, 2, 1) | ||
319 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR1, 1, 1) | ||
320 | + FIELD(TX_BUFFER_READY_REQUEST_REGISTER, RR0, 0, 1) | ||
321 | +REG32(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, 0x94) | ||
322 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS31, 31, 1) | ||
323 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS30, 30, 1) | ||
324 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS29, 29, 1) | ||
325 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS28, 28, 1) | ||
326 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS27, 27, 1) | ||
327 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS26, 26, 1) | ||
328 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS25, 25, 1) | ||
329 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS24, 24, 1) | ||
330 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS23, 23, 1) | ||
331 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS22, 22, 1) | ||
332 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS21, 21, 1) | ||
333 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS20, 20, 1) | ||
334 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS19, 19, 1) | ||
335 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS18, 18, 1) | ||
336 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS17, 17, 1) | ||
337 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS16, 16, 1) | ||
338 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS15, 15, 1) | ||
339 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS14, 14, 1) | ||
340 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS13, 13, 1) | ||
341 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS12, 12, 1) | ||
342 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS11, 11, 1) | ||
343 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS10, 10, 1) | ||
344 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS9, 9, 1) | ||
345 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS8, 8, 1) | ||
346 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS7, 7, 1) | ||
347 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS6, 6, 1) | ||
348 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS5, 5, 1) | ||
349 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS4, 4, 1) | ||
350 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS3, 3, 1) | ||
351 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS2, 2, 1) | ||
352 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS1, 1, 1) | ||
353 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, ERRS0, 0, 1) | ||
354 | +REG32(TX_BUFFER_CANCEL_REQUEST_REGISTER, 0x98) | ||
355 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR31, 31, 1) | ||
356 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR30, 30, 1) | ||
357 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR29, 29, 1) | ||
358 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR28, 28, 1) | ||
359 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR27, 27, 1) | ||
360 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR26, 26, 1) | ||
361 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR25, 25, 1) | ||
362 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR24, 24, 1) | ||
363 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR23, 23, 1) | ||
364 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR22, 22, 1) | ||
365 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR21, 21, 1) | ||
366 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR20, 20, 1) | ||
367 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR19, 19, 1) | ||
368 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR18, 18, 1) | ||
369 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR17, 17, 1) | ||
370 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR16, 16, 1) | ||
371 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR15, 15, 1) | ||
372 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR14, 14, 1) | ||
373 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR13, 13, 1) | ||
374 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR12, 12, 1) | ||
375 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR11, 11, 1) | ||
376 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR10, 10, 1) | ||
377 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR9, 9, 1) | ||
378 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR8, 8, 1) | ||
379 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR7, 7, 1) | ||
380 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR6, 6, 1) | ||
381 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR5, 5, 1) | ||
382 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR4, 4, 1) | ||
383 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR3, 3, 1) | ||
384 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR2, 2, 1) | ||
385 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR1, 1, 1) | ||
386 | + FIELD(TX_BUFFER_CANCEL_REQUEST_REGISTER, CR0, 0, 1) | ||
387 | +REG32(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, 0x9c) | ||
388 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS31, 31, | ||
389 | + 1) | ||
390 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS30, 30, | ||
391 | + 1) | ||
392 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS29, 29, | ||
393 | + 1) | ||
394 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS28, 28, | ||
395 | + 1) | ||
396 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS27, 27, | ||
397 | + 1) | ||
398 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS26, 26, | ||
399 | + 1) | ||
400 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS25, 25, | ||
401 | + 1) | ||
402 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS24, 24, | ||
403 | + 1) | ||
404 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS23, 23, | ||
405 | + 1) | ||
406 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS22, 22, | ||
407 | + 1) | ||
408 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS21, 21, | ||
409 | + 1) | ||
410 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS20, 20, | ||
411 | + 1) | ||
412 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS19, 19, | ||
413 | + 1) | ||
414 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS18, 18, | ||
415 | + 1) | ||
416 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS17, 17, | ||
417 | + 1) | ||
418 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS16, 16, | ||
419 | + 1) | ||
420 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS15, 15, | ||
421 | + 1) | ||
422 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS14, 14, | ||
423 | + 1) | ||
424 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS13, 13, | ||
425 | + 1) | ||
426 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS12, 12, | ||
427 | + 1) | ||
428 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS11, 11, | ||
429 | + 1) | ||
430 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS10, 10, | ||
431 | + 1) | ||
432 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS9, 9, 1) | ||
433 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS8, 8, 1) | ||
434 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS7, 7, 1) | ||
435 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS6, 6, 1) | ||
436 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS5, 5, 1) | ||
437 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS4, 4, 1) | ||
438 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS3, 3, 1) | ||
439 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS2, 2, 1) | ||
440 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS1, 1, 1) | ||
441 | + FIELD(INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, ECRS0, 0, 1) | ||
442 | +REG32(TX_EVENT_FIFO_STATUS_REGISTER, 0xa0) | ||
443 | + FIELD(TX_EVENT_FIFO_STATUS_REGISTER, TXE_FL, 8, 6) | ||
444 | + FIELD(TX_EVENT_FIFO_STATUS_REGISTER, TXE_IRI, 7, 1) | ||
445 | + FIELD(TX_EVENT_FIFO_STATUS_REGISTER, TXE_RI, 0, 5) | ||
446 | +REG32(TX_EVENT_FIFO_WATERMARK_REGISTER, 0xa4) | ||
447 | + FIELD(TX_EVENT_FIFO_WATERMARK_REGISTER, TXE_FWM, 0, 5) | ||
448 | +REG32(ACCEPTANCE_FILTER_CONTROL_REGISTER, 0xe0) | ||
449 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF31, 31, 1) | ||
450 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF30, 30, 1) | ||
451 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF29, 29, 1) | ||
452 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF28, 28, 1) | ||
453 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF27, 27, 1) | ||
454 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF26, 26, 1) | ||
455 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF25, 25, 1) | ||
456 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF24, 24, 1) | ||
457 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF23, 23, 1) | ||
458 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF22, 22, 1) | ||
459 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF21, 21, 1) | ||
460 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF20, 20, 1) | ||
461 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF19, 19, 1) | ||
462 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF18, 18, 1) | ||
463 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF17, 17, 1) | ||
464 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF16, 16, 1) | ||
465 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF15, 15, 1) | ||
466 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF14, 14, 1) | ||
467 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF13, 13, 1) | ||
468 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF12, 12, 1) | ||
469 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF11, 11, 1) | ||
470 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF10, 10, 1) | ||
471 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF9, 9, 1) | ||
472 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF8, 8, 1) | ||
473 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF7, 7, 1) | ||
474 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF6, 6, 1) | ||
475 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF5, 5, 1) | ||
476 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF4, 4, 1) | ||
477 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF3, 3, 1) | ||
478 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF2, 2, 1) | ||
479 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF1, 1, 1) | ||
480 | + FIELD(ACCEPTANCE_FILTER_CONTROL_REGISTER, UAF0, 0, 1) | ||
481 | +REG32(RX_FIFO_STATUS_REGISTER, 0xe8) | ||
482 | + FIELD(RX_FIFO_STATUS_REGISTER, FL_1, 24, 7) | ||
483 | + FIELD(RX_FIFO_STATUS_REGISTER, IRI_1, 23, 1) | ||
484 | + FIELD(RX_FIFO_STATUS_REGISTER, RI_1, 16, 6) | ||
485 | + FIELD(RX_FIFO_STATUS_REGISTER, FL, 8, 7) | ||
486 | + FIELD(RX_FIFO_STATUS_REGISTER, IRI, 7, 1) | ||
487 | + FIELD(RX_FIFO_STATUS_REGISTER, RI, 0, 6) | ||
488 | +REG32(RX_FIFO_WATERMARK_REGISTER, 0xec) | ||
489 | + FIELD(RX_FIFO_WATERMARK_REGISTER, RXFP, 16, 5) | ||
490 | + FIELD(RX_FIFO_WATERMARK_REGISTER, RXFWM_1, 8, 6) | ||
491 | + FIELD(RX_FIFO_WATERMARK_REGISTER, RXFWM, 0, 6) | ||
492 | +REG32(TB_ID_REGISTER, 0x100) | ||
493 | + FIELD(TB_ID_REGISTER, ID, 21, 11) | ||
494 | + FIELD(TB_ID_REGISTER, SRR_RTR_RRS, 20, 1) | ||
495 | + FIELD(TB_ID_REGISTER, IDE, 19, 1) | ||
496 | + FIELD(TB_ID_REGISTER, ID_EXT, 1, 18) | ||
497 | + FIELD(TB_ID_REGISTER, RTR_RRS, 0, 1) | ||
498 | +REG32(TB0_DLC_REGISTER, 0x104) | ||
499 | + FIELD(TB0_DLC_REGISTER, DLC, 28, 4) | ||
500 | + FIELD(TB0_DLC_REGISTER, FDF, 27, 1) | ||
501 | + FIELD(TB0_DLC_REGISTER, BRS, 26, 1) | ||
502 | + FIELD(TB0_DLC_REGISTER, RSVD2, 25, 1) | ||
503 | + FIELD(TB0_DLC_REGISTER, EFC, 24, 1) | ||
504 | + FIELD(TB0_DLC_REGISTER, MM, 16, 8) | ||
505 | + FIELD(TB0_DLC_REGISTER, RSVD1, 0, 16) | ||
506 | +REG32(TB_DW0_REGISTER, 0x108) | ||
507 | + FIELD(TB_DW0_REGISTER, DATA_BYTES0, 24, 8) | ||
508 | + FIELD(TB_DW0_REGISTER, DATA_BYTES1, 16, 8) | ||
509 | + FIELD(TB_DW0_REGISTER, DATA_BYTES2, 8, 8) | ||
510 | + FIELD(TB_DW0_REGISTER, DATA_BYTES3, 0, 8) | ||
511 | +REG32(TB_DW1_REGISTER, 0x10c) | ||
512 | + FIELD(TB_DW1_REGISTER, DATA_BYTES4, 24, 8) | ||
513 | + FIELD(TB_DW1_REGISTER, DATA_BYTES5, 16, 8) | ||
514 | + FIELD(TB_DW1_REGISTER, DATA_BYTES6, 8, 8) | ||
515 | + FIELD(TB_DW1_REGISTER, DATA_BYTES7, 0, 8) | ||
516 | +REG32(TB_DW2_REGISTER, 0x110) | ||
517 | + FIELD(TB_DW2_REGISTER, DATA_BYTES8, 24, 8) | ||
518 | + FIELD(TB_DW2_REGISTER, DATA_BYTES9, 16, 8) | ||
519 | + FIELD(TB_DW2_REGISTER, DATA_BYTES10, 8, 8) | ||
520 | + FIELD(TB_DW2_REGISTER, DATA_BYTES11, 0, 8) | ||
521 | +REG32(TB_DW3_REGISTER, 0x114) | ||
522 | + FIELD(TB_DW3_REGISTER, DATA_BYTES12, 24, 8) | ||
523 | + FIELD(TB_DW3_REGISTER, DATA_BYTES13, 16, 8) | ||
524 | + FIELD(TB_DW3_REGISTER, DATA_BYTES14, 8, 8) | ||
525 | + FIELD(TB_DW3_REGISTER, DATA_BYTES15, 0, 8) | ||
526 | +REG32(TB_DW4_REGISTER, 0x118) | ||
527 | + FIELD(TB_DW4_REGISTER, DATA_BYTES16, 24, 8) | ||
528 | + FIELD(TB_DW4_REGISTER, DATA_BYTES17, 16, 8) | ||
529 | + FIELD(TB_DW4_REGISTER, DATA_BYTES18, 8, 8) | ||
530 | + FIELD(TB_DW4_REGISTER, DATA_BYTES19, 0, 8) | ||
531 | +REG32(TB_DW5_REGISTER, 0x11c) | ||
532 | + FIELD(TB_DW5_REGISTER, DATA_BYTES20, 24, 8) | ||
533 | + FIELD(TB_DW5_REGISTER, DATA_BYTES21, 16, 8) | ||
534 | + FIELD(TB_DW5_REGISTER, DATA_BYTES22, 8, 8) | ||
535 | + FIELD(TB_DW5_REGISTER, DATA_BYTES23, 0, 8) | ||
536 | +REG32(TB_DW6_REGISTER, 0x120) | ||
537 | + FIELD(TB_DW6_REGISTER, DATA_BYTES24, 24, 8) | ||
538 | + FIELD(TB_DW6_REGISTER, DATA_BYTES25, 16, 8) | ||
539 | + FIELD(TB_DW6_REGISTER, DATA_BYTES26, 8, 8) | ||
540 | + FIELD(TB_DW6_REGISTER, DATA_BYTES27, 0, 8) | ||
541 | +REG32(TB_DW7_REGISTER, 0x124) | ||
542 | + FIELD(TB_DW7_REGISTER, DATA_BYTES28, 24, 8) | ||
543 | + FIELD(TB_DW7_REGISTER, DATA_BYTES29, 16, 8) | ||
544 | + FIELD(TB_DW7_REGISTER, DATA_BYTES30, 8, 8) | ||
545 | + FIELD(TB_DW7_REGISTER, DATA_BYTES31, 0, 8) | ||
546 | +REG32(TB_DW8_REGISTER, 0x128) | ||
547 | + FIELD(TB_DW8_REGISTER, DATA_BYTES32, 24, 8) | ||
548 | + FIELD(TB_DW8_REGISTER, DATA_BYTES33, 16, 8) | ||
549 | + FIELD(TB_DW8_REGISTER, DATA_BYTES34, 8, 8) | ||
550 | + FIELD(TB_DW8_REGISTER, DATA_BYTES35, 0, 8) | ||
551 | +REG32(TB_DW9_REGISTER, 0x12c) | ||
552 | + FIELD(TB_DW9_REGISTER, DATA_BYTES36, 24, 8) | ||
553 | + FIELD(TB_DW9_REGISTER, DATA_BYTES37, 16, 8) | ||
554 | + FIELD(TB_DW9_REGISTER, DATA_BYTES38, 8, 8) | ||
555 | + FIELD(TB_DW9_REGISTER, DATA_BYTES39, 0, 8) | ||
556 | +REG32(TB_DW10_REGISTER, 0x130) | ||
557 | + FIELD(TB_DW10_REGISTER, DATA_BYTES40, 24, 8) | ||
558 | + FIELD(TB_DW10_REGISTER, DATA_BYTES41, 16, 8) | ||
559 | + FIELD(TB_DW10_REGISTER, DATA_BYTES42, 8, 8) | ||
560 | + FIELD(TB_DW10_REGISTER, DATA_BYTES43, 0, 8) | ||
561 | +REG32(TB_DW11_REGISTER, 0x134) | ||
562 | + FIELD(TB_DW11_REGISTER, DATA_BYTES44, 24, 8) | ||
563 | + FIELD(TB_DW11_REGISTER, DATA_BYTES45, 16, 8) | ||
564 | + FIELD(TB_DW11_REGISTER, DATA_BYTES46, 8, 8) | ||
565 | + FIELD(TB_DW11_REGISTER, DATA_BYTES47, 0, 8) | ||
566 | +REG32(TB_DW12_REGISTER, 0x138) | ||
567 | + FIELD(TB_DW12_REGISTER, DATA_BYTES48, 24, 8) | ||
568 | + FIELD(TB_DW12_REGISTER, DATA_BYTES49, 16, 8) | ||
569 | + FIELD(TB_DW12_REGISTER, DATA_BYTES50, 8, 8) | ||
570 | + FIELD(TB_DW12_REGISTER, DATA_BYTES51, 0, 8) | ||
571 | +REG32(TB_DW13_REGISTER, 0x13c) | ||
572 | + FIELD(TB_DW13_REGISTER, DATA_BYTES52, 24, 8) | ||
573 | + FIELD(TB_DW13_REGISTER, DATA_BYTES53, 16, 8) | ||
574 | + FIELD(TB_DW13_REGISTER, DATA_BYTES54, 8, 8) | ||
575 | + FIELD(TB_DW13_REGISTER, DATA_BYTES55, 0, 8) | ||
576 | +REG32(TB_DW14_REGISTER, 0x140) | ||
577 | + FIELD(TB_DW14_REGISTER, DATA_BYTES56, 24, 8) | ||
578 | + FIELD(TB_DW14_REGISTER, DATA_BYTES57, 16, 8) | ||
579 | + FIELD(TB_DW14_REGISTER, DATA_BYTES58, 8, 8) | ||
580 | + FIELD(TB_DW14_REGISTER, DATA_BYTES59, 0, 8) | ||
581 | +REG32(TB_DW15_REGISTER, 0x144) | ||
582 | + FIELD(TB_DW15_REGISTER, DATA_BYTES60, 24, 8) | ||
583 | + FIELD(TB_DW15_REGISTER, DATA_BYTES61, 16, 8) | ||
584 | + FIELD(TB_DW15_REGISTER, DATA_BYTES62, 8, 8) | ||
585 | + FIELD(TB_DW15_REGISTER, DATA_BYTES63, 0, 8) | ||
586 | +REG32(AFMR_REGISTER, 0xa00) | ||
587 | + FIELD(AFMR_REGISTER, AMID, 21, 11) | ||
588 | + FIELD(AFMR_REGISTER, AMSRR, 20, 1) | ||
589 | + FIELD(AFMR_REGISTER, AMIDE, 19, 1) | ||
590 | + FIELD(AFMR_REGISTER, AMID_EXT, 1, 18) | ||
591 | + FIELD(AFMR_REGISTER, AMRTR, 0, 1) | ||
592 | +REG32(AFIR_REGISTER, 0xa04) | ||
593 | + FIELD(AFIR_REGISTER, AIID, 21, 11) | ||
594 | + FIELD(AFIR_REGISTER, AISRR, 20, 1) | ||
595 | + FIELD(AFIR_REGISTER, AIIDE, 19, 1) | ||
596 | + FIELD(AFIR_REGISTER, AIID_EXT, 1, 18) | ||
597 | + FIELD(AFIR_REGISTER, AIRTR, 0, 1) | ||
598 | +REG32(TXE_FIFO_TB_ID_REGISTER, 0x2000) | ||
599 | + FIELD(TXE_FIFO_TB_ID_REGISTER, ID, 21, 11) | ||
600 | + FIELD(TXE_FIFO_TB_ID_REGISTER, SRR_RTR_RRS, 20, 1) | ||
601 | + FIELD(TXE_FIFO_TB_ID_REGISTER, IDE, 19, 1) | ||
602 | + FIELD(TXE_FIFO_TB_ID_REGISTER, ID_EXT, 1, 18) | ||
603 | + FIELD(TXE_FIFO_TB_ID_REGISTER, RTR_RRS, 0, 1) | ||
604 | +REG32(TXE_FIFO_TB_DLC_REGISTER, 0x2004) | ||
605 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, DLC, 28, 4) | ||
606 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, FDF, 27, 1) | ||
607 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, BRS, 26, 1) | ||
608 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, ET, 24, 2) | ||
609 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, MM, 16, 8) | ||
610 | + FIELD(TXE_FIFO_TB_DLC_REGISTER, TIMESTAMP, 0, 16) | ||
611 | +REG32(RB_ID_REGISTER, 0x2100) | ||
612 | + FIELD(RB_ID_REGISTER, ID, 21, 11) | ||
613 | + FIELD(RB_ID_REGISTER, SRR_RTR_RRS, 20, 1) | ||
614 | + FIELD(RB_ID_REGISTER, IDE, 19, 1) | ||
615 | + FIELD(RB_ID_REGISTER, ID_EXT, 1, 18) | ||
616 | + FIELD(RB_ID_REGISTER, RTR_RRS, 0, 1) | ||
617 | +REG32(RB_DLC_REGISTER, 0x2104) | ||
618 | + FIELD(RB_DLC_REGISTER, DLC, 28, 4) | ||
619 | + FIELD(RB_DLC_REGISTER, FDF, 27, 1) | ||
620 | + FIELD(RB_DLC_REGISTER, BRS, 26, 1) | ||
621 | + FIELD(RB_DLC_REGISTER, ESI, 25, 1) | ||
622 | + FIELD(RB_DLC_REGISTER, MATCHED_FILTER_INDEX, 16, 5) | ||
623 | + FIELD(RB_DLC_REGISTER, TIMESTAMP, 0, 16) | ||
624 | +REG32(RB_DW0_REGISTER, 0x2108) | ||
625 | + FIELD(RB_DW0_REGISTER, DATA_BYTES0, 24, 8) | ||
626 | + FIELD(RB_DW0_REGISTER, DATA_BYTES1, 16, 8) | ||
627 | + FIELD(RB_DW0_REGISTER, DATA_BYTES2, 8, 8) | ||
628 | + FIELD(RB_DW0_REGISTER, DATA_BYTES3, 0, 8) | ||
629 | +REG32(RB_DW1_REGISTER, 0x210c) | ||
630 | + FIELD(RB_DW1_REGISTER, DATA_BYTES4, 24, 8) | ||
631 | + FIELD(RB_DW1_REGISTER, DATA_BYTES5, 16, 8) | ||
632 | + FIELD(RB_DW1_REGISTER, DATA_BYTES6, 8, 8) | ||
633 | + FIELD(RB_DW1_REGISTER, DATA_BYTES7, 0, 8) | ||
634 | +REG32(RB_DW2_REGISTER, 0x2110) | ||
635 | + FIELD(RB_DW2_REGISTER, DATA_BYTES8, 24, 8) | ||
636 | + FIELD(RB_DW2_REGISTER, DATA_BYTES9, 16, 8) | ||
637 | + FIELD(RB_DW2_REGISTER, DATA_BYTES10, 8, 8) | ||
638 | + FIELD(RB_DW2_REGISTER, DATA_BYTES11, 0, 8) | ||
639 | +REG32(RB_DW3_REGISTER, 0x2114) | ||
640 | + FIELD(RB_DW3_REGISTER, DATA_BYTES12, 24, 8) | ||
641 | + FIELD(RB_DW3_REGISTER, DATA_BYTES13, 16, 8) | ||
642 | + FIELD(RB_DW3_REGISTER, DATA_BYTES14, 8, 8) | ||
643 | + FIELD(RB_DW3_REGISTER, DATA_BYTES15, 0, 8) | ||
644 | +REG32(RB_DW4_REGISTER, 0x2118) | ||
645 | + FIELD(RB_DW4_REGISTER, DATA_BYTES16, 24, 8) | ||
646 | + FIELD(RB_DW4_REGISTER, DATA_BYTES17, 16, 8) | ||
647 | + FIELD(RB_DW4_REGISTER, DATA_BYTES18, 8, 8) | ||
648 | + FIELD(RB_DW4_REGISTER, DATA_BYTES19, 0, 8) | ||
649 | +REG32(RB_DW5_REGISTER, 0x211c) | ||
650 | + FIELD(RB_DW5_REGISTER, DATA_BYTES20, 24, 8) | ||
651 | + FIELD(RB_DW5_REGISTER, DATA_BYTES21, 16, 8) | ||
652 | + FIELD(RB_DW5_REGISTER, DATA_BYTES22, 8, 8) | ||
653 | + FIELD(RB_DW5_REGISTER, DATA_BYTES23, 0, 8) | ||
654 | +REG32(RB_DW6_REGISTER, 0x2120) | ||
655 | + FIELD(RB_DW6_REGISTER, DATA_BYTES24, 24, 8) | ||
656 | + FIELD(RB_DW6_REGISTER, DATA_BYTES25, 16, 8) | ||
657 | + FIELD(RB_DW6_REGISTER, DATA_BYTES26, 8, 8) | ||
658 | + FIELD(RB_DW6_REGISTER, DATA_BYTES27, 0, 8) | ||
659 | +REG32(RB_DW7_REGISTER, 0x2124) | ||
660 | + FIELD(RB_DW7_REGISTER, DATA_BYTES28, 24, 8) | ||
661 | + FIELD(RB_DW7_REGISTER, DATA_BYTES29, 16, 8) | ||
662 | + FIELD(RB_DW7_REGISTER, DATA_BYTES30, 8, 8) | ||
663 | + FIELD(RB_DW7_REGISTER, DATA_BYTES31, 0, 8) | ||
664 | +REG32(RB_DW8_REGISTER, 0x2128) | ||
665 | + FIELD(RB_DW8_REGISTER, DATA_BYTES32, 24, 8) | ||
666 | + FIELD(RB_DW8_REGISTER, DATA_BYTES33, 16, 8) | ||
667 | + FIELD(RB_DW8_REGISTER, DATA_BYTES34, 8, 8) | ||
668 | + FIELD(RB_DW8_REGISTER, DATA_BYTES35, 0, 8) | ||
669 | +REG32(RB_DW9_REGISTER, 0x212c) | ||
670 | + FIELD(RB_DW9_REGISTER, DATA_BYTES36, 24, 8) | ||
671 | + FIELD(RB_DW9_REGISTER, DATA_BYTES37, 16, 8) | ||
672 | + FIELD(RB_DW9_REGISTER, DATA_BYTES38, 8, 8) | ||
673 | + FIELD(RB_DW9_REGISTER, DATA_BYTES39, 0, 8) | ||
674 | +REG32(RB_DW10_REGISTER, 0x2130) | ||
675 | + FIELD(RB_DW10_REGISTER, DATA_BYTES40, 24, 8) | ||
676 | + FIELD(RB_DW10_REGISTER, DATA_BYTES41, 16, 8) | ||
677 | + FIELD(RB_DW10_REGISTER, DATA_BYTES42, 8, 8) | ||
678 | + FIELD(RB_DW10_REGISTER, DATA_BYTES43, 0, 8) | ||
679 | +REG32(RB_DW11_REGISTER, 0x2134) | ||
680 | + FIELD(RB_DW11_REGISTER, DATA_BYTES44, 24, 8) | ||
681 | + FIELD(RB_DW11_REGISTER, DATA_BYTES45, 16, 8) | ||
682 | + FIELD(RB_DW11_REGISTER, DATA_BYTES46, 8, 8) | ||
683 | + FIELD(RB_DW11_REGISTER, DATA_BYTES47, 0, 8) | ||
684 | +REG32(RB_DW12_REGISTER, 0x2138) | ||
685 | + FIELD(RB_DW12_REGISTER, DATA_BYTES48, 24, 8) | ||
686 | + FIELD(RB_DW12_REGISTER, DATA_BYTES49, 16, 8) | ||
687 | + FIELD(RB_DW12_REGISTER, DATA_BYTES50, 8, 8) | ||
688 | + FIELD(RB_DW12_REGISTER, DATA_BYTES51, 0, 8) | ||
689 | +REG32(RB_DW13_REGISTER, 0x213c) | ||
690 | + FIELD(RB_DW13_REGISTER, DATA_BYTES52, 24, 8) | ||
691 | + FIELD(RB_DW13_REGISTER, DATA_BYTES53, 16, 8) | ||
692 | + FIELD(RB_DW13_REGISTER, DATA_BYTES54, 8, 8) | ||
693 | + FIELD(RB_DW13_REGISTER, DATA_BYTES55, 0, 8) | ||
694 | +REG32(RB_DW14_REGISTER, 0x2140) | ||
695 | + FIELD(RB_DW14_REGISTER, DATA_BYTES56, 24, 8) | ||
696 | + FIELD(RB_DW14_REGISTER, DATA_BYTES57, 16, 8) | ||
697 | + FIELD(RB_DW14_REGISTER, DATA_BYTES58, 8, 8) | ||
698 | + FIELD(RB_DW14_REGISTER, DATA_BYTES59, 0, 8) | ||
699 | +REG32(RB_DW15_REGISTER, 0x2144) | ||
700 | + FIELD(RB_DW15_REGISTER, DATA_BYTES60, 24, 8) | ||
701 | + FIELD(RB_DW15_REGISTER, DATA_BYTES61, 16, 8) | ||
702 | + FIELD(RB_DW15_REGISTER, DATA_BYTES62, 8, 8) | ||
703 | + FIELD(RB_DW15_REGISTER, DATA_BYTES63, 0, 8) | ||
704 | +REG32(RB_ID_REGISTER_1, 0x4100) | ||
705 | + FIELD(RB_ID_REGISTER_1, ID, 21, 11) | ||
706 | + FIELD(RB_ID_REGISTER_1, SRR_RTR_RRS, 20, 1) | ||
707 | + FIELD(RB_ID_REGISTER_1, IDE, 19, 1) | ||
708 | + FIELD(RB_ID_REGISTER_1, ID_EXT, 1, 18) | ||
709 | + FIELD(RB_ID_REGISTER_1, RTR_RRS, 0, 1) | ||
710 | +REG32(RB_DLC_REGISTER_1, 0x4104) | ||
711 | + FIELD(RB_DLC_REGISTER_1, DLC, 28, 4) | ||
712 | + FIELD(RB_DLC_REGISTER_1, FDF, 27, 1) | ||
713 | + FIELD(RB_DLC_REGISTER_1, BRS, 26, 1) | ||
714 | + FIELD(RB_DLC_REGISTER_1, ESI, 25, 1) | ||
715 | + FIELD(RB_DLC_REGISTER_1, MATCHED_FILTER_INDEX, 16, 5) | ||
716 | + FIELD(RB_DLC_REGISTER_1, TIMESTAMP, 0, 16) | ||
717 | +REG32(RB0_DW0_REGISTER_1, 0x4108) | ||
718 | + FIELD(RB0_DW0_REGISTER_1, DATA_BYTES0, 24, 8) | ||
719 | + FIELD(RB0_DW0_REGISTER_1, DATA_BYTES1, 16, 8) | ||
720 | + FIELD(RB0_DW0_REGISTER_1, DATA_BYTES2, 8, 8) | ||
721 | + FIELD(RB0_DW0_REGISTER_1, DATA_BYTES3, 0, 8) | ||
722 | +REG32(RB_DW1_REGISTER_1, 0x410c) | ||
723 | + FIELD(RB_DW1_REGISTER_1, DATA_BYTES4, 24, 8) | ||
724 | + FIELD(RB_DW1_REGISTER_1, DATA_BYTES5, 16, 8) | ||
725 | + FIELD(RB_DW1_REGISTER_1, DATA_BYTES6, 8, 8) | ||
726 | + FIELD(RB_DW1_REGISTER_1, DATA_BYTES7, 0, 8) | ||
727 | +REG32(RB_DW2_REGISTER_1, 0x4110) | ||
728 | + FIELD(RB_DW2_REGISTER_1, DATA_BYTES8, 24, 8) | ||
729 | + FIELD(RB_DW2_REGISTER_1, DATA_BYTES9, 16, 8) | ||
730 | + FIELD(RB_DW2_REGISTER_1, DATA_BYTES10, 8, 8) | ||
731 | + FIELD(RB_DW2_REGISTER_1, DATA_BYTES11, 0, 8) | ||
732 | +REG32(RB_DW3_REGISTER_1, 0x4114) | ||
733 | + FIELD(RB_DW3_REGISTER_1, DATA_BYTES12, 24, 8) | ||
734 | + FIELD(RB_DW3_REGISTER_1, DATA_BYTES13, 16, 8) | ||
735 | + FIELD(RB_DW3_REGISTER_1, DATA_BYTES14, 8, 8) | ||
736 | + FIELD(RB_DW3_REGISTER_1, DATA_BYTES15, 0, 8) | ||
737 | +REG32(RB_DW4_REGISTER_1, 0x4118) | ||
738 | + FIELD(RB_DW4_REGISTER_1, DATA_BYTES16, 24, 8) | ||
739 | + FIELD(RB_DW4_REGISTER_1, DATA_BYTES17, 16, 8) | ||
740 | + FIELD(RB_DW4_REGISTER_1, DATA_BYTES18, 8, 8) | ||
741 | + FIELD(RB_DW4_REGISTER_1, DATA_BYTES19, 0, 8) | ||
742 | +REG32(RB_DW5_REGISTER_1, 0x411c) | ||
743 | + FIELD(RB_DW5_REGISTER_1, DATA_BYTES20, 24, 8) | ||
744 | + FIELD(RB_DW5_REGISTER_1, DATA_BYTES21, 16, 8) | ||
745 | + FIELD(RB_DW5_REGISTER_1, DATA_BYTES22, 8, 8) | ||
746 | + FIELD(RB_DW5_REGISTER_1, DATA_BYTES23, 0, 8) | ||
747 | +REG32(RB_DW6_REGISTER_1, 0x4120) | ||
748 | + FIELD(RB_DW6_REGISTER_1, DATA_BYTES24, 24, 8) | ||
749 | + FIELD(RB_DW6_REGISTER_1, DATA_BYTES25, 16, 8) | ||
750 | + FIELD(RB_DW6_REGISTER_1, DATA_BYTES26, 8, 8) | ||
751 | + FIELD(RB_DW6_REGISTER_1, DATA_BYTES27, 0, 8) | ||
752 | +REG32(RB_DW7_REGISTER_1, 0x4124) | ||
753 | + FIELD(RB_DW7_REGISTER_1, DATA_BYTES28, 24, 8) | ||
754 | + FIELD(RB_DW7_REGISTER_1, DATA_BYTES29, 16, 8) | ||
755 | + FIELD(RB_DW7_REGISTER_1, DATA_BYTES30, 8, 8) | ||
756 | + FIELD(RB_DW7_REGISTER_1, DATA_BYTES31, 0, 8) | ||
757 | +REG32(RB_DW8_REGISTER_1, 0x4128) | ||
758 | + FIELD(RB_DW8_REGISTER_1, DATA_BYTES32, 24, 8) | ||
759 | + FIELD(RB_DW8_REGISTER_1, DATA_BYTES33, 16, 8) | ||
760 | + FIELD(RB_DW8_REGISTER_1, DATA_BYTES34, 8, 8) | ||
761 | + FIELD(RB_DW8_REGISTER_1, DATA_BYTES35, 0, 8) | ||
762 | +REG32(RB_DW9_REGISTER_1, 0x412c) | ||
763 | + FIELD(RB_DW9_REGISTER_1, DATA_BYTES36, 24, 8) | ||
764 | + FIELD(RB_DW9_REGISTER_1, DATA_BYTES37, 16, 8) | ||
765 | + FIELD(RB_DW9_REGISTER_1, DATA_BYTES38, 8, 8) | ||
766 | + FIELD(RB_DW9_REGISTER_1, DATA_BYTES39, 0, 8) | ||
767 | +REG32(RB_DW10_REGISTER_1, 0x4130) | ||
768 | + FIELD(RB_DW10_REGISTER_1, DATA_BYTES40, 24, 8) | ||
769 | + FIELD(RB_DW10_REGISTER_1, DATA_BYTES41, 16, 8) | ||
770 | + FIELD(RB_DW10_REGISTER_1, DATA_BYTES42, 8, 8) | ||
771 | + FIELD(RB_DW10_REGISTER_1, DATA_BYTES43, 0, 8) | ||
772 | +REG32(RB_DW11_REGISTER_1, 0x4134) | ||
773 | + FIELD(RB_DW11_REGISTER_1, DATA_BYTES44, 24, 8) | ||
774 | + FIELD(RB_DW11_REGISTER_1, DATA_BYTES45, 16, 8) | ||
775 | + FIELD(RB_DW11_REGISTER_1, DATA_BYTES46, 8, 8) | ||
776 | + FIELD(RB_DW11_REGISTER_1, DATA_BYTES47, 0, 8) | ||
777 | +REG32(RB_DW12_REGISTER_1, 0x4138) | ||
778 | + FIELD(RB_DW12_REGISTER_1, DATA_BYTES48, 24, 8) | ||
779 | + FIELD(RB_DW12_REGISTER_1, DATA_BYTES49, 16, 8) | ||
780 | + FIELD(RB_DW12_REGISTER_1, DATA_BYTES50, 8, 8) | ||
781 | + FIELD(RB_DW12_REGISTER_1, DATA_BYTES51, 0, 8) | ||
782 | +REG32(RB_DW13_REGISTER_1, 0x413c) | ||
783 | + FIELD(RB_DW13_REGISTER_1, DATA_BYTES52, 24, 8) | ||
784 | + FIELD(RB_DW13_REGISTER_1, DATA_BYTES53, 16, 8) | ||
785 | + FIELD(RB_DW13_REGISTER_1, DATA_BYTES54, 8, 8) | ||
786 | + FIELD(RB_DW13_REGISTER_1, DATA_BYTES55, 0, 8) | ||
787 | +REG32(RB_DW14_REGISTER_1, 0x4140) | ||
788 | + FIELD(RB_DW14_REGISTER_1, DATA_BYTES56, 24, 8) | ||
789 | + FIELD(RB_DW14_REGISTER_1, DATA_BYTES57, 16, 8) | ||
790 | + FIELD(RB_DW14_REGISTER_1, DATA_BYTES58, 8, 8) | ||
791 | + FIELD(RB_DW14_REGISTER_1, DATA_BYTES59, 0, 8) | ||
792 | +REG32(RB_DW15_REGISTER_1, 0x4144) | ||
793 | + FIELD(RB_DW15_REGISTER_1, DATA_BYTES60, 24, 8) | ||
794 | + FIELD(RB_DW15_REGISTER_1, DATA_BYTES61, 16, 8) | ||
795 | + FIELD(RB_DW15_REGISTER_1, DATA_BYTES62, 8, 8) | ||
796 | + FIELD(RB_DW15_REGISTER_1, DATA_BYTES63, 0, 8) | ||
797 | + | ||
798 | +static uint8_t canfd_dlc_array[8] = {8, 12, 16, 20, 24, 32, 48, 64}; | ||
799 | + | ||
800 | +static void canfd_update_irq(XlnxVersalCANFDState *s) | ||
801 | +{ | ||
802 | + unsigned int irq = s->regs[R_INTERRUPT_STATUS_REGISTER] & | ||
803 | + s->regs[R_INTERRUPT_ENABLE_REGISTER]; | ||
804 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
805 | + | ||
806 | + /* RX watermark interrupts. */ | ||
807 | + if (ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, FL) > | ||
808 | + ARRAY_FIELD_EX32(s->regs, RX_FIFO_WATERMARK_REGISTER, RXFWM)) { | ||
809 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFWMFLL, 1); | ||
810 | + } | ||
811 | + | ||
812 | + if (ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, FL_1) > | ||
813 | + ARRAY_FIELD_EX32(s->regs, RX_FIFO_WATERMARK_REGISTER, RXFWM_1)) { | ||
814 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFWMFLL_1, 1); | ||
815 | + } | ||
816 | + | ||
817 | + /* TX watermark interrupt. */ | ||
818 | + if (ARRAY_FIELD_EX32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, TXE_FL) > | ||
819 | + ARRAY_FIELD_EX32(s->regs, TX_EVENT_FIFO_WATERMARK_REGISTER, TXE_FWM)) { | ||
820 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TXEWMFLL, 1); | ||
821 | + } | ||
822 | + | ||
823 | + trace_xlnx_canfd_update_irq(path, s->regs[R_INTERRUPT_STATUS_REGISTER], | ||
824 | + s->regs[R_INTERRUPT_ENABLE_REGISTER], irq); | ||
825 | + | ||
826 | + qemu_set_irq(s->irq_canfd_int, irq); | ||
827 | +} | ||
828 | + | ||
829 | +static void canfd_ier_post_write(RegisterInfo *reg, uint64_t val64) | ||
830 | +{ | ||
831 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
832 | + | ||
833 | + canfd_update_irq(s); | ||
834 | +} | ||
835 | + | ||
836 | +static uint64_t canfd_icr_pre_write(RegisterInfo *reg, uint64_t val64) | ||
837 | +{ | ||
838 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
839 | + uint32_t val = val64; | ||
840 | + | ||
841 | + s->regs[R_INTERRUPT_STATUS_REGISTER] &= ~val; | ||
842 | + | ||
843 | + /* | ||
844 | + * RXBOFLW_BI field is automatically cleared to default if RXBOFLW bit is | ||
845 | + * cleared in ISR. | ||
846 | + */ | ||
847 | + if (ARRAY_FIELD_EX32(s->regs, INTERRUPT_STATUS_REGISTER, RXFWMFLL_1)) { | ||
848 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXBOFLW_BI, 0); | ||
849 | + } | ||
850 | + | ||
851 | + canfd_update_irq(s); | ||
852 | + | ||
853 | + return 0; | ||
854 | +} | ||
855 | + | ||
856 | +static void canfd_config_reset(XlnxVersalCANFDState *s) | ||
857 | +{ | ||
858 | + | ||
859 | + unsigned int i; | ||
860 | + | ||
861 | + /* Reset all the configuration registers. */ | ||
862 | + for (i = 0; i < R_RX_FIFO_WATERMARK_REGISTER; ++i) { | ||
863 | + register_reset(&s->reg_info[i]); | ||
864 | + } | ||
865 | + | ||
866 | + canfd_update_irq(s); | ||
867 | +} | ||
868 | + | ||
869 | +static void canfd_config_mode(XlnxVersalCANFDState *s) | ||
870 | +{ | ||
871 | + register_reset(&s->reg_info[R_ERROR_COUNTER_REGISTER]); | ||
872 | + register_reset(&s->reg_info[R_ERROR_STATUS_REGISTER]); | ||
873 | + register_reset(&s->reg_info[R_STATUS_REGISTER]); | ||
874 | + | ||
875 | + /* Put XlnxVersalCANFDState in configuration mode. */ | ||
876 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, CONFIG, 1); | ||
877 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, WKUP, 0); | ||
878 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, SLP, 0); | ||
879 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, BSOFF, 0); | ||
880 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, ERROR_BIT, 0); | ||
881 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFOFLW, 0); | ||
882 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFOFLW_1, 0); | ||
883 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXOK, 0); | ||
884 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TXOK, 0); | ||
885 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, ARBLST, 0); | ||
886 | + | ||
887 | + /* Clear the time stamp. */ | ||
888 | + ptimer_transaction_begin(s->canfd_timer); | ||
889 | + ptimer_set_count(s->canfd_timer, 0); | ||
890 | + ptimer_transaction_commit(s->canfd_timer); | ||
891 | + | ||
892 | + canfd_update_irq(s); | ||
893 | +} | ||
894 | + | ||
895 | +static void update_status_register_mode_bits(XlnxVersalCANFDState *s) | ||
896 | +{ | ||
897 | + bool sleep_status = ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, SLEEP); | ||
898 | + bool sleep_mode = ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, SLEEP); | ||
899 | + /* Wake up interrupt bit. */ | ||
900 | + bool wakeup_irq_val = !sleep_mode && sleep_status; | ||
901 | + /* Sleep interrupt bit. */ | ||
902 | + bool sleep_irq_val = sleep_mode && !sleep_status; | ||
903 | + | ||
904 | + /* Clear previous core mode status bits. */ | ||
905 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, LBACK, 0); | ||
906 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, SLEEP, 0); | ||
907 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, SNOOP, 0); | ||
908 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, NORMAL, 0); | ||
909 | + | ||
910 | + /* set current mode bit and generate irqs accordingly. */ | ||
911 | + if (ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, LBACK)) { | ||
912 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, LBACK, 1); | ||
913 | + } else if (ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, SLEEP)) { | ||
914 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, SLEEP, 1); | ||
915 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, SLP, | ||
916 | + sleep_irq_val); | ||
917 | + } else if (ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, SNOOP)) { | ||
918 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, SNOOP, 1); | ||
919 | + } else { | ||
920 | + /* If all bits are zero, XlnxVersalCANFDState is set in normal mode. */ | ||
921 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, NORMAL, 1); | ||
922 | + /* Set wakeup interrupt bit. */ | ||
923 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, WKUP, | ||
924 | + wakeup_irq_val); | ||
925 | + } | ||
926 | + | ||
927 | + /* Put the CANFD in error active state. */ | ||
928 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, ESTAT, 1); | ||
929 | + | ||
930 | + canfd_update_irq(s); | ||
931 | +} | ||
932 | + | ||
933 | +static uint64_t canfd_msr_pre_write(RegisterInfo *reg, uint64_t val64) | ||
934 | +{ | ||
935 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
936 | + uint32_t val = val64; | ||
937 | + uint8_t multi_mode = 0; | ||
938 | + | ||
939 | + /* | ||
940 | + * Multiple mode set check. This is done to make sure user doesn't set | ||
941 | + * multiple modes. | ||
942 | + */ | ||
943 | + multi_mode = FIELD_EX32(val, MODE_SELECT_REGISTER, LBACK) + | ||
944 | + FIELD_EX32(val, MODE_SELECT_REGISTER, SLEEP) + | ||
945 | + FIELD_EX32(val, MODE_SELECT_REGISTER, SNOOP); | ||
946 | + | ||
947 | + if (multi_mode > 1) { | ||
948 | + qemu_log_mask(LOG_GUEST_ERROR, "Attempting to configure several modes" | ||
949 | + " simultaneously. One mode will be selected according to" | ||
950 | + " their priority: LBACK > SLEEP > SNOOP.\n"); | ||
951 | + } | ||
952 | + | ||
953 | + if (ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, CEN) == 0) { | ||
954 | + /* In configuration mode, any mode can be selected. */ | ||
955 | + s->regs[R_MODE_SELECT_REGISTER] = val; | ||
956 | + } else { | ||
957 | + bool sleep_mode_bit = FIELD_EX32(val, MODE_SELECT_REGISTER, SLEEP); | ||
958 | + | ||
959 | + ARRAY_FIELD_DP32(s->regs, MODE_SELECT_REGISTER, SLEEP, sleep_mode_bit); | ||
960 | + | ||
961 | + if (FIELD_EX32(val, MODE_SELECT_REGISTER, LBACK)) { | ||
962 | + qemu_log_mask(LOG_GUEST_ERROR, "Attempting to set LBACK mode" | ||
963 | + " without setting CEN bit as 0\n"); | ||
964 | + } else if (FIELD_EX32(val, MODE_SELECT_REGISTER, SNOOP)) { | ||
965 | + qemu_log_mask(LOG_GUEST_ERROR, "Attempting to set SNOOP mode" | ||
966 | + " without setting CEN bit as 0\n"); | ||
967 | + } | ||
968 | + | ||
969 | + update_status_register_mode_bits(s); | ||
970 | + } | ||
971 | + | ||
972 | + return s->regs[R_MODE_SELECT_REGISTER]; | ||
973 | +} | ||
974 | + | ||
975 | +static void canfd_exit_sleep_mode(XlnxVersalCANFDState *s) | ||
976 | +{ | ||
977 | + ARRAY_FIELD_DP32(s->regs, MODE_SELECT_REGISTER, SLEEP, 0); | ||
978 | + update_status_register_mode_bits(s); | ||
979 | +} | ||
980 | + | ||
981 | +static void regs2frame(XlnxVersalCANFDState *s, qemu_can_frame *frame, | ||
982 | + uint32_t reg_num) | ||
983 | +{ | ||
984 | + uint32_t i = 0; | ||
985 | + uint32_t j = 0; | ||
986 | + uint32_t val = 0; | ||
987 | + uint32_t dlc_reg_val = 0; | ||
988 | + uint32_t dlc_value = 0; | ||
989 | + | ||
990 | + /* Check that reg_num should be within TX register space. */ | ||
991 | + assert(reg_num <= R_TB_ID_REGISTER + (NUM_REGS_PER_MSG_SPACE * | ||
992 | + s->cfg.tx_fifo)); | ||
993 | + | ||
994 | + dlc_reg_val = s->regs[reg_num + 1]; | ||
995 | + dlc_value = FIELD_EX32(dlc_reg_val, TB0_DLC_REGISTER, DLC); | ||
996 | + | ||
997 | + frame->can_id = s->regs[reg_num]; | ||
998 | + | ||
999 | + if (FIELD_EX32(dlc_reg_val, TB0_DLC_REGISTER, FDF)) { | ||
1000 | + /* | ||
1001 | + * CANFD frame. | ||
1002 | + * Converting dlc(0 to 15) 4 Byte data to plain length(i.e. 0 to 64) | ||
1003 | + * 1 Byte data. This is done to make it work with SocketCAN. | ||
1004 | + * On actual CANFD frame, this value can't be more than 0xF. | ||
1005 | + * Conversion table for DLC to plain length: | ||
1006 | + * | ||
1007 | + * DLC Plain Length | ||
1008 | + * 0 - 8 0 - 8 | ||
1009 | + * 9 9 - 12 | ||
1010 | + * 10 13 - 16 | ||
1011 | + * 11 17 - 20 | ||
1012 | + * 12 21 - 24 | ||
1013 | + * 13 25 - 32 | ||
1014 | + * 14 33 - 48 | ||
1015 | + * 15 49 - 64 | ||
1016 | + */ | ||
1017 | + | ||
1018 | + frame->flags = QEMU_CAN_FRMF_TYPE_FD; | ||
1019 | + | ||
1020 | + if (dlc_value < 8) { | ||
1021 | + frame->can_dlc = dlc_value; | ||
1022 | + } else { | ||
1023 | + assert((dlc_value - 8) < ARRAY_SIZE(canfd_dlc_array)); | ||
1024 | + frame->can_dlc = canfd_dlc_array[dlc_value - 8]; | ||
1025 | + } | ||
1026 | + } else { | ||
1027 | + /* | ||
1028 | + * FD Format bit not set that means it is a CAN Frame. | ||
1029 | + * Conversion table for classic CAN: | ||
1030 | + * | ||
1031 | + * DLC Plain Length | ||
1032 | + * 0 - 7 0 - 7 | ||
1033 | + * 8 - 15 8 | ||
1034 | + */ | ||
1035 | + | ||
1036 | + if (dlc_value > 8) { | ||
1037 | + frame->can_dlc = 8; | ||
1038 | + qemu_log_mask(LOG_GUEST_ERROR, "Maximum DLC value for Classic CAN" | ||
1039 | + " frame is 8. Only 8 byte data will be sent.\n"); | ||
1040 | + } else { | ||
1041 | + frame->can_dlc = dlc_value; | ||
1042 | + } | ||
1043 | + } | ||
1044 | + | ||
1045 | + for (j = 0; j < frame->can_dlc; j++) { | ||
1046 | + val = 8 * i; | ||
1047 | + | ||
1048 | + frame->data[j] = extract32(s->regs[reg_num + 2 + (j / 4)], val, 8); | ||
1049 | + i++; | ||
1050 | + | ||
1051 | + if (i % 4 == 0) { | ||
1052 | + i = 0; | ||
1053 | + } | ||
1054 | + } | ||
1055 | +} | ||
1056 | + | ||
1057 | +static void process_cancellation_requests(XlnxVersalCANFDState *s) | ||
1058 | +{ | ||
1059 | + uint32_t clear_mask = s->regs[R_TX_BUFFER_READY_REQUEST_REGISTER] & | ||
1060 | + s->regs[R_TX_BUFFER_CANCEL_REQUEST_REGISTER]; | ||
1061 | + | ||
1062 | + s->regs[R_TX_BUFFER_READY_REQUEST_REGISTER] &= ~clear_mask; | ||
1063 | + s->regs[R_TX_BUFFER_CANCEL_REQUEST_REGISTER] &= ~clear_mask; | ||
1064 | + | ||
1065 | + canfd_update_irq(s); | ||
1066 | +} | ||
1067 | + | ||
1068 | +static void store_rx_sequential(XlnxVersalCANFDState *s, | ||
1069 | + const qemu_can_frame *frame, | ||
1070 | + uint32_t fill_level, uint32_t read_index, | ||
1071 | + uint32_t store_location, uint8_t rx_fifo, | ||
1072 | + bool rx_fifo_id, uint8_t filter_index) | ||
1073 | +{ | ||
1074 | + int i; | ||
1075 | + bool is_canfd_frame; | ||
1076 | + uint8_t dlc = frame->can_dlc; | ||
1077 | + uint8_t rx_reg_num = 0; | ||
1078 | + uint32_t dlc_reg_val = 0; | ||
1079 | + uint32_t data_reg_val = 0; | ||
1080 | + | ||
1081 | + /* Getting RX0/1 fill level */ | ||
1082 | + if ((fill_level) > rx_fifo - 1) { | ||
1083 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1084 | + | ||
1085 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: RX%d Buffer is full. Discarding the" | ||
1086 | + " message\n", path, rx_fifo_id); | ||
1087 | + | ||
1088 | + /* Set the corresponding RF buffer overflow interrupt. */ | ||
1089 | + if (rx_fifo_id == 0) { | ||
1090 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFOFLW, 1); | ||
1091 | + } else { | ||
1092 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXFOFLW_1, 1); | ||
1093 | + } | ||
1094 | + } else { | ||
1095 | + uint16_t rx_timestamp = CANFD_TIMER_MAX - | ||
1096 | + ptimer_get_count(s->canfd_timer); | ||
1097 | + | ||
1098 | + if (rx_timestamp == 0xFFFF) { | ||
1099 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TSCNT_OFLW, 1); | ||
1100 | + } else { | ||
1101 | + ARRAY_FIELD_DP32(s->regs, TIMESTAMP_REGISTER, TIMESTAMP_CNT, | ||
1102 | + rx_timestamp); | ||
1103 | + } | ||
1104 | + | ||
1105 | + if (rx_fifo_id == 0) { | ||
1106 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, FL, | ||
1107 | + fill_level + 1); | ||
1108 | + assert(store_location <= | ||
1109 | + R_RB_ID_REGISTER + (s->cfg.rx0_fifo * | ||
1110 | + NUM_REGS_PER_MSG_SPACE)); | ||
1111 | + } else { | ||
1112 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, FL_1, | ||
1113 | + fill_level + 1); | ||
1114 | + assert(store_location <= | ||
1115 | + R_RB_ID_REGISTER_1 + (s->cfg.rx1_fifo * | ||
1116 | + NUM_REGS_PER_MSG_SPACE)); | ||
1117 | + } | ||
1118 | + | ||
1119 | + s->regs[store_location] = frame->can_id; | ||
1120 | + | ||
1121 | + dlc = frame->can_dlc; | ||
1122 | + | ||
1123 | + if (frame->flags == QEMU_CAN_FRMF_TYPE_FD) { | ||
1124 | + is_canfd_frame = true; | ||
1125 | + | ||
1126 | + /* Store dlc value in Xilinx specific format. */ | ||
1127 | + for (i = 0; i < ARRAY_SIZE(canfd_dlc_array); i++) { | ||
1128 | + if (canfd_dlc_array[i] == frame->can_dlc) { | ||
1129 | + dlc_reg_val = FIELD_DP32(0, RB_DLC_REGISTER, DLC, 8 + i); | ||
74 | + } | 1130 | + } |
75 | + } | 1131 | + } |
76 | + pa >>= 4; | 1132 | + } else { |
77 | + } while (++row & 15); | 1133 | + is_canfd_frame = false; |
78 | + } | 1134 | + |
79 | +} | 1135 | + if (frame->can_dlc > 8) { |
80 | + | 1136 | + dlc = 8; |
81 | +void HELPER(sme_addha_d)(void *vzda, void *vzn, void *vpn, | 1137 | + } |
82 | + void *vpm, uint32_t desc) | 1138 | + |
83 | +{ | 1139 | + dlc_reg_val = FIELD_DP32(0, RB_DLC_REGISTER, DLC, dlc); |
84 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 8; | 1140 | + } |
85 | + uint8_t *pn = vpn, *pm = vpm; | 1141 | + |
86 | + uint64_t *zda = vzda, *zn = vzn; | 1142 | + dlc_reg_val |= FIELD_DP32(0, RB_DLC_REGISTER, FDF, is_canfd_frame); |
87 | + | 1143 | + dlc_reg_val |= FIELD_DP32(0, RB_DLC_REGISTER, TIMESTAMP, rx_timestamp); |
88 | + for (row = 0; row < oprsz; ++row) { | 1144 | + dlc_reg_val |= FIELD_DP32(0, RB_DLC_REGISTER, MATCHED_FILTER_INDEX, |
89 | + if (pn[H1(row)] & 1) { | 1145 | + filter_index); |
90 | + for (col = 0; col < oprsz; ++col) { | 1146 | + s->regs[store_location + 1] = dlc_reg_val; |
91 | + if (pm[H1(col)] & 1) { | 1147 | + |
92 | + zda[tile_vslice_index(row) + col] += zn[col]; | 1148 | + for (i = 0; i < dlc; i++) { |
1149 | + /* Register size is 4 byte but frame->data each is 1 byte. */ | ||
1150 | + switch (i % 4) { | ||
1151 | + case 0: | ||
1152 | + rx_reg_num = i / 4; | ||
1153 | + | ||
1154 | + data_reg_val = FIELD_DP32(0, RB_DW0_REGISTER, DATA_BYTES3, | ||
1155 | + frame->data[i]); | ||
1156 | + break; | ||
1157 | + case 1: | ||
1158 | + data_reg_val |= FIELD_DP32(0, RB_DW0_REGISTER, DATA_BYTES2, | ||
1159 | + frame->data[i]); | ||
1160 | + break; | ||
1161 | + case 2: | ||
1162 | + data_reg_val |= FIELD_DP32(0, RB_DW0_REGISTER, DATA_BYTES1, | ||
1163 | + frame->data[i]); | ||
1164 | + break; | ||
1165 | + case 3: | ||
1166 | + data_reg_val |= FIELD_DP32(0, RB_DW0_REGISTER, DATA_BYTES0, | ||
1167 | + frame->data[i]); | ||
1168 | + /* | ||
1169 | + * Last Bytes data which means we have all 4 bytes ready to | ||
1170 | + * store in one rx regs. | ||
1171 | + */ | ||
1172 | + s->regs[store_location + rx_reg_num + 2] = data_reg_val; | ||
1173 | + break; | ||
1174 | + } | ||
1175 | + } | ||
1176 | + | ||
1177 | + if (i % 4) { | ||
1178 | + /* | ||
1179 | + * In case DLC is not multiplier of 4, data is not saved to RX FIFO | ||
1180 | + * in above switch case. Store the remaining bytes here. | ||
1181 | + */ | ||
1182 | + s->regs[store_location + rx_reg_num + 2] = data_reg_val; | ||
1183 | + } | ||
1184 | + | ||
1185 | + /* set the interrupt as RXOK. */ | ||
1186 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXOK, 1); | ||
1187 | + } | ||
1188 | +} | ||
1189 | + | ||
1190 | +static void update_rx_sequential(XlnxVersalCANFDState *s, | ||
1191 | + const qemu_can_frame *frame) | ||
1192 | +{ | ||
1193 | + bool filter_pass = false; | ||
1194 | + uint8_t filter_index = 0; | ||
1195 | + int i; | ||
1196 | + int filter_partition = ARRAY_FIELD_EX32(s->regs, | ||
1197 | + RX_FIFO_WATERMARK_REGISTER, RXFP); | ||
1198 | + uint32_t store_location; | ||
1199 | + uint32_t fill_level; | ||
1200 | + uint32_t read_index; | ||
1201 | + uint8_t store_index = 0; | ||
1202 | + g_autofree char *path = NULL; | ||
1203 | + /* | ||
1204 | + * If all UAF bits are set to 0, then received messages are not stored | ||
1205 | + * in the RX buffers. | ||
1206 | + */ | ||
1207 | + if (s->regs[R_ACCEPTANCE_FILTER_CONTROL_REGISTER]) { | ||
1208 | + uint32_t acceptance_filter_status = | ||
1209 | + s->regs[R_ACCEPTANCE_FILTER_CONTROL_REGISTER]; | ||
1210 | + | ||
1211 | + for (i = 0; i < 32; i++) { | ||
1212 | + if (acceptance_filter_status & 0x1) { | ||
1213 | + uint32_t msg_id_masked = s->regs[R_AFMR_REGISTER + 2 * i] & | ||
1214 | + frame->can_id; | ||
1215 | + uint32_t afir_id_masked = s->regs[R_AFIR_REGISTER + 2 * i] & | ||
1216 | + s->regs[R_AFMR_REGISTER + 2 * i]; | ||
1217 | + uint16_t std_msg_id_masked = FIELD_EX32(msg_id_masked, | ||
1218 | + AFIR_REGISTER, AIID); | ||
1219 | + uint16_t std_afir_id_masked = FIELD_EX32(afir_id_masked, | ||
1220 | + AFIR_REGISTER, AIID); | ||
1221 | + uint32_t ext_msg_id_masked = FIELD_EX32(msg_id_masked, | ||
1222 | + AFIR_REGISTER, | ||
1223 | + AIID_EXT); | ||
1224 | + uint32_t ext_afir_id_masked = FIELD_EX32(afir_id_masked, | ||
1225 | + AFIR_REGISTER, | ||
1226 | + AIID_EXT); | ||
1227 | + bool ext_ide = FIELD_EX32(s->regs[R_AFMR_REGISTER + 2 * i], | ||
1228 | + AFMR_REGISTER, AMIDE); | ||
1229 | + | ||
1230 | + if (std_msg_id_masked == std_afir_id_masked) { | ||
1231 | + if (ext_ide) { | ||
1232 | + /* Extended message ID message. */ | ||
1233 | + if (ext_msg_id_masked == ext_afir_id_masked) { | ||
1234 | + filter_pass = true; | ||
1235 | + filter_index = i; | ||
1236 | + | ||
1237 | + break; | ||
1238 | + } | ||
1239 | + } else { | ||
1240 | + /* Standard message ID. */ | ||
1241 | + filter_pass = true; | ||
1242 | + filter_index = i; | ||
1243 | + | ||
1244 | + break; | ||
1245 | + } | ||
93 | + } | 1246 | + } |
94 | + } | 1247 | + } |
1248 | + acceptance_filter_status >>= 1; | ||
95 | + } | 1249 | + } |
96 | + } | 1250 | + } |
97 | +} | 1251 | + |
98 | + | 1252 | + if (!filter_pass) { |
99 | +void HELPER(sme_addva_s)(void *vzda, void *vzn, void *vpn, | 1253 | + path = object_get_canonical_path(OBJECT(s)); |
100 | + void *vpm, uint32_t desc) | 1254 | + |
101 | +{ | 1255 | + trace_xlnx_canfd_rx_fifo_filter_reject(path, frame->can_id, |
102 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 4; | 1256 | + frame->can_dlc); |
103 | + uint64_t *pn = vpn, *pm = vpm; | 1257 | + } else { |
104 | + uint32_t *zda = vzda, *zn = vzn; | 1258 | + if (filter_index <= filter_partition) { |
105 | + | 1259 | + fill_level = ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, FL); |
106 | + for (row = 0; row < oprsz; ) { | 1260 | + read_index = ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, RI); |
107 | + uint64_t pa = pn[row >> 4]; | 1261 | + store_index = read_index + fill_level; |
108 | + do { | 1262 | + |
109 | + if (pa & 1) { | 1263 | + if (read_index == s->cfg.rx0_fifo - 1) { |
110 | + uint32_t zn_row = zn[H4(row)]; | 1264 | + /* |
111 | + for (col = 0; col < oprsz; ) { | 1265 | + * When ri is s->cfg.rx0_fifo - 1 i.e. max, it goes cyclic that |
112 | + uint64_t pb = pm[col >> 4]; | 1266 | + * means we reset the ri to 0x0. |
113 | + do { | 1267 | + */ |
114 | + if (pb & 1) { | 1268 | + read_index = 0; |
115 | + zda[tile_vslice_index(row) + H4(col)] += zn_row; | 1269 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, RI, |
116 | + } | 1270 | + read_index); |
117 | + pb >>= 4; | ||
118 | + } while (++col & 15); | ||
119 | + } | ||
120 | + } | 1271 | + } |
121 | + pa >>= 4; | 1272 | + |
122 | + } while (++row & 15); | 1273 | + if (store_index > s->cfg.rx0_fifo - 1) { |
123 | + } | 1274 | + store_index -= s->cfg.rx0_fifo - 1; |
124 | +} | 1275 | + } |
125 | + | 1276 | + |
126 | +void HELPER(sme_addva_d)(void *vzda, void *vzn, void *vpn, | 1277 | + store_location = R_RB_ID_REGISTER + |
127 | + void *vpm, uint32_t desc) | 1278 | + (store_index * NUM_REGS_PER_MSG_SPACE); |
128 | +{ | 1279 | + |
129 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 8; | 1280 | + store_rx_sequential(s, frame, fill_level, read_index, |
130 | + uint8_t *pn = vpn, *pm = vpm; | 1281 | + store_location, s->cfg.rx0_fifo, 0, |
131 | + uint64_t *zda = vzda, *zn = vzn; | 1282 | + filter_index); |
132 | + | 1283 | + } else { |
133 | + for (row = 0; row < oprsz; ++row) { | 1284 | + /* RX 1 fill level message */ |
134 | + if (pn[H1(row)] & 1) { | 1285 | + fill_level = ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, |
135 | + uint64_t zn_row = zn[row]; | 1286 | + FL_1); |
136 | + for (col = 0; col < oprsz; ++col) { | 1287 | + read_index = ARRAY_FIELD_EX32(s->regs, RX_FIFO_STATUS_REGISTER, |
137 | + if (pm[H1(col)] & 1) { | 1288 | + RI_1); |
138 | + zda[tile_vslice_index(row) + col] += zn_row; | 1289 | + store_index = read_index + fill_level; |
139 | + } | 1290 | + |
1291 | + if (read_index == s->cfg.rx1_fifo - 1) { | ||
1292 | + /* | ||
1293 | + * When ri is s->cfg.rx1_fifo - 1 i.e. max, it goes cyclic that | ||
1294 | + * means we reset the ri to 0x0. | ||
1295 | + */ | ||
1296 | + read_index = 0; | ||
1297 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, RI_1, | ||
1298 | + read_index); | ||
1299 | + } | ||
1300 | + | ||
1301 | + if (store_index > s->cfg.rx1_fifo - 1) { | ||
1302 | + store_index -= s->cfg.rx1_fifo - 1; | ||
1303 | + } | ||
1304 | + | ||
1305 | + store_location = R_RB_ID_REGISTER_1 + | ||
1306 | + (store_index * NUM_REGS_PER_MSG_SPACE); | ||
1307 | + | ||
1308 | + store_rx_sequential(s, frame, fill_level, read_index, | ||
1309 | + store_location, s->cfg.rx1_fifo, 1, | ||
1310 | + filter_index); | ||
1311 | + } | ||
1312 | + | ||
1313 | + path = object_get_canonical_path(OBJECT(s)); | ||
1314 | + | ||
1315 | + trace_xlnx_canfd_rx_data(path, frame->can_id, frame->can_dlc, | ||
1316 | + frame->flags); | ||
1317 | + canfd_update_irq(s); | ||
1318 | + } | ||
1319 | +} | ||
1320 | + | ||
1321 | +static bool tx_ready_check(XlnxVersalCANFDState *s) | ||
1322 | +{ | ||
1323 | + if (ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, SRST)) { | ||
1324 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1325 | + | ||
1326 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Attempting to transfer data while" | ||
1327 | + " XlnxVersalCANFDState is in reset mode\n", path); | ||
1328 | + | ||
1329 | + return false; | ||
1330 | + } | ||
1331 | + | ||
1332 | + if (ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, CEN) == 0) { | ||
1333 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1334 | + | ||
1335 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Attempting to transfer data while" | ||
1336 | + " XlnxVersalCANFDState is in configuration mode." | ||
1337 | + " Reset the core so operations can start fresh\n", | ||
1338 | + path); | ||
1339 | + return false; | ||
1340 | + } | ||
1341 | + | ||
1342 | + if (ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, SNOOP)) { | ||
1343 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1344 | + | ||
1345 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Attempting to transfer data while" | ||
1346 | + " XlnxVersalCANFDState is in SNOOP MODE\n", | ||
1347 | + path); | ||
1348 | + return false; | ||
1349 | + } | ||
1350 | + | ||
1351 | + return true; | ||
1352 | +} | ||
1353 | + | ||
1354 | +static void tx_fifo_stamp(XlnxVersalCANFDState *s, uint32_t tb0_regid) | ||
1355 | +{ | ||
1356 | + /* | ||
1357 | + * If EFC bit in DLC message is set, this means we will store the | ||
1358 | + * event of this transmitted message with time stamp. | ||
1359 | + */ | ||
1360 | + uint32_t dlc_reg_val = 0; | ||
1361 | + | ||
1362 | + if (FIELD_EX32(s->regs[tb0_regid + 1], TB0_DLC_REGISTER, EFC)) { | ||
1363 | + uint8_t dlc_val = FIELD_EX32(s->regs[tb0_regid + 1], TB0_DLC_REGISTER, | ||
1364 | + DLC); | ||
1365 | + bool fdf_val = FIELD_EX32(s->regs[tb0_regid + 1], TB0_DLC_REGISTER, | ||
1366 | + FDF); | ||
1367 | + bool brs_val = FIELD_EX32(s->regs[tb0_regid + 1], TB0_DLC_REGISTER, | ||
1368 | + BRS); | ||
1369 | + uint8_t mm_val = FIELD_EX32(s->regs[tb0_regid + 1], TB0_DLC_REGISTER, | ||
1370 | + MM); | ||
1371 | + uint8_t fill_level = ARRAY_FIELD_EX32(s->regs, | ||
1372 | + TX_EVENT_FIFO_STATUS_REGISTER, | ||
1373 | + TXE_FL); | ||
1374 | + uint8_t read_index = ARRAY_FIELD_EX32(s->regs, | ||
1375 | + TX_EVENT_FIFO_STATUS_REGISTER, | ||
1376 | + TXE_RI); | ||
1377 | + uint8_t store_index = fill_level + read_index; | ||
1378 | + | ||
1379 | + if ((fill_level) > s->cfg.tx_fifo - 1) { | ||
1380 | + qemu_log_mask(LOG_GUEST_ERROR, "TX Event Buffer is full." | ||
1381 | + " Discarding the message\n"); | ||
1382 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TXEOFLW, 1); | ||
1383 | + } else { | ||
1384 | + if (read_index == s->cfg.tx_fifo - 1) { | ||
1385 | + /* | ||
1386 | + * When ri is s->cfg.tx_fifo - 1 i.e. max, it goes cyclic that | ||
1387 | + * means we reset the ri to 0x0. | ||
1388 | + */ | ||
1389 | + read_index = 0; | ||
1390 | + ARRAY_FIELD_DP32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, TXE_RI, | ||
1391 | + read_index); | ||
1392 | + } | ||
1393 | + | ||
1394 | + if (store_index > s->cfg.tx_fifo - 1) { | ||
1395 | + store_index -= s->cfg.tx_fifo - 1; | ||
1396 | + } | ||
1397 | + | ||
1398 | + assert(store_index < s->cfg.tx_fifo); | ||
1399 | + | ||
1400 | + uint32_t tx_event_reg0_id = R_TXE_FIFO_TB_ID_REGISTER + | ||
1401 | + (store_index * 2); | ||
1402 | + | ||
1403 | + /* Store message ID in TX event register. */ | ||
1404 | + s->regs[tx_event_reg0_id] = s->regs[tb0_regid]; | ||
1405 | + | ||
1406 | + uint16_t tx_timestamp = CANFD_TIMER_MAX - | ||
1407 | + ptimer_get_count(s->canfd_timer); | ||
1408 | + | ||
1409 | + /* Store DLC with time stamp in DLC regs. */ | ||
1410 | + dlc_reg_val = FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, DLC, dlc_val); | ||
1411 | + dlc_reg_val |= FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, FDF, | ||
1412 | + fdf_val); | ||
1413 | + dlc_reg_val |= FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, BRS, | ||
1414 | + brs_val); | ||
1415 | + dlc_reg_val |= FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, ET, 0x3); | ||
1416 | + dlc_reg_val |= FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, MM, mm_val); | ||
1417 | + dlc_reg_val |= FIELD_DP32(0, TXE_FIFO_TB_DLC_REGISTER, TIMESTAMP, | ||
1418 | + tx_timestamp); | ||
1419 | + s->regs[tx_event_reg0_id + 1] = dlc_reg_val; | ||
1420 | + | ||
1421 | + ARRAY_FIELD_DP32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, TXE_FL, | ||
1422 | + fill_level + 1); | ||
1423 | + } | ||
1424 | + } | ||
1425 | +} | ||
1426 | + | ||
1427 | +static gint g_cmp_ids(gconstpointer data1, gconstpointer data2) | ||
1428 | +{ | ||
1429 | + tx_ready_reg_info *tx_reg_1 = (tx_ready_reg_info *) data1; | ||
1430 | + tx_ready_reg_info *tx_reg_2 = (tx_ready_reg_info *) data2; | ||
1431 | + | ||
1432 | + return tx_reg_1->can_id - tx_reg_2->can_id; | ||
1433 | +} | ||
1434 | + | ||
1435 | +static void free_list(GSList *list) | ||
1436 | +{ | ||
1437 | + GSList *iterator = NULL; | ||
1438 | + | ||
1439 | + for (iterator = list; iterator != NULL; iterator = iterator->next) { | ||
1440 | + g_free((tx_ready_reg_info *)iterator->data); | ||
1441 | + } | ||
1442 | + | ||
1443 | + g_slist_free(list); | ||
1444 | + | ||
1445 | + return; | ||
1446 | +} | ||
1447 | + | ||
1448 | +static GSList *prepare_tx_data(XlnxVersalCANFDState *s) | ||
1449 | +{ | ||
1450 | + uint8_t i = 0; | ||
1451 | + GSList *list = NULL; | ||
1452 | + uint32_t reg_num = 0; | ||
1453 | + uint32_t reg_ready = s->regs[R_TX_BUFFER_READY_REQUEST_REGISTER]; | ||
1454 | + | ||
1455 | + /* First find the messages which are ready for transmission. */ | ||
1456 | + for (i = 0; i < s->cfg.tx_fifo; i++) { | ||
1457 | + if (reg_ready & 1) { | ||
1458 | + reg_num = R_TB_ID_REGISTER + (NUM_REGS_PER_MSG_SPACE * i); | ||
1459 | + tx_ready_reg_info *temp = g_new(tx_ready_reg_info, 1); | ||
1460 | + | ||
1461 | + temp->can_id = s->regs[reg_num]; | ||
1462 | + temp->reg_num = reg_num; | ||
1463 | + list = g_slist_prepend(list, temp); | ||
1464 | + list = g_slist_sort(list, g_cmp_ids); | ||
1465 | + } | ||
1466 | + | ||
1467 | + reg_ready >>= 1; | ||
1468 | + } | ||
1469 | + | ||
1470 | + s->regs[R_TX_BUFFER_READY_REQUEST_REGISTER] = 0; | ||
1471 | + s->regs[R_TX_BUFFER_CANCEL_REQUEST_REGISTER] = 0; | ||
1472 | + | ||
1473 | + return list; | ||
1474 | +} | ||
1475 | + | ||
1476 | +static void transfer_data(XlnxVersalCANFDState *s) | ||
1477 | +{ | ||
1478 | + bool canfd_tx = tx_ready_check(s); | ||
1479 | + GSList *list, *iterator = NULL; | ||
1480 | + qemu_can_frame frame; | ||
1481 | + | ||
1482 | + if (!canfd_tx) { | ||
1483 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1484 | + | ||
1485 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Controller not enabled for data" | ||
1486 | + " transfer\n", path); | ||
1487 | + return; | ||
1488 | + } | ||
1489 | + | ||
1490 | + list = prepare_tx_data(s); | ||
1491 | + if (list == NULL) { | ||
1492 | + return; | ||
1493 | + } | ||
1494 | + | ||
1495 | + for (iterator = list; iterator != NULL; iterator = iterator->next) { | ||
1496 | + regs2frame(s, &frame, | ||
1497 | + ((tx_ready_reg_info *)iterator->data)->reg_num); | ||
1498 | + | ||
1499 | + if (ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, LBACK)) { | ||
1500 | + update_rx_sequential(s, &frame); | ||
1501 | + tx_fifo_stamp(s, ((tx_ready_reg_info *)iterator->data)->reg_num); | ||
1502 | + | ||
1503 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, RXOK, 1); | ||
1504 | + } else { | ||
1505 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1506 | + | ||
1507 | + trace_xlnx_canfd_tx_data(path, frame.can_id, frame.can_dlc, | ||
1508 | + frame.flags); | ||
1509 | + can_bus_client_send(&s->bus_client, &frame, 1); | ||
1510 | + tx_fifo_stamp(s, | ||
1511 | + ((tx_ready_reg_info *)iterator->data)->reg_num); | ||
1512 | + | ||
1513 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TXRRS, 1); | ||
1514 | + | ||
1515 | + if (ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, SLEEP)) { | ||
1516 | + canfd_exit_sleep_mode(s); | ||
140 | + } | 1517 | + } |
141 | + } | 1518 | + } |
142 | + } | 1519 | + } |
143 | +} | 1520 | + |
144 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 1521 | + ARRAY_FIELD_DP32(s->regs, INTERRUPT_STATUS_REGISTER, TXOK, 1); |
1522 | + free_list(list); | ||
1523 | + | ||
1524 | + canfd_update_irq(s); | ||
1525 | +} | ||
1526 | + | ||
1527 | +static uint64_t canfd_srr_pre_write(RegisterInfo *reg, uint64_t val64) | ||
1528 | +{ | ||
1529 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1530 | + uint32_t val = val64; | ||
1531 | + | ||
1532 | + ARRAY_FIELD_DP32(s->regs, SOFTWARE_RESET_REGISTER, CEN, | ||
1533 | + FIELD_EX32(val, SOFTWARE_RESET_REGISTER, CEN)); | ||
1534 | + | ||
1535 | + if (FIELD_EX32(val, SOFTWARE_RESET_REGISTER, SRST)) { | ||
1536 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1537 | + | ||
1538 | + trace_xlnx_canfd_reset(path, val64); | ||
1539 | + | ||
1540 | + /* First, core will do software reset then will enter in config mode. */ | ||
1541 | + canfd_config_reset(s); | ||
1542 | + } else if (ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, CEN) == 0) { | ||
1543 | + canfd_config_mode(s); | ||
1544 | + } else { | ||
1545 | + /* | ||
1546 | + * Leave config mode. Now XlnxVersalCANFD core will enter Normal, Sleep, | ||
1547 | + * snoop or Loopback mode depending upon LBACK, SLEEP, SNOOP register | ||
1548 | + * states. | ||
1549 | + */ | ||
1550 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, CONFIG, 0); | ||
1551 | + | ||
1552 | + ptimer_transaction_begin(s->canfd_timer); | ||
1553 | + ptimer_set_count(s->canfd_timer, 0); | ||
1554 | + ptimer_transaction_commit(s->canfd_timer); | ||
1555 | + update_status_register_mode_bits(s); | ||
1556 | + transfer_data(s); | ||
1557 | + } | ||
1558 | + | ||
1559 | + return s->regs[R_SOFTWARE_RESET_REGISTER]; | ||
1560 | +} | ||
1561 | + | ||
1562 | +static uint64_t filter_mask(RegisterInfo *reg, uint64_t val64) | ||
1563 | +{ | ||
1564 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1565 | + uint32_t reg_idx = (reg->access->addr) / 4; | ||
1566 | + uint32_t val = val64; | ||
1567 | + uint32_t filter_offset = (reg_idx - R_AFMR_REGISTER) / 2; | ||
1568 | + | ||
1569 | + if (!(s->regs[R_ACCEPTANCE_FILTER_CONTROL_REGISTER] & | ||
1570 | + (1 << filter_offset))) { | ||
1571 | + s->regs[reg_idx] = val; | ||
1572 | + } else { | ||
1573 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1574 | + | ||
1575 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Acceptance filter %d not enabled\n", | ||
1576 | + path, filter_offset + 1); | ||
1577 | + } | ||
1578 | + | ||
1579 | + return s->regs[reg_idx]; | ||
1580 | +} | ||
1581 | + | ||
1582 | +static uint64_t filter_id(RegisterInfo *reg, uint64_t val64) | ||
1583 | +{ | ||
1584 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1585 | + hwaddr reg_idx = (reg->access->addr) / 4; | ||
1586 | + uint32_t val = val64; | ||
1587 | + uint32_t filter_offset = (reg_idx - R_AFIR_REGISTER) / 2; | ||
1588 | + | ||
1589 | + if (!(s->regs[R_ACCEPTANCE_FILTER_CONTROL_REGISTER] & | ||
1590 | + (1 << filter_offset))) { | ||
1591 | + s->regs[reg_idx] = val; | ||
1592 | + } else { | ||
1593 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1594 | + | ||
1595 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Acceptance filter %d not enabled\n", | ||
1596 | + path, filter_offset + 1); | ||
1597 | + } | ||
1598 | + | ||
1599 | + return s->regs[reg_idx]; | ||
1600 | +} | ||
1601 | + | ||
1602 | +static uint64_t canfd_tx_fifo_status_prew(RegisterInfo *reg, uint64_t val64) | ||
1603 | +{ | ||
1604 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1605 | + uint32_t val = val64; | ||
1606 | + uint8_t read_ind = 0; | ||
1607 | + uint8_t fill_ind = ARRAY_FIELD_EX32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, | ||
1608 | + TXE_FL); | ||
1609 | + | ||
1610 | + if (FIELD_EX32(val, TX_EVENT_FIFO_STATUS_REGISTER, TXE_IRI) && fill_ind) { | ||
1611 | + read_ind = ARRAY_FIELD_EX32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, | ||
1612 | + TXE_RI) + 1; | ||
1613 | + | ||
1614 | + if (read_ind > s->cfg.tx_fifo - 1) { | ||
1615 | + read_ind = 0; | ||
1616 | + } | ||
1617 | + | ||
1618 | + /* | ||
1619 | + * Increase the read index by 1 and decrease the fill level by 1. | ||
1620 | + */ | ||
1621 | + ARRAY_FIELD_DP32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, TXE_RI, | ||
1622 | + read_ind); | ||
1623 | + ARRAY_FIELD_DP32(s->regs, TX_EVENT_FIFO_STATUS_REGISTER, TXE_FL, | ||
1624 | + fill_ind - 1); | ||
1625 | + } | ||
1626 | + | ||
1627 | + return s->regs[R_TX_EVENT_FIFO_STATUS_REGISTER]; | ||
1628 | +} | ||
1629 | + | ||
1630 | +static uint64_t canfd_rx_fifo_status_prew(RegisterInfo *reg, uint64_t val64) | ||
1631 | +{ | ||
1632 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1633 | + uint32_t val = val64; | ||
1634 | + uint8_t read_ind = 0; | ||
1635 | + uint8_t fill_ind = 0; | ||
1636 | + | ||
1637 | + if (FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, IRI)) { | ||
1638 | + /* FL index is zero, setting IRI bit has no effect. */ | ||
1639 | + if (FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, FL) != 0) { | ||
1640 | + read_ind = FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, RI) + 1; | ||
1641 | + | ||
1642 | + if (read_ind > s->cfg.rx0_fifo - 1) { | ||
1643 | + read_ind = 0; | ||
1644 | + } | ||
1645 | + | ||
1646 | + fill_ind = FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, FL) - 1; | ||
1647 | + | ||
1648 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, RI, read_ind); | ||
1649 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, FL, fill_ind); | ||
1650 | + } | ||
1651 | + } | ||
1652 | + | ||
1653 | + if (FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, IRI_1)) { | ||
1654 | + /* FL_1 index is zero, setting IRI_1 bit has no effect. */ | ||
1655 | + if (FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, FL_1) != 0) { | ||
1656 | + read_ind = FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, RI_1) + 1; | ||
1657 | + | ||
1658 | + if (read_ind > s->cfg.rx1_fifo - 1) { | ||
1659 | + read_ind = 0; | ||
1660 | + } | ||
1661 | + | ||
1662 | + fill_ind = FIELD_EX32(val, RX_FIFO_STATUS_REGISTER, FL_1) - 1; | ||
1663 | + | ||
1664 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, RI_1, read_ind); | ||
1665 | + ARRAY_FIELD_DP32(s->regs, RX_FIFO_STATUS_REGISTER, FL_1, fill_ind); | ||
1666 | + } | ||
1667 | + } | ||
1668 | + | ||
1669 | + return s->regs[R_RX_FIFO_STATUS_REGISTER]; | ||
1670 | +} | ||
1671 | + | ||
1672 | +static uint64_t canfd_tsr_pre_write(RegisterInfo *reg, uint64_t val64) | ||
1673 | +{ | ||
1674 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1675 | + uint32_t val = val64; | ||
1676 | + | ||
1677 | + if (FIELD_EX32(val, TIMESTAMP_REGISTER, CTS)) { | ||
1678 | + ARRAY_FIELD_DP32(s->regs, TIMESTAMP_REGISTER, TIMESTAMP_CNT, 0); | ||
1679 | + ptimer_transaction_begin(s->canfd_timer); | ||
1680 | + ptimer_set_count(s->canfd_timer, 0); | ||
1681 | + ptimer_transaction_commit(s->canfd_timer); | ||
1682 | + } | ||
1683 | + | ||
1684 | + return 0; | ||
1685 | +} | ||
1686 | + | ||
1687 | +static uint64_t canfd_trr_reg_prew(RegisterInfo *reg, uint64_t val64) | ||
1688 | +{ | ||
1689 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1690 | + | ||
1691 | + if (ARRAY_FIELD_EX32(s->regs, MODE_SELECT_REGISTER, SNOOP)) { | ||
1692 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
1693 | + | ||
1694 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: Controller is in SNOOP mode." | ||
1695 | + " tx_ready_register will stay in reset mode\n", path); | ||
1696 | + return 0; | ||
1697 | + } else { | ||
1698 | + return val64; | ||
1699 | + } | ||
1700 | +} | ||
1701 | + | ||
1702 | +static void canfd_trr_reg_postw(RegisterInfo *reg, uint64_t val64) | ||
1703 | +{ | ||
1704 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1705 | + | ||
1706 | + transfer_data(s); | ||
1707 | +} | ||
1708 | + | ||
1709 | +static void canfd_cancel_reg_postw(RegisterInfo *reg, uint64_t val64) | ||
1710 | +{ | ||
1711 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1712 | + | ||
1713 | + process_cancellation_requests(s); | ||
1714 | +} | ||
1715 | + | ||
1716 | +static uint64_t canfd_write_check_prew(RegisterInfo *reg, uint64_t val64) | ||
1717 | +{ | ||
1718 | + XlnxVersalCANFDState *s = XILINX_CANFD(reg->opaque); | ||
1719 | + uint32_t val = val64; | ||
1720 | + | ||
1721 | + if (ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, CEN) == 0) { | ||
1722 | + return val; | ||
1723 | + } | ||
1724 | + return 0; | ||
1725 | +} | ||
1726 | + | ||
1727 | +static const RegisterAccessInfo canfd_tx_regs[] = { | ||
1728 | + { .name = "TB_ID_REGISTER", .addr = A_TB_ID_REGISTER, | ||
1729 | + },{ .name = "TB0_DLC_REGISTER", .addr = A_TB0_DLC_REGISTER, | ||
1730 | + },{ .name = "TB_DW0_REGISTER", .addr = A_TB_DW0_REGISTER, | ||
1731 | + },{ .name = "TB_DW1_REGISTER", .addr = A_TB_DW1_REGISTER, | ||
1732 | + },{ .name = "TB_DW2_REGISTER", .addr = A_TB_DW2_REGISTER, | ||
1733 | + },{ .name = "TB_DW3_REGISTER", .addr = A_TB_DW3_REGISTER, | ||
1734 | + },{ .name = "TB_DW4_REGISTER", .addr = A_TB_DW4_REGISTER, | ||
1735 | + },{ .name = "TB_DW5_REGISTER", .addr = A_TB_DW5_REGISTER, | ||
1736 | + },{ .name = "TB_DW6_REGISTER", .addr = A_TB_DW6_REGISTER, | ||
1737 | + },{ .name = "TB_DW7_REGISTER", .addr = A_TB_DW7_REGISTER, | ||
1738 | + },{ .name = "TB_DW8_REGISTER", .addr = A_TB_DW8_REGISTER, | ||
1739 | + },{ .name = "TB_DW9_REGISTER", .addr = A_TB_DW9_REGISTER, | ||
1740 | + },{ .name = "TB_DW10_REGISTER", .addr = A_TB_DW10_REGISTER, | ||
1741 | + },{ .name = "TB_DW11_REGISTER", .addr = A_TB_DW11_REGISTER, | ||
1742 | + },{ .name = "TB_DW12_REGISTER", .addr = A_TB_DW12_REGISTER, | ||
1743 | + },{ .name = "TB_DW13_REGISTER", .addr = A_TB_DW13_REGISTER, | ||
1744 | + },{ .name = "TB_DW14_REGISTER", .addr = A_TB_DW14_REGISTER, | ||
1745 | + },{ .name = "TB_DW15_REGISTER", .addr = A_TB_DW15_REGISTER, | ||
1746 | + } | ||
1747 | +}; | ||
1748 | + | ||
1749 | +static const RegisterAccessInfo canfd_rx0_regs[] = { | ||
1750 | + { .name = "RB_ID_REGISTER", .addr = A_RB_ID_REGISTER, | ||
1751 | + .ro = 0xffffffff, | ||
1752 | + },{ .name = "RB_DLC_REGISTER", .addr = A_RB_DLC_REGISTER, | ||
1753 | + .ro = 0xfe1fffff, | ||
1754 | + },{ .name = "RB_DW0_REGISTER", .addr = A_RB_DW0_REGISTER, | ||
1755 | + .ro = 0xffffffff, | ||
1756 | + },{ .name = "RB_DW1_REGISTER", .addr = A_RB_DW1_REGISTER, | ||
1757 | + .ro = 0xffffffff, | ||
1758 | + },{ .name = "RB_DW2_REGISTER", .addr = A_RB_DW2_REGISTER, | ||
1759 | + .ro = 0xffffffff, | ||
1760 | + },{ .name = "RB_DW3_REGISTER", .addr = A_RB_DW3_REGISTER, | ||
1761 | + .ro = 0xffffffff, | ||
1762 | + },{ .name = "RB_DW4_REGISTER", .addr = A_RB_DW4_REGISTER, | ||
1763 | + .ro = 0xffffffff, | ||
1764 | + },{ .name = "RB_DW5_REGISTER", .addr = A_RB_DW5_REGISTER, | ||
1765 | + .ro = 0xffffffff, | ||
1766 | + },{ .name = "RB_DW6_REGISTER", .addr = A_RB_DW6_REGISTER, | ||
1767 | + .ro = 0xffffffff, | ||
1768 | + },{ .name = "RB_DW7_REGISTER", .addr = A_RB_DW7_REGISTER, | ||
1769 | + .ro = 0xffffffff, | ||
1770 | + },{ .name = "RB_DW8_REGISTER", .addr = A_RB_DW8_REGISTER, | ||
1771 | + .ro = 0xffffffff, | ||
1772 | + },{ .name = "RB_DW9_REGISTER", .addr = A_RB_DW9_REGISTER, | ||
1773 | + .ro = 0xffffffff, | ||
1774 | + },{ .name = "RB_DW10_REGISTER", .addr = A_RB_DW10_REGISTER, | ||
1775 | + .ro = 0xffffffff, | ||
1776 | + },{ .name = "RB_DW11_REGISTER", .addr = A_RB_DW11_REGISTER, | ||
1777 | + .ro = 0xffffffff, | ||
1778 | + },{ .name = "RB_DW12_REGISTER", .addr = A_RB_DW12_REGISTER, | ||
1779 | + .ro = 0xffffffff, | ||
1780 | + },{ .name = "RB_DW13_REGISTER", .addr = A_RB_DW13_REGISTER, | ||
1781 | + .ro = 0xffffffff, | ||
1782 | + },{ .name = "RB_DW14_REGISTER", .addr = A_RB_DW14_REGISTER, | ||
1783 | + .ro = 0xffffffff, | ||
1784 | + },{ .name = "RB_DW15_REGISTER", .addr = A_RB_DW15_REGISTER, | ||
1785 | + .ro = 0xffffffff, | ||
1786 | + } | ||
1787 | +}; | ||
1788 | + | ||
1789 | +static const RegisterAccessInfo canfd_rx1_regs[] = { | ||
1790 | + { .name = "RB_ID_REGISTER_1", .addr = A_RB_ID_REGISTER_1, | ||
1791 | + .ro = 0xffffffff, | ||
1792 | + },{ .name = "RB_DLC_REGISTER_1", .addr = A_RB_DLC_REGISTER_1, | ||
1793 | + .ro = 0xfe1fffff, | ||
1794 | + },{ .name = "RB0_DW0_REGISTER_1", .addr = A_RB0_DW0_REGISTER_1, | ||
1795 | + .ro = 0xffffffff, | ||
1796 | + },{ .name = "RB_DW1_REGISTER_1", .addr = A_RB_DW1_REGISTER_1, | ||
1797 | + .ro = 0xffffffff, | ||
1798 | + },{ .name = "RB_DW2_REGISTER_1", .addr = A_RB_DW2_REGISTER_1, | ||
1799 | + .ro = 0xffffffff, | ||
1800 | + },{ .name = "RB_DW3_REGISTER_1", .addr = A_RB_DW3_REGISTER_1, | ||
1801 | + .ro = 0xffffffff, | ||
1802 | + },{ .name = "RB_DW4_REGISTER_1", .addr = A_RB_DW4_REGISTER_1, | ||
1803 | + .ro = 0xffffffff, | ||
1804 | + },{ .name = "RB_DW5_REGISTER_1", .addr = A_RB_DW5_REGISTER_1, | ||
1805 | + .ro = 0xffffffff, | ||
1806 | + },{ .name = "RB_DW6_REGISTER_1", .addr = A_RB_DW6_REGISTER_1, | ||
1807 | + .ro = 0xffffffff, | ||
1808 | + },{ .name = "RB_DW7_REGISTER_1", .addr = A_RB_DW7_REGISTER_1, | ||
1809 | + .ro = 0xffffffff, | ||
1810 | + },{ .name = "RB_DW8_REGISTER_1", .addr = A_RB_DW8_REGISTER_1, | ||
1811 | + .ro = 0xffffffff, | ||
1812 | + },{ .name = "RB_DW9_REGISTER_1", .addr = A_RB_DW9_REGISTER_1, | ||
1813 | + .ro = 0xffffffff, | ||
1814 | + },{ .name = "RB_DW10_REGISTER_1", .addr = A_RB_DW10_REGISTER_1, | ||
1815 | + .ro = 0xffffffff, | ||
1816 | + },{ .name = "RB_DW11_REGISTER_1", .addr = A_RB_DW11_REGISTER_1, | ||
1817 | + .ro = 0xffffffff, | ||
1818 | + },{ .name = "RB_DW12_REGISTER_1", .addr = A_RB_DW12_REGISTER_1, | ||
1819 | + .ro = 0xffffffff, | ||
1820 | + },{ .name = "RB_DW13_REGISTER_1", .addr = A_RB_DW13_REGISTER_1, | ||
1821 | + .ro = 0xffffffff, | ||
1822 | + },{ .name = "RB_DW14_REGISTER_1", .addr = A_RB_DW14_REGISTER_1, | ||
1823 | + .ro = 0xffffffff, | ||
1824 | + },{ .name = "RB_DW15_REGISTER_1", .addr = A_RB_DW15_REGISTER_1, | ||
1825 | + .ro = 0xffffffff, | ||
1826 | + } | ||
1827 | +}; | ||
1828 | + | ||
1829 | +/* Acceptance filter registers. */ | ||
1830 | +static const RegisterAccessInfo canfd_af_regs[] = { | ||
1831 | + { .name = "AFMR_REGISTER", .addr = A_AFMR_REGISTER, | ||
1832 | + .pre_write = filter_mask, | ||
1833 | + },{ .name = "AFIR_REGISTER", .addr = A_AFIR_REGISTER, | ||
1834 | + .pre_write = filter_id, | ||
1835 | + } | ||
1836 | +}; | ||
1837 | + | ||
1838 | +static const RegisterAccessInfo canfd_txe_regs[] = { | ||
1839 | + { .name = "TXE_FIFO_TB_ID_REGISTER", .addr = A_TXE_FIFO_TB_ID_REGISTER, | ||
1840 | + .ro = 0xffffffff, | ||
1841 | + },{ .name = "TXE_FIFO_TB_DLC_REGISTER", .addr = A_TXE_FIFO_TB_DLC_REGISTER, | ||
1842 | + .ro = 0xffffffff, | ||
1843 | + } | ||
1844 | +}; | ||
1845 | + | ||
1846 | +static const RegisterAccessInfo canfd_regs_info[] = { | ||
1847 | + { .name = "SOFTWARE_RESET_REGISTER", .addr = A_SOFTWARE_RESET_REGISTER, | ||
1848 | + .pre_write = canfd_srr_pre_write, | ||
1849 | + },{ .name = "MODE_SELECT_REGISTER", .addr = A_MODE_SELECT_REGISTER, | ||
1850 | + .pre_write = canfd_msr_pre_write, | ||
1851 | + },{ .name = "ARBITRATION_PHASE_BAUD_RATE_PRESCALER_REGISTER", | ||
1852 | + .addr = A_ARBITRATION_PHASE_BAUD_RATE_PRESCALER_REGISTER, | ||
1853 | + .pre_write = canfd_write_check_prew, | ||
1854 | + },{ .name = "ARBITRATION_PHASE_BIT_TIMING_REGISTER", | ||
1855 | + .addr = A_ARBITRATION_PHASE_BIT_TIMING_REGISTER, | ||
1856 | + .pre_write = canfd_write_check_prew, | ||
1857 | + },{ .name = "ERROR_COUNTER_REGISTER", .addr = A_ERROR_COUNTER_REGISTER, | ||
1858 | + .ro = 0xffff, | ||
1859 | + },{ .name = "ERROR_STATUS_REGISTER", .addr = A_ERROR_STATUS_REGISTER, | ||
1860 | + .w1c = 0xf1f, | ||
1861 | + },{ .name = "STATUS_REGISTER", .addr = A_STATUS_REGISTER, | ||
1862 | + .reset = 0x1, | ||
1863 | + .ro = 0x7f17ff, | ||
1864 | + },{ .name = "INTERRUPT_STATUS_REGISTER", | ||
1865 | + .addr = A_INTERRUPT_STATUS_REGISTER, | ||
1866 | + .ro = 0xffffff7f, | ||
1867 | + },{ .name = "INTERRUPT_ENABLE_REGISTER", | ||
1868 | + .addr = A_INTERRUPT_ENABLE_REGISTER, | ||
1869 | + .post_write = canfd_ier_post_write, | ||
1870 | + },{ .name = "INTERRUPT_CLEAR_REGISTER", | ||
1871 | + .addr = A_INTERRUPT_CLEAR_REGISTER, .pre_write = canfd_icr_pre_write, | ||
1872 | + },{ .name = "TIMESTAMP_REGISTER", .addr = A_TIMESTAMP_REGISTER, | ||
1873 | + .ro = 0xffff0000, | ||
1874 | + .pre_write = canfd_tsr_pre_write, | ||
1875 | + },{ .name = "DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER", | ||
1876 | + .addr = A_DATA_PHASE_BAUD_RATE_PRESCALER_REGISTER, | ||
1877 | + .pre_write = canfd_write_check_prew, | ||
1878 | + },{ .name = "DATA_PHASE_BIT_TIMING_REGISTER", | ||
1879 | + .addr = A_DATA_PHASE_BIT_TIMING_REGISTER, | ||
1880 | + .pre_write = canfd_write_check_prew, | ||
1881 | + },{ .name = "TX_BUFFER_READY_REQUEST_REGISTER", | ||
1882 | + .addr = A_TX_BUFFER_READY_REQUEST_REGISTER, | ||
1883 | + .pre_write = canfd_trr_reg_prew, | ||
1884 | + .post_write = canfd_trr_reg_postw, | ||
1885 | + },{ .name = "INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER", | ||
1886 | + .addr = A_INTERRUPT_ENABLE_TX_BUFFER_READY_REQUEST_REGISTER, | ||
1887 | + },{ .name = "TX_BUFFER_CANCEL_REQUEST_REGISTER", | ||
1888 | + .addr = A_TX_BUFFER_CANCEL_REQUEST_REGISTER, | ||
1889 | + .post_write = canfd_cancel_reg_postw, | ||
1890 | + },{ .name = "INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER", | ||
1891 | + .addr = A_INTERRUPT_ENABLE_TX_BUFFER_CANCELLATION_REQUEST_REGISTER, | ||
1892 | + },{ .name = "TX_EVENT_FIFO_STATUS_REGISTER", | ||
1893 | + .addr = A_TX_EVENT_FIFO_STATUS_REGISTER, | ||
1894 | + .ro = 0x3f1f, .pre_write = canfd_tx_fifo_status_prew, | ||
1895 | + },{ .name = "TX_EVENT_FIFO_WATERMARK_REGISTER", | ||
1896 | + .addr = A_TX_EVENT_FIFO_WATERMARK_REGISTER, | ||
1897 | + .reset = 0xf, | ||
1898 | + .pre_write = canfd_write_check_prew, | ||
1899 | + },{ .name = "ACCEPTANCE_FILTER_CONTROL_REGISTER", | ||
1900 | + .addr = A_ACCEPTANCE_FILTER_CONTROL_REGISTER, | ||
1901 | + },{ .name = "RX_FIFO_STATUS_REGISTER", .addr = A_RX_FIFO_STATUS_REGISTER, | ||
1902 | + .ro = 0x7f3f7f3f, .pre_write = canfd_rx_fifo_status_prew, | ||
1903 | + },{ .name = "RX_FIFO_WATERMARK_REGISTER", | ||
1904 | + .addr = A_RX_FIFO_WATERMARK_REGISTER, | ||
1905 | + .reset = 0x1f0f0f, | ||
1906 | + .pre_write = canfd_write_check_prew, | ||
1907 | + } | ||
1908 | +}; | ||
1909 | + | ||
1910 | +static void xlnx_versal_canfd_ptimer_cb(void *opaque) | ||
1911 | +{ | ||
1912 | + /* No action required on the timer rollover. */ | ||
1913 | +} | ||
1914 | + | ||
1915 | +static const MemoryRegionOps canfd_ops = { | ||
1916 | + .read = register_read_memory, | ||
1917 | + .write = register_write_memory, | ||
1918 | + .endianness = DEVICE_LITTLE_ENDIAN, | ||
1919 | + .valid = { | ||
1920 | + .min_access_size = 4, | ||
1921 | + .max_access_size = 4, | ||
1922 | + }, | ||
1923 | +}; | ||
1924 | + | ||
1925 | +static void canfd_reset(DeviceState *dev) | ||
1926 | +{ | ||
1927 | + XlnxVersalCANFDState *s = XILINX_CANFD(dev); | ||
1928 | + unsigned int i; | ||
1929 | + | ||
1930 | + for (i = 0; i < ARRAY_SIZE(s->reg_info); ++i) { | ||
1931 | + register_reset(&s->reg_info[i]); | ||
1932 | + } | ||
1933 | + | ||
1934 | + ptimer_transaction_begin(s->canfd_timer); | ||
1935 | + ptimer_set_count(s->canfd_timer, 0); | ||
1936 | + ptimer_transaction_commit(s->canfd_timer); | ||
1937 | +} | ||
1938 | + | ||
1939 | +static bool can_xilinx_canfd_receive(CanBusClientState *client) | ||
1940 | +{ | ||
1941 | + XlnxVersalCANFDState *s = container_of(client, XlnxVersalCANFDState, | ||
1942 | + bus_client); | ||
1943 | + | ||
1944 | + bool reset_state = ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, SRST); | ||
1945 | + bool can_enabled = ARRAY_FIELD_EX32(s->regs, SOFTWARE_RESET_REGISTER, CEN); | ||
1946 | + | ||
1947 | + return !reset_state && can_enabled; | ||
1948 | +} | ||
1949 | + | ||
1950 | +static ssize_t canfd_xilinx_receive(CanBusClientState *client, | ||
1951 | + const qemu_can_frame *buf, | ||
1952 | + size_t buf_size) | ||
1953 | +{ | ||
1954 | + XlnxVersalCANFDState *s = container_of(client, XlnxVersalCANFDState, | ||
1955 | + bus_client); | ||
1956 | + const qemu_can_frame *frame = buf; | ||
1957 | + | ||
1958 | + assert(buf_size > 0); | ||
1959 | + | ||
1960 | + if (ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, LBACK)) { | ||
1961 | + /* | ||
1962 | + * XlnxVersalCANFDState will not participate in normal bus communication | ||
1963 | + * and does not receive any messages transmitted by other CAN nodes. | ||
1964 | + */ | ||
1965 | + return 1; | ||
1966 | + } | ||
1967 | + | ||
1968 | + /* Update the status register that we are receiving message. */ | ||
1969 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, BBSY, 1); | ||
1970 | + | ||
1971 | + if (ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, SNOOP)) { | ||
1972 | + /* Snoop Mode: Just keep the data. no response back. */ | ||
1973 | + update_rx_sequential(s, frame); | ||
1974 | + } else { | ||
1975 | + if ((ARRAY_FIELD_EX32(s->regs, STATUS_REGISTER, SLEEP))) { | ||
1976 | + /* | ||
1977 | + * XlnxVersalCANFDState is in sleep mode. Any data on bus will bring | ||
1978 | + * it to the wake up state. | ||
1979 | + */ | ||
1980 | + canfd_exit_sleep_mode(s); | ||
1981 | + } | ||
1982 | + | ||
1983 | + update_rx_sequential(s, frame); | ||
1984 | + } | ||
1985 | + | ||
1986 | + /* Message processing done. Update the status back to !busy */ | ||
1987 | + ARRAY_FIELD_DP32(s->regs, STATUS_REGISTER, BBSY, 0); | ||
1988 | + return 1; | ||
1989 | +} | ||
1990 | + | ||
1991 | +static CanBusClientInfo canfd_xilinx_bus_client_info = { | ||
1992 | + .can_receive = can_xilinx_canfd_receive, | ||
1993 | + .receive = canfd_xilinx_receive, | ||
1994 | +}; | ||
1995 | + | ||
1996 | +static int xlnx_canfd_connect_to_bus(XlnxVersalCANFDState *s, | ||
1997 | + CanBusState *bus) | ||
1998 | +{ | ||
1999 | + s->bus_client.info = &canfd_xilinx_bus_client_info; | ||
2000 | + | ||
2001 | + return can_bus_insert_client(bus, &s->bus_client); | ||
2002 | +} | ||
2003 | + | ||
2004 | +#define NUM_REG_PER_AF ARRAY_SIZE(canfd_af_regs) | ||
2005 | +#define NUM_AF 32 | ||
2006 | +#define NUM_REG_PER_TXE ARRAY_SIZE(canfd_txe_regs) | ||
2007 | +#define NUM_TXE 32 | ||
2008 | + | ||
2009 | +static int canfd_populate_regarray(XlnxVersalCANFDState *s, | ||
2010 | + RegisterInfoArray *r_array, int pos, | ||
2011 | + const RegisterAccessInfo *rae, | ||
2012 | + int num_rae) | ||
2013 | +{ | ||
2014 | + int i; | ||
2015 | + | ||
2016 | + for (i = 0; i < num_rae; i++) { | ||
2017 | + int index = rae[i].addr / 4; | ||
2018 | + RegisterInfo *r = &s->reg_info[index]; | ||
2019 | + | ||
2020 | + object_initialize(r, sizeof(*r), TYPE_REGISTER); | ||
2021 | + | ||
2022 | + *r = (RegisterInfo) { | ||
2023 | + .data = &s->regs[index], | ||
2024 | + .data_size = sizeof(uint32_t), | ||
2025 | + .access = &rae[i], | ||
2026 | + .opaque = OBJECT(s), | ||
2027 | + }; | ||
2028 | + | ||
2029 | + r_array->r[i + pos] = r; | ||
2030 | + } | ||
2031 | + return i + pos; | ||
2032 | +} | ||
2033 | + | ||
2034 | +static void canfd_create_rai(RegisterAccessInfo *rai_array, | ||
2035 | + const RegisterAccessInfo *canfd_regs, | ||
2036 | + int template_rai_array_sz, | ||
2037 | + int num_template_to_copy) | ||
2038 | +{ | ||
2039 | + int i; | ||
2040 | + int reg_num; | ||
2041 | + | ||
2042 | + for (reg_num = 0; reg_num < num_template_to_copy; reg_num++) { | ||
2043 | + int pos = reg_num * template_rai_array_sz; | ||
2044 | + | ||
2045 | + memcpy(rai_array + pos, canfd_regs, | ||
2046 | + template_rai_array_sz * sizeof(RegisterAccessInfo)); | ||
2047 | + | ||
2048 | + for (i = 0; i < template_rai_array_sz; i++) { | ||
2049 | + const char *name = canfd_regs[i].name; | ||
2050 | + uint64_t addr = canfd_regs[i].addr; | ||
2051 | + rai_array[i + pos].name = g_strdup_printf("%s%d", name, reg_num); | ||
2052 | + rai_array[i + pos].addr = addr + pos * 4; | ||
2053 | + } | ||
2054 | + } | ||
2055 | +} | ||
2056 | + | ||
2057 | +static RegisterInfoArray *canfd_create_regarray(XlnxVersalCANFDState *s) | ||
2058 | +{ | ||
2059 | + const char *device_prefix = object_get_typename(OBJECT(s)); | ||
2060 | + uint64_t memory_size = XLNX_VERSAL_CANFD_R_MAX * 4; | ||
2061 | + int num_regs; | ||
2062 | + int pos = 0; | ||
2063 | + RegisterInfoArray *r_array; | ||
2064 | + | ||
2065 | + num_regs = ARRAY_SIZE(canfd_regs_info) + | ||
2066 | + s->cfg.tx_fifo * NUM_REGS_PER_MSG_SPACE + | ||
2067 | + s->cfg.rx0_fifo * NUM_REGS_PER_MSG_SPACE + | ||
2068 | + NUM_AF * NUM_REG_PER_AF + | ||
2069 | + NUM_TXE * NUM_REG_PER_TXE; | ||
2070 | + | ||
2071 | + s->tx_regs = g_new0(RegisterAccessInfo, | ||
2072 | + s->cfg.tx_fifo * ARRAY_SIZE(canfd_tx_regs)); | ||
2073 | + | ||
2074 | + canfd_create_rai(s->tx_regs, canfd_tx_regs, | ||
2075 | + ARRAY_SIZE(canfd_tx_regs), s->cfg.tx_fifo); | ||
2076 | + | ||
2077 | + s->rx0_regs = g_new0(RegisterAccessInfo, | ||
2078 | + s->cfg.rx0_fifo * ARRAY_SIZE(canfd_rx0_regs)); | ||
2079 | + | ||
2080 | + canfd_create_rai(s->rx0_regs, canfd_rx0_regs, | ||
2081 | + ARRAY_SIZE(canfd_rx0_regs), s->cfg.rx0_fifo); | ||
2082 | + | ||
2083 | + s->af_regs = g_new0(RegisterAccessInfo, | ||
2084 | + NUM_AF * ARRAY_SIZE(canfd_af_regs)); | ||
2085 | + | ||
2086 | + canfd_create_rai(s->af_regs, canfd_af_regs, | ||
2087 | + ARRAY_SIZE(canfd_af_regs), NUM_AF); | ||
2088 | + | ||
2089 | + s->txe_regs = g_new0(RegisterAccessInfo, | ||
2090 | + NUM_TXE * ARRAY_SIZE(canfd_txe_regs)); | ||
2091 | + | ||
2092 | + canfd_create_rai(s->txe_regs, canfd_txe_regs, | ||
2093 | + ARRAY_SIZE(canfd_txe_regs), NUM_TXE); | ||
2094 | + | ||
2095 | + if (s->cfg.enable_rx_fifo1) { | ||
2096 | + num_regs += s->cfg.rx1_fifo * NUM_REGS_PER_MSG_SPACE; | ||
2097 | + | ||
2098 | + s->rx1_regs = g_new0(RegisterAccessInfo, | ||
2099 | + s->cfg.rx1_fifo * ARRAY_SIZE(canfd_rx1_regs)); | ||
2100 | + | ||
2101 | + canfd_create_rai(s->rx1_regs, canfd_rx1_regs, | ||
2102 | + ARRAY_SIZE(canfd_rx1_regs), s->cfg.rx1_fifo); | ||
2103 | + } | ||
2104 | + | ||
2105 | + r_array = g_new0(RegisterInfoArray, 1); | ||
2106 | + r_array->r = g_new0(RegisterInfo * , num_regs); | ||
2107 | + r_array->num_elements = num_regs; | ||
2108 | + r_array->prefix = device_prefix; | ||
2109 | + | ||
2110 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2111 | + canfd_regs_info, | ||
2112 | + ARRAY_SIZE(canfd_regs_info)); | ||
2113 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2114 | + s->tx_regs, s->cfg.tx_fifo * | ||
2115 | + NUM_REGS_PER_MSG_SPACE); | ||
2116 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2117 | + s->rx0_regs, s->cfg.rx0_fifo * | ||
2118 | + NUM_REGS_PER_MSG_SPACE); | ||
2119 | + if (s->cfg.enable_rx_fifo1) { | ||
2120 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2121 | + s->rx1_regs, s->cfg.rx1_fifo * | ||
2122 | + NUM_REGS_PER_MSG_SPACE); | ||
2123 | + } | ||
2124 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2125 | + s->af_regs, NUM_AF * NUM_REG_PER_AF); | ||
2126 | + pos = canfd_populate_regarray(s, r_array, pos, | ||
2127 | + s->txe_regs, NUM_TXE * NUM_REG_PER_TXE); | ||
2128 | + | ||
2129 | + memory_region_init_io(&r_array->mem, OBJECT(s), &canfd_ops, r_array, | ||
2130 | + device_prefix, memory_size); | ||
2131 | + return r_array; | ||
2132 | +} | ||
2133 | + | ||
2134 | +static void canfd_realize(DeviceState *dev, Error **errp) | ||
2135 | +{ | ||
2136 | + XlnxVersalCANFDState *s = XILINX_CANFD(dev); | ||
2137 | + RegisterInfoArray *reg_array; | ||
2138 | + | ||
2139 | + reg_array = canfd_create_regarray(s); | ||
2140 | + memory_region_add_subregion(&s->iomem, 0x00, ®_array->mem); | ||
2141 | + sysbus_init_mmio(SYS_BUS_DEVICE(dev), &s->iomem); | ||
2142 | + sysbus_init_irq(SYS_BUS_DEVICE(dev), &s->irq_canfd_int); | ||
2143 | + | ||
2144 | + if (s->canfdbus) { | ||
2145 | + if (xlnx_canfd_connect_to_bus(s, s->canfdbus) < 0) { | ||
2146 | + g_autofree char *path = object_get_canonical_path(OBJECT(s)); | ||
2147 | + | ||
2148 | + error_setg(errp, "%s: xlnx_canfd_connect_to_bus failed", path); | ||
2149 | + return; | ||
2150 | + } | ||
2151 | + | ||
2152 | + } | ||
2153 | + | ||
2154 | + /* Allocate a new timer. */ | ||
2155 | + s->canfd_timer = ptimer_init(xlnx_versal_canfd_ptimer_cb, s, | ||
2156 | + PTIMER_POLICY_WRAP_AFTER_ONE_PERIOD | | ||
2157 | + PTIMER_POLICY_TRIGGER_ONLY_ON_DECREMENT | | ||
2158 | + PTIMER_POLICY_NO_IMMEDIATE_RELOAD); | ||
2159 | + | ||
2160 | + ptimer_transaction_begin(s->canfd_timer); | ||
2161 | + | ||
2162 | + ptimer_set_freq(s->canfd_timer, s->cfg.ext_clk_freq); | ||
2163 | + ptimer_set_limit(s->canfd_timer, CANFD_TIMER_MAX, 1); | ||
2164 | + ptimer_run(s->canfd_timer, 0); | ||
2165 | + ptimer_transaction_commit(s->canfd_timer); | ||
2166 | +} | ||
2167 | + | ||
2168 | +static void canfd_init(Object *obj) | ||
2169 | +{ | ||
2170 | + XlnxVersalCANFDState *s = XILINX_CANFD(obj); | ||
2171 | + | ||
2172 | + memory_region_init(&s->iomem, obj, TYPE_XILINX_CANFD, | ||
2173 | + XLNX_VERSAL_CANFD_R_MAX * 4); | ||
2174 | +} | ||
2175 | + | ||
2176 | +static const VMStateDescription vmstate_canfd = { | ||
2177 | + .name = TYPE_XILINX_CANFD, | ||
2178 | + .version_id = 1, | ||
2179 | + .minimum_version_id = 1, | ||
2180 | + .fields = (VMStateField[]) { | ||
2181 | + VMSTATE_UINT32_ARRAY(regs, XlnxVersalCANFDState, | ||
2182 | + XLNX_VERSAL_CANFD_R_MAX), | ||
2183 | + VMSTATE_PTIMER(canfd_timer, XlnxVersalCANFDState), | ||
2184 | + VMSTATE_END_OF_LIST(), | ||
2185 | + } | ||
2186 | +}; | ||
2187 | + | ||
2188 | +static Property canfd_core_properties[] = { | ||
2189 | + DEFINE_PROP_UINT8("rx-fifo0", XlnxVersalCANFDState, cfg.rx0_fifo, 0x40), | ||
2190 | + DEFINE_PROP_UINT8("rx-fifo1", XlnxVersalCANFDState, cfg.rx1_fifo, 0x40), | ||
2191 | + DEFINE_PROP_UINT8("tx-fifo", XlnxVersalCANFDState, cfg.tx_fifo, 0x20), | ||
2192 | + DEFINE_PROP_BOOL("enable-rx-fifo1", XlnxVersalCANFDState, | ||
2193 | + cfg.enable_rx_fifo1, true), | ||
2194 | + DEFINE_PROP_UINT32("ext_clk_freq", XlnxVersalCANFDState, cfg.ext_clk_freq, | ||
2195 | + CANFD_DEFAULT_CLOCK), | ||
2196 | + DEFINE_PROP_LINK("canfdbus", XlnxVersalCANFDState, canfdbus, TYPE_CAN_BUS, | ||
2197 | + CanBusState *), | ||
2198 | + DEFINE_PROP_END_OF_LIST(), | ||
2199 | +}; | ||
2200 | + | ||
2201 | +static void canfd_class_init(ObjectClass *klass, void *data) | ||
2202 | +{ | ||
2203 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
2204 | + | ||
2205 | + dc->reset = canfd_reset; | ||
2206 | + dc->realize = canfd_realize; | ||
2207 | + device_class_set_props(dc, canfd_core_properties); | ||
2208 | + dc->vmsd = &vmstate_canfd; | ||
2209 | +} | ||
2210 | + | ||
2211 | +static const TypeInfo canfd_info = { | ||
2212 | + .name = TYPE_XILINX_CANFD, | ||
2213 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
2214 | + .instance_size = sizeof(XlnxVersalCANFDState), | ||
2215 | + .class_init = canfd_class_init, | ||
2216 | + .instance_init = canfd_init, | ||
2217 | +}; | ||
2218 | + | ||
2219 | +static void canfd_register_types(void) | ||
2220 | +{ | ||
2221 | + type_register_static(&canfd_info); | ||
2222 | +} | ||
2223 | + | ||
2224 | +type_init(canfd_register_types) | ||
2225 | diff --git a/hw/net/can/meson.build b/hw/net/can/meson.build | ||
145 | index XXXXXXX..XXXXXXX 100644 | 2226 | index XXXXXXX..XXXXXXX 100644 |
146 | --- a/target/arm/translate-sme.c | 2227 | --- a/hw/net/can/meson.build |
147 | +++ b/target/arm/translate-sme.c | 2228 | +++ b/hw/net/can/meson.build |
148 | @@ -XXX,XX +XXX,XX @@ static bool do_ldst_r(DisasContext *s, arg_ldstr *a, GenLdStR *fn) | 2229 | @@ -XXX,XX +XXX,XX @@ softmmu_ss.add(when: 'CONFIG_CAN_PCI', if_true: files('can_mioe3680_pci.c')) |
149 | 2230 | softmmu_ss.add(when: 'CONFIG_CAN_CTUCANFD', if_true: files('ctucan_core.c')) | |
150 | TRANS_FEAT(LDR, aa64_sme, do_ldst_r, a, gen_sve_ldr) | 2231 | softmmu_ss.add(when: 'CONFIG_CAN_CTUCANFD_PCI', if_true: files('ctucan_pci.c')) |
151 | TRANS_FEAT(STR, aa64_sme, do_ldst_r, a, gen_sve_str) | 2232 | softmmu_ss.add(when: 'CONFIG_XLNX_ZYNQMP', if_true: files('xlnx-zynqmp-can.c')) |
152 | + | 2233 | +softmmu_ss.add(when: 'CONFIG_XLNX_VERSAL', if_true: files('xlnx-versal-canfd.c')) |
153 | +static bool do_adda(DisasContext *s, arg_adda *a, MemOp esz, | 2234 | diff --git a/hw/net/can/trace-events b/hw/net/can/trace-events |
154 | + gen_helper_gvec_4 *fn) | 2235 | index XXXXXXX..XXXXXXX 100644 |
155 | +{ | 2236 | --- a/hw/net/can/trace-events |
156 | + int svl = streaming_vec_reg_size(s); | 2237 | +++ b/hw/net/can/trace-events |
157 | + uint32_t desc = simd_desc(svl, svl, 0); | 2238 | @@ -XXX,XX +XXX,XX @@ xlnx_can_filter_mask_pre_write(uint8_t filter_num, uint32_t value) "Filter%d MAS |
158 | + TCGv_ptr za, zn, pn, pm; | 2239 | xlnx_can_tx_data(uint32_t id, uint8_t dlc, uint8_t db0, uint8_t db1, uint8_t db2, uint8_t db3, uint8_t db4, uint8_t db5, uint8_t db6, uint8_t db7) "Frame: ID: 0x%08x DLC: 0x%02x DATA: 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x" |
159 | + | 2240 | xlnx_can_rx_data(uint32_t id, uint32_t dlc, uint8_t db0, uint8_t db1, uint8_t db2, uint8_t db3, uint8_t db4, uint8_t db5, uint8_t db6, uint8_t db7) "Frame: ID: 0x%08x DLC: 0x%02x DATA: 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x 0x%02x" |
160 | + if (!sme_smza_enabled_check(s)) { | 2241 | xlnx_can_rx_discard(uint32_t status) "Controller is not enabled for bus communication. Status Register: 0x%08x" |
161 | + return true; | 2242 | + |
162 | + } | 2243 | +# xlnx-versal-canfd.c |
163 | + | 2244 | +xlnx_canfd_update_irq(char *path, uint32_t isr, uint32_t ier, uint32_t irq) "%s: ISR: 0x%08x IER: 0x%08x IRQ: 0x%08x" |
164 | + /* Sum XZR+zad to find ZAd. */ | 2245 | +xlnx_canfd_rx_fifo_filter_reject(char *path, uint32_t id, uint8_t dlc) "%s: Frame: ID: 0x%08x DLC: 0x%02x" |
165 | + za = get_tile_rowcol(s, esz, 31, a->zad, false); | 2246 | +xlnx_canfd_rx_data(char *path, uint32_t id, uint8_t dlc, uint8_t flags) "%s: Frame: ID: 0x%08x DLC: 0x%02x CANFD Flag: 0x%02x" |
166 | + zn = vec_full_reg_ptr(s, a->zn); | 2247 | +xlnx_canfd_tx_data(char *path, uint32_t id, uint8_t dlc, uint8_t flgas) "%s: Frame: ID: 0x%08x DLC: 0x%02x CANFD Flag: 0x%02x" |
167 | + pn = pred_full_reg_ptr(s, a->pn); | 2248 | +xlnx_canfd_reset(char *path, uint32_t val) "%s: Resetting controller with value = 0x%08x" |
168 | + pm = pred_full_reg_ptr(s, a->pm); | ||
169 | + | ||
170 | + fn(za, zn, pn, pm, tcg_constant_i32(desc)); | ||
171 | + | ||
172 | + tcg_temp_free_ptr(za); | ||
173 | + tcg_temp_free_ptr(zn); | ||
174 | + tcg_temp_free_ptr(pn); | ||
175 | + tcg_temp_free_ptr(pm); | ||
176 | + return true; | ||
177 | +} | ||
178 | + | ||
179 | +TRANS_FEAT(ADDHA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addha_s) | ||
180 | +TRANS_FEAT(ADDVA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addva_s) | ||
181 | +TRANS_FEAT(ADDHA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addha_d) | ||
182 | +TRANS_FEAT(ADDVA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addva_d) | ||
183 | -- | 2249 | -- |
184 | 2.25.1 | 2250 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Vikram Garhwal <vikram.garhwal@amd.com> |
---|---|---|---|
2 | 2 | ||
3 | This is SMOPA, SUMOPA, USMOPA_s, UMOPA, for both Int8 and Int16. | 3 | Connect CANFD0 and CANFD1 on the Versal-virt machine and update xlnx-versal-virt |
4 | document with CANFD command line examples. | ||
4 | 5 | ||
6 | Signed-off-by: Vikram Garhwal <vikram.garhwal@amd.com> | ||
5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Reviewed-by: Francisco Iglesias <frasse.iglesias@gmail.com> |
7 | Message-id: 20220708151540.18136-28-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 10 | --- |
10 | target/arm/helper-sme.h | 16 ++++++++ | 11 | docs/system/arm/xlnx-versal-virt.rst | 31 ++++++++++++++++ |
11 | target/arm/sme.decode | 10 +++++ | 12 | include/hw/arm/xlnx-versal.h | 12 +++++++ |
12 | target/arm/sme_helper.c | 82 ++++++++++++++++++++++++++++++++++++++ | 13 | hw/arm/xlnx-versal-virt.c | 53 ++++++++++++++++++++++++++++ |
13 | target/arm/translate-sme.c | 10 +++++ | 14 | hw/arm/xlnx-versal.c | 37 +++++++++++++++++++ |
14 | 4 files changed, 118 insertions(+) | 15 | 4 files changed, 133 insertions(+) |
15 | 16 | ||
16 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 17 | diff --git a/docs/system/arm/xlnx-versal-virt.rst b/docs/system/arm/xlnx-versal-virt.rst |
17 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-sme.h | 19 | --- a/docs/system/arm/xlnx-versal-virt.rst |
19 | +++ b/target/arm/helper-sme.h | 20 | +++ b/docs/system/arm/xlnx-versal-virt.rst |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_7(sme_fmopa_d, TCG_CALL_NO_RWG, | 21 | @@ -XXX,XX +XXX,XX @@ Implemented devices: |
21 | void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | 22 | - DDR memory |
22 | DEF_HELPER_FLAGS_6(sme_bfmopa, TCG_CALL_NO_RWG, | 23 | - BBRAM (36 bytes of Battery-backed RAM) |
23 | void, ptr, ptr, ptr, ptr, ptr, i32) | 24 | - eFUSE (3072 bytes of one-time field-programmable bit array) |
24 | +DEF_HELPER_FLAGS_6(sme_smopa_s, TCG_CALL_NO_RWG, | 25 | +- 2 CANFDs |
25 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 26 | |
26 | +DEF_HELPER_FLAGS_6(sme_umopa_s, TCG_CALL_NO_RWG, | 27 | QEMU does not yet model any other devices, including the PL and the AI Engine. |
27 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 28 | |
28 | +DEF_HELPER_FLAGS_6(sme_sumopa_s, TCG_CALL_NO_RWG, | 29 | @@ -XXX,XX +XXX,XX @@ To use a different index value, N, from default of 1, add: |
29 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 30 | |
30 | +DEF_HELPER_FLAGS_6(sme_usmopa_s, TCG_CALL_NO_RWG, | 31 | Better yet, do not use actual product data when running guest image |
31 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 32 | on this Xilinx Versal Virt board. |
32 | +DEF_HELPER_FLAGS_6(sme_smopa_d, TCG_CALL_NO_RWG, | 33 | + |
33 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 34 | +Using CANFDs for Versal Virt |
34 | +DEF_HELPER_FLAGS_6(sme_umopa_d, TCG_CALL_NO_RWG, | 35 | +"""""""""""""""""""""""""""" |
35 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 36 | +Versal CANFD controller is developed based on SocketCAN and QEMU CAN bus |
36 | +DEF_HELPER_FLAGS_6(sme_sumopa_d, TCG_CALL_NO_RWG, | 37 | +implementation. Bus connection and socketCAN connection for each CAN module |
37 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 38 | +can be set through command lines. |
38 | +DEF_HELPER_FLAGS_6(sme_usmopa_d, TCG_CALL_NO_RWG, | 39 | + |
39 | + void, ptr, ptr, ptr, ptr, ptr, i32) | 40 | +To connect both CANFD0 and CANFD1 on the same bus: |
40 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | 41 | + |
41 | index XXXXXXX..XXXXXXX 100644 | 42 | +.. code-block:: bash |
42 | --- a/target/arm/sme.decode | 43 | + |
43 | +++ b/target/arm/sme.decode | 44 | + -object can-bus,id=canbus -machine canbus0=canbus -machine canbus1=canbus |
44 | @@ -XXX,XX +XXX,XX @@ FMOPA_d 10000000 110 ..... ... ... ..... . 0 ... @op_64 | 45 | + |
45 | 46 | +To connect CANFD0 and CANFD1 to separate buses: | |
46 | BFMOPA 10000001 100 ..... ... ... ..... . 00 .. @op_32 | 47 | + |
47 | FMOPA_h 10000001 101 ..... ... ... ..... . 00 .. @op_32 | 48 | +.. code-block:: bash |
48 | + | 49 | + |
49 | +SMOPA_s 1010000 0 10 0 ..... ... ... ..... . 00 .. @op_32 | 50 | + -object can-bus,id=canbus0 -object can-bus,id=canbus1 \ |
50 | +SUMOPA_s 1010000 0 10 1 ..... ... ... ..... . 00 .. @op_32 | 51 | + -machine canbus0=canbus0 -machine canbus1=canbus1 |
51 | +USMOPA_s 1010000 1 10 0 ..... ... ... ..... . 00 .. @op_32 | 52 | + |
52 | +UMOPA_s 1010000 1 10 1 ..... ... ... ..... . 00 .. @op_32 | 53 | +The SocketCAN interface can connect to a Physical or a Virtual CAN interfaces on |
53 | + | 54 | +the host machine. Please check this document to learn about CAN interface on |
54 | +SMOPA_d 1010000 0 11 0 ..... ... ... ..... . 0 ... @op_64 | 55 | +Linux: docs/system/devices/can.rst |
55 | +SUMOPA_d 1010000 0 11 1 ..... ... ... ..... . 0 ... @op_64 | 56 | + |
56 | +USMOPA_d 1010000 1 11 0 ..... ... ... ..... . 0 ... @op_64 | 57 | +To connect CANFD0 and CANFD1 to host machine's CAN interface can0: |
57 | +UMOPA_d 1010000 1 11 1 ..... ... ... ..... . 0 ... @op_64 | 58 | + |
58 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | 59 | +.. code-block:: bash |
59 | index XXXXXXX..XXXXXXX 100644 | 60 | + |
60 | --- a/target/arm/sme_helper.c | 61 | + -object can-bus,id=canbus -machine canbus0=canbus -machine canbus1=canbus |
61 | +++ b/target/arm/sme_helper.c | 62 | + -object can-host-socketcan,id=canhost0,if=can0,canbus=canbus |
62 | @@ -XXX,XX +XXX,XX @@ void HELPER(sme_bfmopa)(void *vza, void *vzn, void *vzm, void *vpn, | 63 | diff --git a/include/hw/arm/xlnx-versal.h b/include/hw/arm/xlnx-versal.h |
63 | } while (row & 15); | 64 | index XXXXXXX..XXXXXXX 100644 |
65 | --- a/include/hw/arm/xlnx-versal.h | ||
66 | +++ b/include/hw/arm/xlnx-versal.h | ||
67 | @@ -XXX,XX +XXX,XX @@ | ||
68 | #include "hw/dma/xlnx_csu_dma.h" | ||
69 | #include "hw/misc/xlnx-versal-crl.h" | ||
70 | #include "hw/misc/xlnx-versal-pmc-iou-slcr.h" | ||
71 | +#include "hw/net/xlnx-versal-canfd.h" | ||
72 | |||
73 | #define TYPE_XLNX_VERSAL "xlnx-versal" | ||
74 | OBJECT_DECLARE_SIMPLE_TYPE(Versal, XLNX_VERSAL) | ||
75 | @@ -XXX,XX +XXX,XX @@ OBJECT_DECLARE_SIMPLE_TYPE(Versal, XLNX_VERSAL) | ||
76 | #define XLNX_VERSAL_NR_SDS 2 | ||
77 | #define XLNX_VERSAL_NR_XRAM 4 | ||
78 | #define XLNX_VERSAL_NR_IRQS 192 | ||
79 | +#define XLNX_VERSAL_NR_CANFD 2 | ||
80 | +#define XLNX_VERSAL_CANFD_REF_CLK (24 * 1000 * 1000) | ||
81 | |||
82 | struct Versal { | ||
83 | /*< private >*/ | ||
84 | @@ -XXX,XX +XXX,XX @@ struct Versal { | ||
85 | CadenceGEMState gem[XLNX_VERSAL_NR_GEMS]; | ||
86 | XlnxZDMA adma[XLNX_VERSAL_NR_ADMAS]; | ||
87 | VersalUsb2 usb; | ||
88 | + CanBusState *canbus[XLNX_VERSAL_NR_CANFD]; | ||
89 | + XlnxVersalCANFDState canfd[XLNX_VERSAL_NR_CANFD]; | ||
90 | } iou; | ||
91 | |||
92 | /* Real-time Processing Unit. */ | ||
93 | @@ -XXX,XX +XXX,XX @@ struct Versal { | ||
94 | #define VERSAL_CRL_IRQ 10 | ||
95 | #define VERSAL_UART0_IRQ_0 18 | ||
96 | #define VERSAL_UART1_IRQ_0 19 | ||
97 | +#define VERSAL_CANFD0_IRQ_0 20 | ||
98 | +#define VERSAL_CANFD1_IRQ_0 21 | ||
99 | #define VERSAL_USB0_IRQ_0 22 | ||
100 | #define VERSAL_GEM0_IRQ_0 56 | ||
101 | #define VERSAL_GEM0_WAKE_IRQ_0 57 | ||
102 | @@ -XXX,XX +XXX,XX @@ struct Versal { | ||
103 | #define MM_UART1 0xff010000U | ||
104 | #define MM_UART1_SIZE 0x10000 | ||
105 | |||
106 | +#define MM_CANFD0 0xff060000U | ||
107 | +#define MM_CANFD0_SIZE 0x10000 | ||
108 | +#define MM_CANFD1 0xff070000U | ||
109 | +#define MM_CANFD1_SIZE 0x10000 | ||
110 | + | ||
111 | #define MM_GEM0 0xff0c0000U | ||
112 | #define MM_GEM0_SIZE 0x10000 | ||
113 | #define MM_GEM1 0xff0d0000U | ||
114 | diff --git a/hw/arm/xlnx-versal-virt.c b/hw/arm/xlnx-versal-virt.c | ||
115 | index XXXXXXX..XXXXXXX 100644 | ||
116 | --- a/hw/arm/xlnx-versal-virt.c | ||
117 | +++ b/hw/arm/xlnx-versal-virt.c | ||
118 | @@ -XXX,XX +XXX,XX @@ struct VersalVirt { | ||
119 | uint32_t clk_25Mhz; | ||
120 | uint32_t usb; | ||
121 | uint32_t dwc; | ||
122 | + uint32_t canfd[2]; | ||
123 | } phandle; | ||
124 | struct arm_boot_info binfo; | ||
125 | |||
126 | + CanBusState *canbus[XLNX_VERSAL_NR_CANFD]; | ||
127 | struct { | ||
128 | bool secure; | ||
129 | } cfg; | ||
130 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_uart_nodes(VersalVirt *s) | ||
64 | } | 131 | } |
65 | } | 132 | } |
66 | + | 133 | |
67 | +typedef uint64_t IMOPFn(uint64_t, uint64_t, uint64_t, uint8_t, bool); | 134 | +static void fdt_add_canfd_nodes(VersalVirt *s) |
68 | + | ||
69 | +static inline void do_imopa(uint64_t *za, uint64_t *zn, uint64_t *zm, | ||
70 | + uint8_t *pn, uint8_t *pm, | ||
71 | + uint32_t desc, IMOPFn *fn) | ||
72 | +{ | 135 | +{ |
73 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 8; | 136 | + uint64_t addrs[] = { MM_CANFD1, MM_CANFD0 }; |
74 | + bool neg = simd_data(desc); | 137 | + uint32_t size[] = { MM_CANFD1_SIZE, MM_CANFD0_SIZE }; |
75 | + | 138 | + unsigned int irqs[] = { VERSAL_CANFD1_IRQ_0, VERSAL_CANFD0_IRQ_0 }; |
76 | + for (row = 0; row < oprsz; ++row) { | 139 | + const char clocknames[] = "can_clk\0s_axi_aclk"; |
77 | + uint8_t pa = pn[H1(row)]; | 140 | + int i; |
78 | + uint64_t *za_row = &za[tile_vslice_index(row)]; | 141 | + |
79 | + uint64_t n = zn[row]; | 142 | + /* Create and connect CANFD0 and CANFD1 nodes to canbus0. */ |
80 | + | 143 | + for (i = 0; i < ARRAY_SIZE(addrs); i++) { |
81 | + for (col = 0; col < oprsz; ++col) { | 144 | + char *name = g_strdup_printf("/canfd@%" PRIx64, addrs[i]); |
82 | + uint8_t pb = pm[H1(col)]; | 145 | + qemu_fdt_add_subnode(s->fdt, name); |
83 | + uint64_t *a = &za_row[col]; | 146 | + |
84 | + | 147 | + qemu_fdt_setprop_cell(s->fdt, name, "rx-fifo-depth", 0x40); |
85 | + *a = fn(n, zm[col], *a, pa & pb, neg); | 148 | + qemu_fdt_setprop_cell(s->fdt, name, "tx-mailbox-count", 0x20); |
86 | + } | 149 | + |
150 | + qemu_fdt_setprop_cells(s->fdt, name, "clocks", | ||
151 | + s->phandle.clk_25Mhz, s->phandle.clk_25Mhz); | ||
152 | + qemu_fdt_setprop(s->fdt, name, "clock-names", | ||
153 | + clocknames, sizeof(clocknames)); | ||
154 | + qemu_fdt_setprop_cells(s->fdt, name, "interrupts", | ||
155 | + GIC_FDT_IRQ_TYPE_SPI, irqs[i], | ||
156 | + GIC_FDT_IRQ_FLAGS_LEVEL_HI); | ||
157 | + qemu_fdt_setprop_sized_cells(s->fdt, name, "reg", | ||
158 | + 2, addrs[i], 2, size[i]); | ||
159 | + qemu_fdt_setprop_string(s->fdt, name, "compatible", | ||
160 | + "xlnx,canfd-2.0"); | ||
161 | + | ||
162 | + g_free(name); | ||
87 | + } | 163 | + } |
88 | +} | 164 | +} |
89 | + | 165 | + |
90 | +#define DEF_IMOP_32(NAME, NTYPE, MTYPE) \ | 166 | static void fdt_add_fixed_link_nodes(VersalVirt *s, char *gemname, |
91 | +static uint64_t NAME(uint64_t n, uint64_t m, uint64_t a, uint8_t p, bool neg) \ | 167 | uint32_t phandle) |
92 | +{ \ | 168 | { |
93 | + uint32_t sum0 = 0, sum1 = 0; \ | 169 | @@ -XXX,XX +XXX,XX @@ static void versal_virt_init(MachineState *machine) |
94 | + /* Apply P to N as a mask, making the inactive elements 0. */ \ | 170 | TYPE_XLNX_VERSAL); |
95 | + n &= expand_pred_b(p); \ | 171 | object_property_set_link(OBJECT(&s->soc), "ddr", OBJECT(machine->ram), |
96 | + sum0 += (NTYPE)(n >> 0) * (MTYPE)(m >> 0); \ | 172 | &error_abort); |
97 | + sum0 += (NTYPE)(n >> 8) * (MTYPE)(m >> 8); \ | 173 | + object_property_set_link(OBJECT(&s->soc), "canbus0", OBJECT(s->canbus[0]), |
98 | + sum0 += (NTYPE)(n >> 16) * (MTYPE)(m >> 16); \ | 174 | + &error_abort); |
99 | + sum0 += (NTYPE)(n >> 24) * (MTYPE)(m >> 24); \ | 175 | + object_property_set_link(OBJECT(&s->soc), "canbus1", OBJECT(s->canbus[1]), |
100 | + sum1 += (NTYPE)(n >> 32) * (MTYPE)(m >> 32); \ | 176 | + &error_abort); |
101 | + sum1 += (NTYPE)(n >> 40) * (MTYPE)(m >> 40); \ | 177 | sysbus_realize(SYS_BUS_DEVICE(&s->soc), &error_fatal); |
102 | + sum1 += (NTYPE)(n >> 48) * (MTYPE)(m >> 48); \ | 178 | |
103 | + sum1 += (NTYPE)(n >> 56) * (MTYPE)(m >> 56); \ | 179 | fdt_create(s); |
104 | + if (neg) { \ | 180 | create_virtio_regions(s); |
105 | + sum0 = (uint32_t)a - sum0, sum1 = (uint32_t)(a >> 32) - sum1; \ | 181 | fdt_add_gem_nodes(s); |
106 | + } else { \ | 182 | fdt_add_uart_nodes(s); |
107 | + sum0 = (uint32_t)a + sum0, sum1 = (uint32_t)(a >> 32) + sum1; \ | 183 | + fdt_add_canfd_nodes(s); |
108 | + } \ | 184 | fdt_add_gic_nodes(s); |
109 | + return ((uint64_t)sum1 << 32) | sum0; \ | 185 | fdt_add_timer_nodes(s); |
186 | fdt_add_zdma_nodes(s); | ||
187 | @@ -XXX,XX +XXX,XX @@ static void versal_virt_init(MachineState *machine) | ||
188 | |||
189 | static void versal_virt_machine_instance_init(Object *obj) | ||
190 | { | ||
191 | + VersalVirt *s = XLNX_VERSAL_VIRT_MACHINE(obj); | ||
192 | + | ||
193 | + /* | ||
194 | + * User can set canbus0 and canbus1 properties to can-bus object and connect | ||
195 | + * to socketcan(optional) interface via command line. | ||
196 | + */ | ||
197 | + object_property_add_link(obj, "canbus0", TYPE_CAN_BUS, | ||
198 | + (Object **)&s->canbus[0], | ||
199 | + object_property_allow_set_link, | ||
200 | + 0); | ||
201 | + object_property_add_link(obj, "canbus1", TYPE_CAN_BUS, | ||
202 | + (Object **)&s->canbus[1], | ||
203 | + object_property_allow_set_link, | ||
204 | + 0); | ||
205 | } | ||
206 | |||
207 | static void versal_virt_machine_class_init(ObjectClass *oc, void *data) | ||
208 | diff --git a/hw/arm/xlnx-versal.c b/hw/arm/xlnx-versal.c | ||
209 | index XXXXXXX..XXXXXXX 100644 | ||
210 | --- a/hw/arm/xlnx-versal.c | ||
211 | +++ b/hw/arm/xlnx-versal.c | ||
212 | @@ -XXX,XX +XXX,XX @@ static void versal_create_uarts(Versal *s, qemu_irq *pic) | ||
213 | } | ||
214 | } | ||
215 | |||
216 | +static void versal_create_canfds(Versal *s, qemu_irq *pic) | ||
217 | +{ | ||
218 | + int i; | ||
219 | + uint32_t irqs[] = { VERSAL_CANFD0_IRQ_0, VERSAL_CANFD1_IRQ_0}; | ||
220 | + uint64_t addrs[] = { MM_CANFD0, MM_CANFD1 }; | ||
221 | + | ||
222 | + for (i = 0; i < ARRAY_SIZE(s->lpd.iou.canfd); i++) { | ||
223 | + char *name = g_strdup_printf("canfd%d", i); | ||
224 | + SysBusDevice *sbd; | ||
225 | + MemoryRegion *mr; | ||
226 | + | ||
227 | + object_initialize_child(OBJECT(s), name, &s->lpd.iou.canfd[i], | ||
228 | + TYPE_XILINX_CANFD); | ||
229 | + sbd = SYS_BUS_DEVICE(&s->lpd.iou.canfd[i]); | ||
230 | + | ||
231 | + object_property_set_int(OBJECT(&s->lpd.iou.canfd[i]), "ext_clk_freq", | ||
232 | + XLNX_VERSAL_CANFD_REF_CLK , &error_abort); | ||
233 | + | ||
234 | + object_property_set_link(OBJECT(&s->lpd.iou.canfd[i]), "canfdbus", | ||
235 | + OBJECT(s->lpd.iou.canbus[i]), | ||
236 | + &error_abort); | ||
237 | + | ||
238 | + sysbus_realize(sbd, &error_fatal); | ||
239 | + | ||
240 | + mr = sysbus_mmio_get_region(sbd, 0); | ||
241 | + memory_region_add_subregion(&s->mr_ps, addrs[i], mr); | ||
242 | + | ||
243 | + sysbus_connect_irq(sbd, 0, pic[irqs[i]]); | ||
244 | + g_free(name); | ||
245 | + } | ||
110 | +} | 246 | +} |
111 | + | 247 | + |
112 | +#define DEF_IMOP_64(NAME, NTYPE, MTYPE) \ | 248 | static void versal_create_usbs(Versal *s, qemu_irq *pic) |
113 | +static uint64_t NAME(uint64_t n, uint64_t m, uint64_t a, uint8_t p, bool neg) \ | 249 | { |
114 | +{ \ | 250 | DeviceState *dev; |
115 | + uint64_t sum = 0; \ | 251 | @@ -XXX,XX +XXX,XX @@ static void versal_realize(DeviceState *dev, Error **errp) |
116 | + /* Apply P to N as a mask, making the inactive elements 0. */ \ | 252 | versal_create_apu_gic(s, pic); |
117 | + n &= expand_pred_h(p); \ | 253 | versal_create_rpu_cpus(s); |
118 | + sum += (NTYPE)(n >> 0) * (MTYPE)(m >> 0); \ | 254 | versal_create_uarts(s, pic); |
119 | + sum += (NTYPE)(n >> 16) * (MTYPE)(m >> 16); \ | 255 | + versal_create_canfds(s, pic); |
120 | + sum += (NTYPE)(n >> 32) * (MTYPE)(m >> 32); \ | 256 | versal_create_usbs(s, pic); |
121 | + sum += (NTYPE)(n >> 48) * (MTYPE)(m >> 48); \ | 257 | versal_create_gems(s, pic); |
122 | + return neg ? a - sum : a + sum; \ | 258 | versal_create_admas(s, pic); |
123 | +} | 259 | @@ -XXX,XX +XXX,XX @@ static void versal_init(Object *obj) |
124 | + | 260 | static Property versal_properties[] = { |
125 | +DEF_IMOP_32(smopa_s, int8_t, int8_t) | 261 | DEFINE_PROP_LINK("ddr", Versal, cfg.mr_ddr, TYPE_MEMORY_REGION, |
126 | +DEF_IMOP_32(umopa_s, uint8_t, uint8_t) | 262 | MemoryRegion *), |
127 | +DEF_IMOP_32(sumopa_s, int8_t, uint8_t) | 263 | + DEFINE_PROP_LINK("canbus0", Versal, lpd.iou.canbus[0], |
128 | +DEF_IMOP_32(usmopa_s, uint8_t, int8_t) | 264 | + TYPE_CAN_BUS, CanBusState *), |
129 | + | 265 | + DEFINE_PROP_LINK("canbus1", Versal, lpd.iou.canbus[1], |
130 | +DEF_IMOP_64(smopa_d, int16_t, int16_t) | 266 | + TYPE_CAN_BUS, CanBusState *), |
131 | +DEF_IMOP_64(umopa_d, uint16_t, uint16_t) | 267 | DEFINE_PROP_END_OF_LIST() |
132 | +DEF_IMOP_64(sumopa_d, int16_t, uint16_t) | 268 | }; |
133 | +DEF_IMOP_64(usmopa_d, uint16_t, int16_t) | 269 | |
134 | + | ||
135 | +#define DEF_IMOPH(NAME) \ | ||
136 | + void HELPER(sme_##NAME)(void *vza, void *vzn, void *vzm, void *vpn, \ | ||
137 | + void *vpm, uint32_t desc) \ | ||
138 | + { do_imopa(vza, vzn, vzm, vpn, vpm, desc, NAME); } | ||
139 | + | ||
140 | +DEF_IMOPH(smopa_s) | ||
141 | +DEF_IMOPH(umopa_s) | ||
142 | +DEF_IMOPH(sumopa_s) | ||
143 | +DEF_IMOPH(usmopa_s) | ||
144 | +DEF_IMOPH(smopa_d) | ||
145 | +DEF_IMOPH(umopa_d) | ||
146 | +DEF_IMOPH(sumopa_d) | ||
147 | +DEF_IMOPH(usmopa_d) | ||
148 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | ||
149 | index XXXXXXX..XXXXXXX 100644 | ||
150 | --- a/target/arm/translate-sme.c | ||
151 | +++ b/target/arm/translate-sme.c | ||
152 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_f | ||
153 | |||
154 | /* TODO: FEAT_EBF16 */ | ||
155 | TRANS_FEAT(BFMOPA, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_bfmopa) | ||
156 | + | ||
157 | +TRANS_FEAT(SMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_smopa_s) | ||
158 | +TRANS_FEAT(UMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_umopa_s) | ||
159 | +TRANS_FEAT(SUMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_sumopa_s) | ||
160 | +TRANS_FEAT(USMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_usmopa_s) | ||
161 | + | ||
162 | +TRANS_FEAT(SMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_smopa_d) | ||
163 | +TRANS_FEAT(UMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_umopa_d) | ||
164 | +TRANS_FEAT(SUMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_sumopa_d) | ||
165 | +TRANS_FEAT(USMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_usmopa_d) | ||
166 | -- | 270 | -- |
167 | 2.25.1 | 271 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Vikram Garhwal <vikram.garhwal@amd.com> |
---|---|---|---|
2 | 2 | ||
3 | There's no reason to set CPACR_EL1.ZEN if SVE disabled. | 3 | Signed-off-by: Vikram Garhwal <vikram.garhwal@amd.com> |
4 | |||
5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 5 | Reviewed-by: Francisco Iglesias <frasse.iglesias@gmail.com> |
7 | Message-id: 20220708151540.18136-44-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 7 | --- |
10 | target/arm/cpu.c | 7 +++---- | 8 | MAINTAINERS | 2 +- |
11 | 1 file changed, 3 insertions(+), 4 deletions(-) | 9 | 1 file changed, 1 insertion(+), 1 deletion(-) |
12 | 10 | ||
13 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | 11 | diff --git a/MAINTAINERS b/MAINTAINERS |
14 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/cpu.c | 13 | --- a/MAINTAINERS |
16 | +++ b/target/arm/cpu.c | 14 | +++ b/MAINTAINERS |
17 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(DeviceState *dev) | 15 | @@ -XXX,XX +XXX,XX @@ M: Francisco Iglesias <francisco.iglesias@amd.com> |
18 | /* and to the FP/Neon instructions */ | 16 | S: Maintained |
19 | env->cp15.cpacr_el1 = FIELD_DP64(env->cp15.cpacr_el1, | 17 | F: hw/net/can/xlnx-* |
20 | CPACR_EL1, FPEN, 3); | 18 | F: include/hw/net/xlnx-* |
21 | - /* and to the SVE instructions */ | 19 | -F: tests/qtest/xlnx-can-test* |
22 | - env->cp15.cpacr_el1 = FIELD_DP64(env->cp15.cpacr_el1, | 20 | +F: tests/qtest/xlnx-can*-test* |
23 | - CPACR_EL1, ZEN, 3); | 21 | |
24 | - /* with reasonable vector length */ | 22 | EDU |
25 | + /* and to the SVE instructions, with default vector length */ | 23 | M: Jiri Slaby <jslaby@suse.cz> |
26 | if (cpu_isar_feature(aa64_sve, cpu)) { | ||
27 | + env->cp15.cpacr_el1 = FIELD_DP64(env->cp15.cpacr_el1, | ||
28 | + CPACR_EL1, ZEN, 3); | ||
29 | env->vfp.zcr_el[1] = cpu->sve_default_vq - 1; | ||
30 | } | ||
31 | /* | ||
32 | -- | 24 | -- |
33 | 2.25.1 | 25 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Vikram Garhwal <vikram.garhwal@amd.com> |
---|---|---|---|
2 | 2 | ||
3 | Add "sve" to the sve prctl functions, to distinguish | 3 | The QTests perform three tests on the Xilinx VERSAL CANFD controller: |
4 | them from the coming "sme" prctls with similar names. | 4 | Tests the CANFD controllers in loopback. |
5 | Tests the CANFD controllers in normal mode with CAN frame. | ||
6 | Tests the CANFD controllers in normal mode with CANFD frame. | ||
5 | 7 | ||
8 | Signed-off-by: Vikram Garhwal <vikram.garhwal@amd.com> | ||
9 | Acked-by: Thomas Huth <thuth@redhat.com> | ||
10 | Reviewed-by: Francisco Iglesias <francisco.iglesias@amd.com> | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20220708151540.18136-42-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 13 | --- |
11 | linux-user/aarch64/target_prctl.h | 8 ++++---- | 14 | tests/qtest/xlnx-canfd-test.c | 423 ++++++++++++++++++++++++++++++++++ |
12 | linux-user/syscall.c | 12 ++++++------ | 15 | tests/qtest/meson.build | 1 + |
13 | 2 files changed, 10 insertions(+), 10 deletions(-) | 16 | 2 files changed, 424 insertions(+) |
17 | create mode 100644 tests/qtest/xlnx-canfd-test.c | ||
14 | 18 | ||
15 | diff --git a/linux-user/aarch64/target_prctl.h b/linux-user/aarch64/target_prctl.h | 19 | diff --git a/tests/qtest/xlnx-canfd-test.c b/tests/qtest/xlnx-canfd-test.c |
20 | new file mode 100644 | ||
21 | index XXXXXXX..XXXXXXX | ||
22 | --- /dev/null | ||
23 | +++ b/tests/qtest/xlnx-canfd-test.c | ||
24 | @@ -XXX,XX +XXX,XX @@ | ||
25 | +/* | ||
26 | + * SPDX-License-Identifier: MIT | ||
27 | + * | ||
28 | + * QTests for the Xilinx Versal CANFD controller. | ||
29 | + * | ||
30 | + * Copyright (c) 2022 AMD Inc. | ||
31 | + * | ||
32 | + * Written-by: Vikram Garhwal<vikram.garhwal@amd.com> | ||
33 | + * | ||
34 | + * Permission is hereby granted, free of charge, to any person obtaining a copy | ||
35 | + * of this software and associated documentation files (the "Software"), to deal | ||
36 | + * in the Software without restriction, including without limitation the rights | ||
37 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
38 | + * copies of the Software, and to permit persons to whom the Software is | ||
39 | + * furnished to do so, subject to the following conditions: | ||
40 | + * | ||
41 | + * The above copyright notice and this permission notice shall be included in | ||
42 | + * all copies or substantial portions of the Software. | ||
43 | + * | ||
44 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
45 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
46 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | ||
47 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
48 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
49 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
50 | + * THE SOFTWARE. | ||
51 | + */ | ||
52 | + | ||
53 | +#include "qemu/osdep.h" | ||
54 | +#include "libqtest.h" | ||
55 | + | ||
56 | +/* Base address. */ | ||
57 | +#define CANFD0_BASE_ADDR 0xff060000 | ||
58 | +#define CANFD1_BASE_ADDR 0xff070000 | ||
59 | + | ||
60 | +/* Register addresses. */ | ||
61 | +#define R_SRR_OFFSET 0x00 | ||
62 | +#define R_MSR_OFFSET 0x04 | ||
63 | +#define R_FILTER_CONTROL_REGISTER 0xe0 | ||
64 | +#define R_SR_OFFSET 0x18 | ||
65 | +#define R_ISR_OFFSET 0x1c | ||
66 | +#define R_IER_OFFSET 0x20 | ||
67 | +#define R_ICR_OFFSET 0x24 | ||
68 | +#define R_TX_READY_REQ_REGISTER 0x90 | ||
69 | +#define RX_FIFO_STATUS_REGISTER 0xe8 | ||
70 | +#define R_TXID_OFFSET 0x100 | ||
71 | +#define R_TXDLC_OFFSET 0x104 | ||
72 | +#define R_TXDATA1_OFFSET 0x108 | ||
73 | +#define R_TXDATA2_OFFSET 0x10c | ||
74 | +#define R_AFMR_REGISTER0 0xa00 | ||
75 | +#define R_AFIR_REGISTER0 0xa04 | ||
76 | +#define R_RX0_ID_OFFSET 0x2100 | ||
77 | +#define R_RX0_DLC_OFFSET 0x2104 | ||
78 | +#define R_RX0_DATA1_OFFSET 0x2108 | ||
79 | +#define R_RX0_DATA2_OFFSET 0x210c | ||
80 | + | ||
81 | +/* CANFD modes. */ | ||
82 | +#define SRR_CONFIG_MODE 0x00 | ||
83 | +#define MSR_NORMAL_MODE 0x00 | ||
84 | +#define MSR_LOOPBACK_MODE (1 << 1) | ||
85 | +#define ENABLE_CANFD (1 << 1) | ||
86 | + | ||
87 | +/* CANFD status. */ | ||
88 | +#define STATUS_CONFIG_MODE (1 << 0) | ||
89 | +#define STATUS_NORMAL_MODE (1 << 3) | ||
90 | +#define STATUS_LOOPBACK_MODE (1 << 1) | ||
91 | +#define ISR_TXOK (1 << 1) | ||
92 | +#define ISR_RXOK (1 << 4) | ||
93 | + | ||
94 | +#define ENABLE_ALL_FILTERS 0xffffffff | ||
95 | +#define ENABLE_ALL_INTERRUPTS 0xffffffff | ||
96 | + | ||
97 | +/* We are sending one canfd message. */ | ||
98 | +#define TX_READY_REG_VAL 0x1 | ||
99 | + | ||
100 | +#define FIRST_RX_STORE_INDEX 0x1 | ||
101 | +#define STATUS_REG_MASK 0xf | ||
102 | +#define DLC_FD_BIT_SHIFT 0x1b | ||
103 | +#define DLC_FD_BIT_MASK 0xf8000000 | ||
104 | +#define FIFO_STATUS_READ_INDEX_MASK 0x3f | ||
105 | +#define FIFO_STATUS_FILL_LEVEL_MASK 0x7f00 | ||
106 | +#define FILL_LEVEL_SHIFT 0x8 | ||
107 | + | ||
108 | +/* CANFD frame size ID, DLC and 16 DATA word. */ | ||
109 | +#define CANFD_FRAME_SIZE 18 | ||
110 | +/* CAN frame size ID, DLC and 2 DATA word. */ | ||
111 | +#define CAN_FRAME_SIZE 4 | ||
112 | + | ||
113 | +/* Set the filters for CANFD controller. */ | ||
114 | +static void enable_filters(QTestState *qts) | ||
115 | +{ | ||
116 | + const uint32_t arr_afmr[32] = { 0xb423deaa, 0xa2a40bdc, 0x1b64f486, | ||
117 | + 0x95c0d4ee, 0xe0c44528, 0x4b407904, | ||
118 | + 0xd2673f46, 0x9fc638d6, 0x8844f3d8, | ||
119 | + 0xa607d1e8, 0x67871bf4, 0xc2557dc, | ||
120 | + 0x9ea5b53e, 0x3643c0cc, 0x5a05ea8e, | ||
121 | + 0x83a46d84, 0x4a25c2b8, 0x93a66008, | ||
122 | + 0x2e467470, 0xedc66118, 0x9086f9f2, | ||
123 | + 0xfa23dd36, 0xb6654b90, 0xb221b8ca, | ||
124 | + 0x3467d1e2, 0xa3a55542, 0x5b26a012, | ||
125 | + 0x2281ea7e, 0xcea0ece8, 0xdc61e588, | ||
126 | + 0x2e5676a, 0x16821320 }; | ||
127 | + | ||
128 | + const uint32_t arr_afir[32] = { 0xa833dfa1, 0x255a477e, 0x3a4bb1c5, | ||
129 | + 0x8f560a6c, 0x27f38903, 0x2fecec4d, | ||
130 | + 0xa014c66d, 0xec289b8, 0x7e52dead, | ||
131 | + 0x82e94f3c, 0xcf3e3c5c, 0x66059871, | ||
132 | + 0x3f213df4, 0x25ac3959, 0xa12e9bef, | ||
133 | + 0xa3ad3af, 0xbafd7fe, 0xb3cb40fd, | ||
134 | + 0x5d9caa81, 0x2ed61902, 0x7cd64a0, | ||
135 | + 0x4b1fa538, 0x9b5ced8c, 0x150de059, | ||
136 | + 0xd2794227, 0x635e820a, 0xbb6b02cf, | ||
137 | + 0xbb58176, 0x570025bb, 0xa78d9658, | ||
138 | + 0x49d735df, 0xe5399d2f }; | ||
139 | + | ||
140 | + /* Passing the respective array values to all the AFMR and AFIR pairs. */ | ||
141 | + for (int i = 0; i < 32; i++) { | ||
142 | + /* For CANFD0. */ | ||
143 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_AFMR_REGISTER0 + 8 * i, | ||
144 | + arr_afmr[i]); | ||
145 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_AFIR_REGISTER0 + 8 * i, | ||
146 | + arr_afir[i]); | ||
147 | + | ||
148 | + /* For CANFD1. */ | ||
149 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_AFMR_REGISTER0 + 8 * i, | ||
150 | + arr_afmr[i]); | ||
151 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_AFIR_REGISTER0 + 8 * i, | ||
152 | + arr_afir[i]); | ||
153 | + } | ||
154 | + | ||
155 | + /* Enable all the pairs from AFR register. */ | ||
156 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_FILTER_CONTROL_REGISTER, | ||
157 | + ENABLE_ALL_FILTERS); | ||
158 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_FILTER_CONTROL_REGISTER, | ||
159 | + ENABLE_ALL_FILTERS); | ||
160 | +} | ||
161 | + | ||
162 | +static void configure_canfd(QTestState *qts, uint8_t mode) | ||
163 | +{ | ||
164 | + uint32_t status = 0; | ||
165 | + | ||
166 | + /* Put CANFD0 and CANFD1 in config mode. */ | ||
167 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_SRR_OFFSET, SRR_CONFIG_MODE); | ||
168 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_SRR_OFFSET, SRR_CONFIG_MODE); | ||
169 | + | ||
170 | + /* Write mode of operation in Mode select register. */ | ||
171 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_MSR_OFFSET, mode); | ||
172 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_MSR_OFFSET, mode); | ||
173 | + | ||
174 | + enable_filters(qts); | ||
175 | + | ||
176 | + /* Check here if CANFD0 and CANFD1 are in config mode. */ | ||
177 | + status = qtest_readl(qts, CANFD0_BASE_ADDR + R_SR_OFFSET); | ||
178 | + status = status & STATUS_REG_MASK; | ||
179 | + g_assert_cmpint(status, ==, STATUS_CONFIG_MODE); | ||
180 | + | ||
181 | + status = qtest_readl(qts, CANFD1_BASE_ADDR + R_SR_OFFSET); | ||
182 | + status = status & STATUS_REG_MASK; | ||
183 | + g_assert_cmpint(status, ==, STATUS_CONFIG_MODE); | ||
184 | + | ||
185 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_IER_OFFSET, ENABLE_ALL_INTERRUPTS); | ||
186 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_IER_OFFSET, ENABLE_ALL_INTERRUPTS); | ||
187 | + | ||
188 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_SRR_OFFSET, ENABLE_CANFD); | ||
189 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_SRR_OFFSET, ENABLE_CANFD); | ||
190 | +} | ||
191 | + | ||
192 | +static void generate_random_data(uint32_t *buf_tx, bool is_canfd_frame) | ||
193 | +{ | ||
194 | + /* Generate random TX data for CANFD frame. */ | ||
195 | + if (is_canfd_frame) { | ||
196 | + for (int i = 0; i < CANFD_FRAME_SIZE - 2; i++) { | ||
197 | + buf_tx[2 + i] = rand(); | ||
198 | + } | ||
199 | + } else { | ||
200 | + /* Generate random TX data for CAN frame. */ | ||
201 | + for (int i = 0; i < CAN_FRAME_SIZE - 2; i++) { | ||
202 | + buf_tx[2 + i] = rand(); | ||
203 | + } | ||
204 | + } | ||
205 | +} | ||
206 | + | ||
207 | +static void read_data(QTestState *qts, uint64_t can_base_addr, uint32_t *buf_rx) | ||
208 | +{ | ||
209 | + uint32_t int_status; | ||
210 | + uint32_t fifo_status_reg_value; | ||
211 | + /* At which RX FIFO the received data is stored. */ | ||
212 | + uint8_t store_ind = 0; | ||
213 | + bool is_canfd_frame = false; | ||
214 | + | ||
215 | + /* Read the interrupt on CANFD rx. */ | ||
216 | + int_status = qtest_readl(qts, can_base_addr + R_ISR_OFFSET) & ISR_RXOK; | ||
217 | + | ||
218 | + g_assert_cmpint(int_status, ==, ISR_RXOK); | ||
219 | + | ||
220 | + /* Find the fill level and read index. */ | ||
221 | + fifo_status_reg_value = qtest_readl(qts, can_base_addr + | ||
222 | + RX_FIFO_STATUS_REGISTER); | ||
223 | + | ||
224 | + store_ind = (fifo_status_reg_value & FIFO_STATUS_READ_INDEX_MASK) + | ||
225 | + ((fifo_status_reg_value & FIFO_STATUS_FILL_LEVEL_MASK) >> | ||
226 | + FILL_LEVEL_SHIFT); | ||
227 | + | ||
228 | + g_assert_cmpint(store_ind, ==, FIRST_RX_STORE_INDEX); | ||
229 | + | ||
230 | + /* Read the RX register data for CANFD. */ | ||
231 | + buf_rx[0] = qtest_readl(qts, can_base_addr + R_RX0_ID_OFFSET); | ||
232 | + buf_rx[1] = qtest_readl(qts, can_base_addr + R_RX0_DLC_OFFSET); | ||
233 | + | ||
234 | + is_canfd_frame = (buf_rx[1] >> DLC_FD_BIT_SHIFT) & 1; | ||
235 | + | ||
236 | + if (is_canfd_frame) { | ||
237 | + for (int i = 0; i < CANFD_FRAME_SIZE - 2; i++) { | ||
238 | + buf_rx[i + 2] = qtest_readl(qts, | ||
239 | + can_base_addr + R_RX0_DATA1_OFFSET + 4 * i); | ||
240 | + } | ||
241 | + } else { | ||
242 | + buf_rx[2] = qtest_readl(qts, can_base_addr + R_RX0_DATA1_OFFSET); | ||
243 | + buf_rx[3] = qtest_readl(qts, can_base_addr + R_RX0_DATA2_OFFSET); | ||
244 | + } | ||
245 | + | ||
246 | + /* Clear the RX interrupt. */ | ||
247 | + qtest_writel(qts, CANFD1_BASE_ADDR + R_ICR_OFFSET, ISR_RXOK); | ||
248 | +} | ||
249 | + | ||
250 | +static void write_data(QTestState *qts, uint64_t can_base_addr, | ||
251 | + const uint32_t *buf_tx, bool is_canfd_frame) | ||
252 | +{ | ||
253 | + /* Write the TX register data for CANFD. */ | ||
254 | + qtest_writel(qts, can_base_addr + R_TXID_OFFSET, buf_tx[0]); | ||
255 | + qtest_writel(qts, can_base_addr + R_TXDLC_OFFSET, buf_tx[1]); | ||
256 | + | ||
257 | + if (is_canfd_frame) { | ||
258 | + for (int i = 0; i < CANFD_FRAME_SIZE - 2; i++) { | ||
259 | + qtest_writel(qts, can_base_addr + R_TXDATA1_OFFSET + 4 * i, | ||
260 | + buf_tx[2 + i]); | ||
261 | + } | ||
262 | + } else { | ||
263 | + qtest_writel(qts, can_base_addr + R_TXDATA1_OFFSET, buf_tx[2]); | ||
264 | + qtest_writel(qts, can_base_addr + R_TXDATA2_OFFSET, buf_tx[3]); | ||
265 | + } | ||
266 | +} | ||
267 | + | ||
268 | +static void send_data(QTestState *qts, uint64_t can_base_addr) | ||
269 | +{ | ||
270 | + uint32_t int_status; | ||
271 | + | ||
272 | + qtest_writel(qts, can_base_addr + R_TX_READY_REQ_REGISTER, | ||
273 | + TX_READY_REG_VAL); | ||
274 | + | ||
275 | + /* Read the interrupt on CANFD for tx. */ | ||
276 | + int_status = qtest_readl(qts, can_base_addr + R_ISR_OFFSET) & ISR_TXOK; | ||
277 | + | ||
278 | + g_assert_cmpint(int_status, ==, ISR_TXOK); | ||
279 | + | ||
280 | + /* Clear the interrupt for tx. */ | ||
281 | + qtest_writel(qts, CANFD0_BASE_ADDR + R_ICR_OFFSET, ISR_TXOK); | ||
282 | +} | ||
283 | + | ||
284 | +static void match_rx_tx_data(const uint32_t *buf_tx, const uint32_t *buf_rx, | ||
285 | + bool is_canfd_frame) | ||
286 | +{ | ||
287 | + uint16_t size = 0; | ||
288 | + uint8_t len = CAN_FRAME_SIZE; | ||
289 | + | ||
290 | + if (is_canfd_frame) { | ||
291 | + len = CANFD_FRAME_SIZE; | ||
292 | + } | ||
293 | + | ||
294 | + while (size < len) { | ||
295 | + if (R_RX0_ID_OFFSET + 4 * size == R_RX0_DLC_OFFSET) { | ||
296 | + g_assert_cmpint((buf_rx[size] & DLC_FD_BIT_MASK), ==, | ||
297 | + (buf_tx[size] & DLC_FD_BIT_MASK)); | ||
298 | + } else { | ||
299 | + if (!is_canfd_frame && size == 4) { | ||
300 | + break; | ||
301 | + } | ||
302 | + | ||
303 | + g_assert_cmpint(buf_rx[size], ==, buf_tx[size]); | ||
304 | + } | ||
305 | + | ||
306 | + size++; | ||
307 | + } | ||
308 | +} | ||
309 | +/* | ||
310 | + * Xilinx CANFD supports both CAN and CANFD frames. This test will be | ||
311 | + * transferring CAN frame i.e. 8 bytes of data from CANFD0 and CANFD1 through | ||
312 | + * canbus. CANFD0 initiate the data transfer to can-bus, CANFD1 receives the | ||
313 | + * data. Test compares the can frame data sent from CANFD0 and received on | ||
314 | + * CANFD1. | ||
315 | + */ | ||
316 | +static void test_can_data_transfer(void) | ||
317 | +{ | ||
318 | + uint32_t buf_tx[CAN_FRAME_SIZE] = { 0x5a5bb9a4, 0x80000000, | ||
319 | + 0x12345678, 0x87654321 }; | ||
320 | + uint32_t buf_rx[CAN_FRAME_SIZE] = { 0x00, 0x00, 0x00, 0x00 }; | ||
321 | + uint32_t status = 0; | ||
322 | + | ||
323 | + generate_random_data(buf_tx, false); | ||
324 | + | ||
325 | + QTestState *qts = qtest_init("-machine xlnx-versal-virt" | ||
326 | + " -object can-bus,id=canbus" | ||
327 | + " -machine canbus0=canbus" | ||
328 | + " -machine canbus1=canbus" | ||
329 | + ); | ||
330 | + | ||
331 | + configure_canfd(qts, MSR_NORMAL_MODE); | ||
332 | + | ||
333 | + /* Check if CANFD0 and CANFD1 are in Normal mode. */ | ||
334 | + status = qtest_readl(qts, CANFD0_BASE_ADDR + R_SR_OFFSET); | ||
335 | + status = status & STATUS_REG_MASK; | ||
336 | + g_assert_cmpint(status, ==, STATUS_NORMAL_MODE); | ||
337 | + | ||
338 | + status = qtest_readl(qts, CANFD1_BASE_ADDR + R_SR_OFFSET); | ||
339 | + status = status & STATUS_REG_MASK; | ||
340 | + g_assert_cmpint(status, ==, STATUS_NORMAL_MODE); | ||
341 | + | ||
342 | + write_data(qts, CANFD0_BASE_ADDR, buf_tx, false); | ||
343 | + | ||
344 | + send_data(qts, CANFD0_BASE_ADDR); | ||
345 | + read_data(qts, CANFD1_BASE_ADDR, buf_rx); | ||
346 | + match_rx_tx_data(buf_tx, buf_rx, false); | ||
347 | + | ||
348 | + qtest_quit(qts); | ||
349 | +} | ||
350 | + | ||
351 | +/* | ||
352 | + * This test will be transferring CANFD frame i.e. 64 bytes of data from CANFD0 | ||
353 | + * and CANFD1 through canbus. CANFD0 initiate the data transfer to can-bus, | ||
354 | + * CANFD1 receives the data. Test compares the CANFD frame data sent from CANFD0 | ||
355 | + * with received on CANFD1. | ||
356 | + */ | ||
357 | +static void test_canfd_data_transfer(void) | ||
358 | +{ | ||
359 | + uint32_t buf_tx[CANFD_FRAME_SIZE] = { 0x5a5bb9a4, 0xf8000000 }; | ||
360 | + uint32_t buf_rx[CANFD_FRAME_SIZE] = { 0x00, 0x00, 0x00, 0x00 }; | ||
361 | + uint32_t status = 0; | ||
362 | + | ||
363 | + generate_random_data(buf_tx, true); | ||
364 | + | ||
365 | + QTestState *qts = qtest_init("-machine xlnx-versal-virt" | ||
366 | + " -object can-bus,id=canbus" | ||
367 | + " -machine canbus0=canbus" | ||
368 | + " -machine canbus1=canbus" | ||
369 | + ); | ||
370 | + | ||
371 | + configure_canfd(qts, MSR_NORMAL_MODE); | ||
372 | + | ||
373 | + /* Check if CANFD0 and CANFD1 are in Normal mode. */ | ||
374 | + status = qtest_readl(qts, CANFD0_BASE_ADDR + R_SR_OFFSET); | ||
375 | + status = status & STATUS_REG_MASK; | ||
376 | + g_assert_cmpint(status, ==, STATUS_NORMAL_MODE); | ||
377 | + | ||
378 | + status = qtest_readl(qts, CANFD1_BASE_ADDR + R_SR_OFFSET); | ||
379 | + status = status & STATUS_REG_MASK; | ||
380 | + g_assert_cmpint(status, ==, STATUS_NORMAL_MODE); | ||
381 | + | ||
382 | + write_data(qts, CANFD0_BASE_ADDR, buf_tx, true); | ||
383 | + | ||
384 | + send_data(qts, CANFD0_BASE_ADDR); | ||
385 | + read_data(qts, CANFD1_BASE_ADDR, buf_rx); | ||
386 | + match_rx_tx_data(buf_tx, buf_rx, true); | ||
387 | + | ||
388 | + qtest_quit(qts); | ||
389 | +} | ||
390 | + | ||
391 | +/* | ||
392 | + * This test is performing loopback mode on CANFD0 and CANFD1. Data sent from | ||
393 | + * TX of each CANFD0 and CANFD1 are compared with RX register data for | ||
394 | + * respective CANFD Controller. | ||
395 | + */ | ||
396 | +static void test_can_loopback(void) | ||
397 | +{ | ||
398 | + uint32_t buf_tx[CANFD_FRAME_SIZE] = { 0x5a5bb9a4, 0xf8000000 }; | ||
399 | + uint32_t buf_rx[CANFD_FRAME_SIZE] = { 0x00, 0x00, 0x00, 0x00 }; | ||
400 | + uint32_t status = 0; | ||
401 | + | ||
402 | + generate_random_data(buf_tx, true); | ||
403 | + | ||
404 | + QTestState *qts = qtest_init("-machine xlnx-versal-virt" | ||
405 | + " -object can-bus,id=canbus" | ||
406 | + " -machine canbus0=canbus" | ||
407 | + " -machine canbus1=canbus" | ||
408 | + ); | ||
409 | + | ||
410 | + configure_canfd(qts, MSR_LOOPBACK_MODE); | ||
411 | + | ||
412 | + /* Check if CANFD0 and CANFD1 are set in correct loopback mode. */ | ||
413 | + status = qtest_readl(qts, CANFD0_BASE_ADDR + R_SR_OFFSET); | ||
414 | + status = status & STATUS_REG_MASK; | ||
415 | + g_assert_cmpint(status, ==, STATUS_LOOPBACK_MODE); | ||
416 | + | ||
417 | + status = qtest_readl(qts, CANFD1_BASE_ADDR + R_SR_OFFSET); | ||
418 | + status = status & STATUS_REG_MASK; | ||
419 | + g_assert_cmpint(status, ==, STATUS_LOOPBACK_MODE); | ||
420 | + | ||
421 | + write_data(qts, CANFD0_BASE_ADDR, buf_tx, true); | ||
422 | + | ||
423 | + send_data(qts, CANFD0_BASE_ADDR); | ||
424 | + read_data(qts, CANFD0_BASE_ADDR, buf_rx); | ||
425 | + match_rx_tx_data(buf_tx, buf_rx, true); | ||
426 | + | ||
427 | + generate_random_data(buf_tx, true); | ||
428 | + | ||
429 | + write_data(qts, CANFD1_BASE_ADDR, buf_tx, true); | ||
430 | + | ||
431 | + send_data(qts, CANFD1_BASE_ADDR); | ||
432 | + read_data(qts, CANFD1_BASE_ADDR, buf_rx); | ||
433 | + match_rx_tx_data(buf_tx, buf_rx, true); | ||
434 | + | ||
435 | + qtest_quit(qts); | ||
436 | +} | ||
437 | + | ||
438 | +int main(int argc, char **argv) | ||
439 | +{ | ||
440 | + g_test_init(&argc, &argv, NULL); | ||
441 | + | ||
442 | + qtest_add_func("/net/canfd/can_data_transfer", test_can_data_transfer); | ||
443 | + qtest_add_func("/net/canfd/canfd_data_transfer", test_canfd_data_transfer); | ||
444 | + qtest_add_func("/net/canfd/can_loopback", test_can_loopback); | ||
445 | + | ||
446 | + return g_test_run(); | ||
447 | +} | ||
448 | diff --git a/tests/qtest/meson.build b/tests/qtest/meson.build | ||
16 | index XXXXXXX..XXXXXXX 100644 | 449 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/linux-user/aarch64/target_prctl.h | 450 | --- a/tests/qtest/meson.build |
18 | +++ b/linux-user/aarch64/target_prctl.h | 451 | +++ b/tests/qtest/meson.build |
19 | @@ -XXX,XX +XXX,XX @@ | 452 | @@ -XXX,XX +XXX,XX @@ qtests_aarch64 = \ |
20 | #ifndef AARCH64_TARGET_PRCTL_H | 453 | (config_all.has_key('CONFIG_TCG') and config_all_devices.has_key('CONFIG_TPM_TIS_SYSBUS') ? \ |
21 | #define AARCH64_TARGET_PRCTL_H | 454 | ['tpm-tis-device-test', 'tpm-tis-device-swtpm-test'] : []) + \ |
22 | 455 | (config_all_devices.has_key('CONFIG_XLNX_ZYNQMP_ARM') ? ['xlnx-can-test', 'fuzz-xlnx-dp-test'] : []) + \ | |
23 | -static abi_long do_prctl_get_vl(CPUArchState *env) | 456 | + (config_all_devices.has_key('CONFIG_XLNX_VERSAL') ? ['xlnx-canfd-test'] : []) + \ |
24 | +static abi_long do_prctl_sve_get_vl(CPUArchState *env) | 457 | (config_all_devices.has_key('CONFIG_RASPI') ? ['bcm2835-dma-test'] : []) + \ |
25 | { | 458 | (config_all.has_key('CONFIG_TCG') and \ |
26 | ARMCPU *cpu = env_archcpu(env); | 459 | config_all_devices.has_key('CONFIG_TPM_TIS_I2C') ? ['tpm-tis-i2c-test'] : []) + \ |
27 | if (cpu_isar_feature(aa64_sve, cpu)) { | ||
28 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_get_vl(CPUArchState *env) | ||
29 | } | ||
30 | return -TARGET_EINVAL; | ||
31 | } | ||
32 | -#define do_prctl_get_vl do_prctl_get_vl | ||
33 | +#define do_prctl_sve_get_vl do_prctl_sve_get_vl | ||
34 | |||
35 | -static abi_long do_prctl_set_vl(CPUArchState *env, abi_long arg2) | ||
36 | +static abi_long do_prctl_sve_set_vl(CPUArchState *env, abi_long arg2) | ||
37 | { | ||
38 | /* | ||
39 | * We cannot support either PR_SVE_SET_VL_ONEXEC or PR_SVE_VL_INHERIT. | ||
40 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_set_vl(CPUArchState *env, abi_long arg2) | ||
41 | } | ||
42 | return -TARGET_EINVAL; | ||
43 | } | ||
44 | -#define do_prctl_set_vl do_prctl_set_vl | ||
45 | +#define do_prctl_sve_set_vl do_prctl_sve_set_vl | ||
46 | |||
47 | static abi_long do_prctl_reset_keys(CPUArchState *env, abi_long arg2) | ||
48 | { | ||
49 | diff --git a/linux-user/syscall.c b/linux-user/syscall.c | ||
50 | index XXXXXXX..XXXXXXX 100644 | ||
51 | --- a/linux-user/syscall.c | ||
52 | +++ b/linux-user/syscall.c | ||
53 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_inval1(CPUArchState *env, abi_long arg2) | ||
54 | #ifndef do_prctl_set_fp_mode | ||
55 | #define do_prctl_set_fp_mode do_prctl_inval1 | ||
56 | #endif | ||
57 | -#ifndef do_prctl_get_vl | ||
58 | -#define do_prctl_get_vl do_prctl_inval0 | ||
59 | +#ifndef do_prctl_sve_get_vl | ||
60 | +#define do_prctl_sve_get_vl do_prctl_inval0 | ||
61 | #endif | ||
62 | -#ifndef do_prctl_set_vl | ||
63 | -#define do_prctl_set_vl do_prctl_inval1 | ||
64 | +#ifndef do_prctl_sve_set_vl | ||
65 | +#define do_prctl_sve_set_vl do_prctl_inval1 | ||
66 | #endif | ||
67 | #ifndef do_prctl_reset_keys | ||
68 | #define do_prctl_reset_keys do_prctl_inval1 | ||
69 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl(CPUArchState *env, abi_long option, abi_long arg2, | ||
70 | case PR_SET_FP_MODE: | ||
71 | return do_prctl_set_fp_mode(env, arg2); | ||
72 | case PR_SVE_GET_VL: | ||
73 | - return do_prctl_get_vl(env); | ||
74 | + return do_prctl_sve_get_vl(env); | ||
75 | case PR_SVE_SET_VL: | ||
76 | - return do_prctl_set_vl(env, arg2); | ||
77 | + return do_prctl_sve_set_vl(env, arg2); | ||
78 | case PR_PAC_RESET_KEYS: | ||
79 | if (arg3 || arg4 || arg5) { | ||
80 | return -TARGET_EINVAL; | ||
81 | -- | 460 | -- |
82 | 2.25.1 | 461 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | These SME instructions are nominally within the SVE decode space, | 3 | Allwinner R40 (sun8i) SoC features a Quad-Core Cortex-A7 ARM CPU, |
4 | so we add them to sve.decode and translate-sve.c. | 4 | and a Mali400 MP2 GPU from ARM. It's also known as the Allwinner T3 |
5 | for In-Car Entertainment usage, A40i and A40pro are variants that | ||
6 | differ in applicable temperatures range (industrial and military). | ||
5 | 7 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 9 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> |
8 | Message-id: 20220708151540.18136-18-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | target/arm/translate-a64.h | 12 ++++++++++++ | 12 | include/hw/arm/allwinner-r40.h | 110 +++++++++ |
12 | target/arm/sve.decode | 5 ++++- | 13 | hw/arm/allwinner-r40.c | 415 +++++++++++++++++++++++++++++++++ |
13 | target/arm/translate-sve.c | 38 ++++++++++++++++++++++++++++++++++++++ | 14 | hw/arm/bananapi_m2u.c | 129 ++++++++++ |
14 | 3 files changed, 54 insertions(+), 1 deletion(-) | 15 | hw/arm/Kconfig | 10 + |
16 | hw/arm/meson.build | 1 + | ||
17 | 5 files changed, 665 insertions(+) | ||
18 | create mode 100644 include/hw/arm/allwinner-r40.h | ||
19 | create mode 100644 hw/arm/allwinner-r40.c | ||
20 | create mode 100644 hw/arm/bananapi_m2u.c | ||
15 | 21 | ||
16 | diff --git a/target/arm/translate-a64.h b/target/arm/translate-a64.h | 22 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
17 | index XXXXXXX..XXXXXXX 100644 | 23 | new file mode 100644 |
18 | --- a/target/arm/translate-a64.h | 24 | index XXXXXXX..XXXXXXX |
19 | +++ b/target/arm/translate-a64.h | 25 | --- /dev/null |
20 | @@ -XXX,XX +XXX,XX @@ static inline int vec_full_reg_size(DisasContext *s) | 26 | +++ b/include/hw/arm/allwinner-r40.h |
21 | return s->vl; | 27 | @@ -XXX,XX +XXX,XX @@ |
22 | } | 28 | +/* |
23 | 29 | + * Allwinner R40/A40i/T3 System on Chip emulation | |
24 | +/* Return the byte size of the vector register, SVL / 8. */ | 30 | + * |
25 | +static inline int streaming_vec_reg_size(DisasContext *s) | 31 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> |
32 | + * | ||
33 | + * This program is free software: you can redistribute it and/or modify | ||
34 | + * it under the terms of the GNU General Public License as published by | ||
35 | + * the Free Software Foundation, either version 2 of the License, or | ||
36 | + * (at your option) any later version. | ||
37 | + * | ||
38 | + * This program is distributed in the hope that it will be useful, | ||
39 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
40 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
41 | + * GNU General Public License for more details. | ||
42 | + * | ||
43 | + * You should have received a copy of the GNU General Public License | ||
44 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
45 | + */ | ||
46 | + | ||
47 | +#ifndef HW_ARM_ALLWINNER_R40_H | ||
48 | +#define HW_ARM_ALLWINNER_R40_H | ||
49 | + | ||
50 | +#include "qom/object.h" | ||
51 | +#include "hw/arm/boot.h" | ||
52 | +#include "hw/timer/allwinner-a10-pit.h" | ||
53 | +#include "hw/intc/arm_gic.h" | ||
54 | +#include "hw/sd/allwinner-sdhost.h" | ||
55 | +#include "target/arm/cpu.h" | ||
56 | +#include "sysemu/block-backend.h" | ||
57 | + | ||
58 | +enum { | ||
59 | + AW_R40_DEV_SRAM_A1, | ||
60 | + AW_R40_DEV_SRAM_A2, | ||
61 | + AW_R40_DEV_SRAM_A3, | ||
62 | + AW_R40_DEV_SRAM_A4, | ||
63 | + AW_R40_DEV_MMC0, | ||
64 | + AW_R40_DEV_MMC1, | ||
65 | + AW_R40_DEV_MMC2, | ||
66 | + AW_R40_DEV_MMC3, | ||
67 | + AW_R40_DEV_CCU, | ||
68 | + AW_R40_DEV_PIT, | ||
69 | + AW_R40_DEV_UART0, | ||
70 | + AW_R40_DEV_GIC_DIST, | ||
71 | + AW_R40_DEV_GIC_CPU, | ||
72 | + AW_R40_DEV_GIC_HYP, | ||
73 | + AW_R40_DEV_GIC_VCPU, | ||
74 | + AW_R40_DEV_SDRAM | ||
75 | +}; | ||
76 | + | ||
77 | +#define AW_R40_NUM_CPUS (4) | ||
78 | + | ||
79 | +/** | ||
80 | + * Allwinner R40 object model | ||
81 | + * @{ | ||
82 | + */ | ||
83 | + | ||
84 | +/** Object type for the Allwinner R40 SoC */ | ||
85 | +#define TYPE_AW_R40 "allwinner-r40" | ||
86 | + | ||
87 | +/** Convert input object to Allwinner R40 state object */ | ||
88 | +OBJECT_DECLARE_SIMPLE_TYPE(AwR40State, AW_R40) | ||
89 | + | ||
90 | +/** @} */ | ||
91 | + | ||
92 | +/** | ||
93 | + * Allwinner R40 object | ||
94 | + * | ||
95 | + * This struct contains the state of all the devices | ||
96 | + * which are currently emulated by the R40 SoC code. | ||
97 | + */ | ||
98 | +#define AW_R40_NUM_MMCS 4 | ||
99 | + | ||
100 | +struct AwR40State { | ||
101 | + /*< private >*/ | ||
102 | + DeviceState parent_obj; | ||
103 | + /*< public >*/ | ||
104 | + | ||
105 | + ARMCPU cpus[AW_R40_NUM_CPUS]; | ||
106 | + const hwaddr *memmap; | ||
107 | + AwA10PITState timer; | ||
108 | + AwSdHostState mmc[AW_R40_NUM_MMCS]; | ||
109 | + GICState gic; | ||
110 | + MemoryRegion sram_a1; | ||
111 | + MemoryRegion sram_a2; | ||
112 | + MemoryRegion sram_a3; | ||
113 | + MemoryRegion sram_a4; | ||
114 | +}; | ||
115 | + | ||
116 | +/** | ||
117 | + * Emulate Boot ROM firmware setup functionality. | ||
118 | + * | ||
119 | + * A real Allwinner R40 SoC contains a Boot ROM | ||
120 | + * which is the first code that runs right after | ||
121 | + * the SoC is powered on. The Boot ROM is responsible | ||
122 | + * for loading user code (e.g. a bootloader) from any | ||
123 | + * of the supported external devices and writing the | ||
124 | + * downloaded code to internal SRAM. After loading the SoC | ||
125 | + * begins executing the code written to SRAM. | ||
126 | + * | ||
127 | + * This function emulates the Boot ROM by copying 32 KiB | ||
128 | + * of data from the given block device and writes it to | ||
129 | + * the start of the first internal SRAM memory. | ||
130 | + * | ||
131 | + * @s: Allwinner R40 state object pointer | ||
132 | + * @blk: Block backend device object pointer | ||
133 | + * @unit: the mmc control's unit | ||
134 | + */ | ||
135 | +bool allwinner_r40_bootrom_setup(AwR40State *s, BlockBackend *blk, int unit); | ||
136 | + | ||
137 | +#endif /* HW_ARM_ALLWINNER_R40_H */ | ||
138 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
139 | new file mode 100644 | ||
140 | index XXXXXXX..XXXXXXX | ||
141 | --- /dev/null | ||
142 | +++ b/hw/arm/allwinner-r40.c | ||
143 | @@ -XXX,XX +XXX,XX @@ | ||
144 | +/* | ||
145 | + * Allwinner R40/A40i/T3 System on Chip emulation | ||
146 | + * | ||
147 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> | ||
148 | + * | ||
149 | + * This program is free software: you can redistribute it and/or modify | ||
150 | + * it under the terms of the GNU General Public License as published by | ||
151 | + * the Free Software Foundation, either version 2 of the License, or | ||
152 | + * (at your option) any later version. | ||
153 | + * | ||
154 | + * This program is distributed in the hope that it will be useful, | ||
155 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
156 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
157 | + * GNU General Public License for more details. | ||
158 | + * | ||
159 | + * You should have received a copy of the GNU General Public License | ||
160 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
161 | + */ | ||
162 | + | ||
163 | +#include "qemu/osdep.h" | ||
164 | +#include "qapi/error.h" | ||
165 | +#include "qemu/error-report.h" | ||
166 | +#include "qemu/bswap.h" | ||
167 | +#include "qemu/module.h" | ||
168 | +#include "qemu/units.h" | ||
169 | +#include "hw/qdev-core.h" | ||
170 | +#include "hw/sysbus.h" | ||
171 | +#include "hw/char/serial.h" | ||
172 | +#include "hw/misc/unimp.h" | ||
173 | +#include "hw/usb/hcd-ehci.h" | ||
174 | +#include "hw/loader.h" | ||
175 | +#include "sysemu/sysemu.h" | ||
176 | +#include "hw/arm/allwinner-r40.h" | ||
177 | + | ||
178 | +/* Memory map */ | ||
179 | +const hwaddr allwinner_r40_memmap[] = { | ||
180 | + [AW_R40_DEV_SRAM_A1] = 0x00000000, | ||
181 | + [AW_R40_DEV_SRAM_A2] = 0x00004000, | ||
182 | + [AW_R40_DEV_SRAM_A3] = 0x00008000, | ||
183 | + [AW_R40_DEV_SRAM_A4] = 0x0000b400, | ||
184 | + [AW_R40_DEV_MMC0] = 0x01c0f000, | ||
185 | + [AW_R40_DEV_MMC1] = 0x01c10000, | ||
186 | + [AW_R40_DEV_MMC2] = 0x01c11000, | ||
187 | + [AW_R40_DEV_MMC3] = 0x01c12000, | ||
188 | + [AW_R40_DEV_PIT] = 0x01c20c00, | ||
189 | + [AW_R40_DEV_UART0] = 0x01c28000, | ||
190 | + [AW_R40_DEV_GIC_DIST] = 0x01c81000, | ||
191 | + [AW_R40_DEV_GIC_CPU] = 0x01c82000, | ||
192 | + [AW_R40_DEV_GIC_HYP] = 0x01c84000, | ||
193 | + [AW_R40_DEV_GIC_VCPU] = 0x01c86000, | ||
194 | + [AW_R40_DEV_SDRAM] = 0x40000000 | ||
195 | +}; | ||
196 | + | ||
197 | +/* List of unimplemented devices */ | ||
198 | +struct AwR40Unimplemented { | ||
199 | + const char *device_name; | ||
200 | + hwaddr base; | ||
201 | + hwaddr size; | ||
202 | +}; | ||
203 | + | ||
204 | +static struct AwR40Unimplemented r40_unimplemented[] = { | ||
205 | + { "d-engine", 0x01000000, 4 * MiB }, | ||
206 | + { "d-inter", 0x01400000, 128 * KiB }, | ||
207 | + { "sram-c", 0x01c00000, 4 * KiB }, | ||
208 | + { "dma", 0x01c02000, 4 * KiB }, | ||
209 | + { "nfdc", 0x01c03000, 4 * KiB }, | ||
210 | + { "ts", 0x01c04000, 4 * KiB }, | ||
211 | + { "spi0", 0x01c05000, 4 * KiB }, | ||
212 | + { "spi1", 0x01c06000, 4 * KiB }, | ||
213 | + { "cs0", 0x01c09000, 4 * KiB }, | ||
214 | + { "keymem", 0x01c0a000, 4 * KiB }, | ||
215 | + { "emac", 0x01c0b000, 4 * KiB }, | ||
216 | + { "usb0-otg", 0x01c13000, 4 * KiB }, | ||
217 | + { "usb0-host", 0x01c14000, 4 * KiB }, | ||
218 | + { "crypto", 0x01c15000, 4 * KiB }, | ||
219 | + { "spi2", 0x01c17000, 4 * KiB }, | ||
220 | + { "sata", 0x01c18000, 4 * KiB }, | ||
221 | + { "usb1-host", 0x01c19000, 4 * KiB }, | ||
222 | + { "sid", 0x01c1b000, 4 * KiB }, | ||
223 | + { "usb2-host", 0x01c1c000, 4 * KiB }, | ||
224 | + { "cs1", 0x01c1d000, 4 * KiB }, | ||
225 | + { "spi3", 0x01c1f000, 4 * KiB }, | ||
226 | + { "ccu", 0x01c20000, 1 * KiB }, | ||
227 | + { "rtc", 0x01c20400, 1 * KiB }, | ||
228 | + { "pio", 0x01c20800, 1 * KiB }, | ||
229 | + { "owa", 0x01c21000, 1 * KiB }, | ||
230 | + { "ac97", 0x01c21400, 1 * KiB }, | ||
231 | + { "cir0", 0x01c21800, 1 * KiB }, | ||
232 | + { "cir1", 0x01c21c00, 1 * KiB }, | ||
233 | + { "pcm0", 0x01c22000, 1 * KiB }, | ||
234 | + { "pcm1", 0x01c22400, 1 * KiB }, | ||
235 | + { "pcm2", 0x01c22800, 1 * KiB }, | ||
236 | + { "audio", 0x01c22c00, 1 * KiB }, | ||
237 | + { "keypad", 0x01c23000, 1 * KiB }, | ||
238 | + { "pwm", 0x01c23400, 1 * KiB }, | ||
239 | + { "keyadc", 0x01c24400, 1 * KiB }, | ||
240 | + { "ths", 0x01c24c00, 1 * KiB }, | ||
241 | + { "rtp", 0x01c25000, 1 * KiB }, | ||
242 | + { "pmu", 0x01c25400, 1 * KiB }, | ||
243 | + { "cpu-cfg", 0x01c25c00, 1 * KiB }, | ||
244 | + { "uart0", 0x01c28000, 1 * KiB }, | ||
245 | + { "uart1", 0x01c28400, 1 * KiB }, | ||
246 | + { "uart2", 0x01c28800, 1 * KiB }, | ||
247 | + { "uart3", 0x01c28c00, 1 * KiB }, | ||
248 | + { "uart4", 0x01c29000, 1 * KiB }, | ||
249 | + { "uart5", 0x01c29400, 1 * KiB }, | ||
250 | + { "uart6", 0x01c29800, 1 * KiB }, | ||
251 | + { "uart7", 0x01c29c00, 1 * KiB }, | ||
252 | + { "ps20", 0x01c2a000, 1 * KiB }, | ||
253 | + { "ps21", 0x01c2a400, 1 * KiB }, | ||
254 | + { "twi0", 0x01c2ac00, 1 * KiB }, | ||
255 | + { "twi1", 0x01c2b000, 1 * KiB }, | ||
256 | + { "twi2", 0x01c2b400, 1 * KiB }, | ||
257 | + { "twi3", 0x01c2b800, 1 * KiB }, | ||
258 | + { "twi4", 0x01c2c000, 1 * KiB }, | ||
259 | + { "scr", 0x01c2c400, 1 * KiB }, | ||
260 | + { "tvd-top", 0x01c30000, 4 * KiB }, | ||
261 | + { "tvd0", 0x01c31000, 4 * KiB }, | ||
262 | + { "tvd1", 0x01c32000, 4 * KiB }, | ||
263 | + { "tvd2", 0x01c33000, 4 * KiB }, | ||
264 | + { "tvd3", 0x01c34000, 4 * KiB }, | ||
265 | + { "gpu", 0x01c40000, 64 * KiB }, | ||
266 | + { "gmac", 0x01c50000, 64 * KiB }, | ||
267 | + { "hstmr", 0x01c60000, 4 * KiB }, | ||
268 | + { "dram-com", 0x01c62000, 4 * KiB }, | ||
269 | + { "dram-ctl", 0x01c63000, 4 * KiB }, | ||
270 | + { "tcon-top", 0x01c70000, 4 * KiB }, | ||
271 | + { "lcd0", 0x01c71000, 4 * KiB }, | ||
272 | + { "lcd1", 0x01c72000, 4 * KiB }, | ||
273 | + { "tv0", 0x01c73000, 4 * KiB }, | ||
274 | + { "tv1", 0x01c74000, 4 * KiB }, | ||
275 | + { "tve-top", 0x01c90000, 16 * KiB }, | ||
276 | + { "tve0", 0x01c94000, 16 * KiB }, | ||
277 | + { "tve1", 0x01c98000, 16 * KiB }, | ||
278 | + { "mipi_dsi", 0x01ca0000, 4 * KiB }, | ||
279 | + { "mipi_dphy", 0x01ca1000, 4 * KiB }, | ||
280 | + { "ve", 0x01d00000, 1024 * KiB }, | ||
281 | + { "mp", 0x01e80000, 128 * KiB }, | ||
282 | + { "hdmi", 0x01ee0000, 128 * KiB }, | ||
283 | + { "prcm", 0x01f01400, 1 * KiB }, | ||
284 | + { "debug", 0x3f500000, 64 * KiB }, | ||
285 | + { "cpubist", 0x3f501000, 4 * KiB }, | ||
286 | + { "dcu", 0x3fff0000, 64 * KiB }, | ||
287 | + { "hstmr", 0x01c60000, 4 * KiB }, | ||
288 | + { "brom", 0xffff0000, 36 * KiB } | ||
289 | +}; | ||
290 | + | ||
291 | +/* Per Processor Interrupts */ | ||
292 | +enum { | ||
293 | + AW_R40_GIC_PPI_MAINT = 9, | ||
294 | + AW_R40_GIC_PPI_HYPTIMER = 10, | ||
295 | + AW_R40_GIC_PPI_VIRTTIMER = 11, | ||
296 | + AW_R40_GIC_PPI_SECTIMER = 13, | ||
297 | + AW_R40_GIC_PPI_PHYSTIMER = 14 | ||
298 | +}; | ||
299 | + | ||
300 | +/* Shared Processor Interrupts */ | ||
301 | +enum { | ||
302 | + AW_R40_GIC_SPI_UART0 = 1, | ||
303 | + AW_R40_GIC_SPI_TIMER0 = 22, | ||
304 | + AW_R40_GIC_SPI_TIMER1 = 23, | ||
305 | + AW_R40_GIC_SPI_MMC0 = 32, | ||
306 | + AW_R40_GIC_SPI_MMC1 = 33, | ||
307 | + AW_R40_GIC_SPI_MMC2 = 34, | ||
308 | + AW_R40_GIC_SPI_MMC3 = 35, | ||
309 | +}; | ||
310 | + | ||
311 | +/* Allwinner R40 general constants */ | ||
312 | +enum { | ||
313 | + AW_R40_GIC_NUM_SPI = 128 | ||
314 | +}; | ||
315 | + | ||
316 | +#define BOOT0_MAGIC "eGON.BT0" | ||
317 | + | ||
318 | +/* The low 8-bits of the 'boot_media' field in the SPL header */ | ||
319 | +#define SUNXI_BOOTED_FROM_MMC0 0 | ||
320 | +#define SUNXI_BOOTED_FROM_NAND 1 | ||
321 | +#define SUNXI_BOOTED_FROM_MMC2 2 | ||
322 | +#define SUNXI_BOOTED_FROM_SPI 3 | ||
323 | + | ||
324 | +struct boot_file_head { | ||
325 | + uint32_t b_instruction; | ||
326 | + uint8_t magic[8]; | ||
327 | + uint32_t check_sum; | ||
328 | + uint32_t length; | ||
329 | + uint32_t pub_head_size; | ||
330 | + uint32_t fel_script_address; | ||
331 | + uint32_t fel_uEnv_length; | ||
332 | + uint32_t dt_name_offset; | ||
333 | + uint32_t dram_size; | ||
334 | + uint32_t boot_media; | ||
335 | + uint32_t string_pool[13]; | ||
336 | +}; | ||
337 | + | ||
338 | +bool allwinner_r40_bootrom_setup(AwR40State *s, BlockBackend *blk, int unit) | ||
26 | +{ | 339 | +{ |
27 | + return s->svl; | 340 | + const int64_t rom_size = 32 * KiB; |
28 | +} | 341 | + g_autofree uint8_t *buffer = g_new0(uint8_t, rom_size); |
29 | + | 342 | + struct boot_file_head *head = (struct boot_file_head *)buffer; |
30 | /* | 343 | + |
31 | * Return the offset info CPUARMState of the predicate vector register Pn. | 344 | + if (blk_pread(blk, 8 * KiB, rom_size, buffer, 0) < 0) { |
32 | * Note for this purpose, FFR is P16. | 345 | + error_setg(&error_fatal, "%s: failed to read BlockBackend data", |
33 | @@ -XXX,XX +XXX,XX @@ static inline int pred_full_reg_size(DisasContext *s) | 346 | + __func__); |
34 | return s->vl >> 3; | ||
35 | } | ||
36 | |||
37 | +/* Return the byte size of the predicate register, SVL / 64. */ | ||
38 | +static inline int streaming_pred_reg_size(DisasContext *s) | ||
39 | +{ | ||
40 | + return s->svl >> 3; | ||
41 | +} | ||
42 | + | ||
43 | /* | ||
44 | * Round up the size of a register to a size allowed by | ||
45 | * the tcg vector infrastructure. Any operation which uses this | ||
46 | diff --git a/target/arm/sve.decode b/target/arm/sve.decode | ||
47 | index XXXXXXX..XXXXXXX 100644 | ||
48 | --- a/target/arm/sve.decode | ||
49 | +++ b/target/arm/sve.decode | ||
50 | @@ -XXX,XX +XXX,XX @@ INDEX_ri 00000100 esz:2 1 imm:s5 010001 rn:5 rd:5 | ||
51 | # SVE index generation (register start, register increment) | ||
52 | INDEX_rr 00000100 .. 1 ..... 010011 ..... ..... @rd_rn_rm | ||
53 | |||
54 | -### SVE Stack Allocation Group | ||
55 | +### SVE / Streaming SVE Stack Allocation Group | ||
56 | |||
57 | # SVE stack frame adjustment | ||
58 | ADDVL 00000100 001 ..... 01010 ...... ..... @rd_rn_i6 | ||
59 | +ADDSVL 00000100 001 ..... 01011 ...... ..... @rd_rn_i6 | ||
60 | ADDPL 00000100 011 ..... 01010 ...... ..... @rd_rn_i6 | ||
61 | +ADDSPL 00000100 011 ..... 01011 ...... ..... @rd_rn_i6 | ||
62 | |||
63 | # SVE stack frame size | ||
64 | RDVL 00000100 101 11111 01010 imm:s6 rd:5 | ||
65 | +RDSVL 00000100 101 11111 01011 imm:s6 rd:5 | ||
66 | |||
67 | ### SVE Bitwise Shift - Unpredicated Group | ||
68 | |||
69 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | ||
70 | index XXXXXXX..XXXXXXX 100644 | ||
71 | --- a/target/arm/translate-sve.c | ||
72 | +++ b/target/arm/translate-sve.c | ||
73 | @@ -XXX,XX +XXX,XX @@ static bool trans_ADDVL(DisasContext *s, arg_ADDVL *a) | ||
74 | return true; | ||
75 | } | ||
76 | |||
77 | +static bool trans_ADDSVL(DisasContext *s, arg_ADDSVL *a) | ||
78 | +{ | ||
79 | + if (!dc_isar_feature(aa64_sme, s)) { | ||
80 | + return false; | 347 | + return false; |
81 | + } | 348 | + } |
82 | + if (sme_enabled_check(s)) { | 349 | + |
83 | + TCGv_i64 rd = cpu_reg_sp(s, a->rd); | 350 | + /* we only check the magic string here. */ |
84 | + TCGv_i64 rn = cpu_reg_sp(s, a->rn); | 351 | + if (memcmp(head->magic, BOOT0_MAGIC, sizeof(head->magic))) { |
85 | + tcg_gen_addi_i64(rd, rn, a->imm * streaming_vec_reg_size(s)); | 352 | + return false; |
86 | + } | 353 | + } |
354 | + | ||
355 | + /* | ||
356 | + * Simulate the behavior of the bootROM, it will change the boot_media | ||
357 | + * flag to indicate where the chip is booting from. R40 can boot from | ||
358 | + * mmc0 or mmc2, the default value of boot_media is zero | ||
359 | + * (SUNXI_BOOTED_FROM_MMC0), let's fix this flag when it is booting from | ||
360 | + * the others. | ||
361 | + */ | ||
362 | + if (unit == 2) { | ||
363 | + head->boot_media = cpu_to_le32(SUNXI_BOOTED_FROM_MMC2); | ||
364 | + } else { | ||
365 | + head->boot_media = cpu_to_le32(SUNXI_BOOTED_FROM_MMC0); | ||
366 | + } | ||
367 | + | ||
368 | + rom_add_blob("allwinner-r40.bootrom", buffer, rom_size, | ||
369 | + rom_size, s->memmap[AW_R40_DEV_SRAM_A1], | ||
370 | + NULL, NULL, NULL, NULL, false); | ||
87 | + return true; | 371 | + return true; |
88 | +} | 372 | +} |
89 | + | 373 | + |
90 | static bool trans_ADDPL(DisasContext *s, arg_ADDPL *a) | 374 | +static void allwinner_r40_init(Object *obj) |
91 | { | ||
92 | if (!dc_isar_feature(aa64_sve, s)) { | ||
93 | @@ -XXX,XX +XXX,XX @@ static bool trans_ADDPL(DisasContext *s, arg_ADDPL *a) | ||
94 | return true; | ||
95 | } | ||
96 | |||
97 | +static bool trans_ADDSPL(DisasContext *s, arg_ADDSPL *a) | ||
98 | +{ | 375 | +{ |
99 | + if (!dc_isar_feature(aa64_sme, s)) { | 376 | + static const char *mmc_names[AW_R40_NUM_MMCS] = { |
100 | + return false; | 377 | + "mmc0", "mmc1", "mmc2", "mmc3" |
101 | + } | 378 | + }; |
102 | + if (sme_enabled_check(s)) { | 379 | + AwR40State *s = AW_R40(obj); |
103 | + TCGv_i64 rd = cpu_reg_sp(s, a->rd); | 380 | + |
104 | + TCGv_i64 rn = cpu_reg_sp(s, a->rn); | 381 | + s->memmap = allwinner_r40_memmap; |
105 | + tcg_gen_addi_i64(rd, rn, a->imm * streaming_pred_reg_size(s)); | 382 | + |
106 | + } | 383 | + for (int i = 0; i < AW_R40_NUM_CPUS; i++) { |
107 | + return true; | 384 | + object_initialize_child(obj, "cpu[*]", &s->cpus[i], |
385 | + ARM_CPU_TYPE_NAME("cortex-a7")); | ||
386 | + } | ||
387 | + | ||
388 | + object_initialize_child(obj, "gic", &s->gic, TYPE_ARM_GIC); | ||
389 | + | ||
390 | + object_initialize_child(obj, "timer", &s->timer, TYPE_AW_A10_PIT); | ||
391 | + object_property_add_alias(obj, "clk0-freq", OBJECT(&s->timer), | ||
392 | + "clk0-freq"); | ||
393 | + object_property_add_alias(obj, "clk1-freq", OBJECT(&s->timer), | ||
394 | + "clk1-freq"); | ||
395 | + | ||
396 | + for (int i = 0; i < AW_R40_NUM_MMCS; i++) { | ||
397 | + object_initialize_child(obj, mmc_names[i], &s->mmc[i], | ||
398 | + TYPE_AW_SDHOST_SUN5I); | ||
399 | + } | ||
108 | +} | 400 | +} |
109 | + | 401 | + |
110 | static bool trans_RDVL(DisasContext *s, arg_RDVL *a) | 402 | +static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
111 | { | ||
112 | if (!dc_isar_feature(aa64_sve, s)) { | ||
113 | @@ -XXX,XX +XXX,XX @@ static bool trans_RDVL(DisasContext *s, arg_RDVL *a) | ||
114 | return true; | ||
115 | } | ||
116 | |||
117 | +static bool trans_RDSVL(DisasContext *s, arg_RDSVL *a) | ||
118 | +{ | 403 | +{ |
119 | + if (!dc_isar_feature(aa64_sme, s)) { | 404 | + AwR40State *s = AW_R40(dev); |
120 | + return false; | 405 | + unsigned i; |
121 | + } | 406 | + |
122 | + if (sme_enabled_check(s)) { | 407 | + /* CPUs */ |
123 | + TCGv_i64 reg = cpu_reg(s, a->rd); | 408 | + for (i = 0; i < AW_R40_NUM_CPUS; i++) { |
124 | + tcg_gen_movi_i64(reg, a->imm * streaming_vec_reg_size(s)); | 409 | + |
125 | + } | 410 | + /* |
126 | + return true; | 411 | + * Disable secondary CPUs. Guest EL3 firmware will start |
412 | + * them via CPU reset control registers. | ||
413 | + */ | ||
414 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "start-powered-off", | ||
415 | + i > 0); | ||
416 | + | ||
417 | + /* All exception levels required */ | ||
418 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "has_el3", true); | ||
419 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "has_el2", true); | ||
420 | + | ||
421 | + /* Mark realized */ | ||
422 | + qdev_realize(DEVICE(&s->cpus[i]), NULL, &error_fatal); | ||
423 | + } | ||
424 | + | ||
425 | + /* Generic Interrupt Controller */ | ||
426 | + qdev_prop_set_uint32(DEVICE(&s->gic), "num-irq", AW_R40_GIC_NUM_SPI + | ||
427 | + GIC_INTERNAL); | ||
428 | + qdev_prop_set_uint32(DEVICE(&s->gic), "revision", 2); | ||
429 | + qdev_prop_set_uint32(DEVICE(&s->gic), "num-cpu", AW_R40_NUM_CPUS); | ||
430 | + qdev_prop_set_bit(DEVICE(&s->gic), "has-security-extensions", false); | ||
431 | + qdev_prop_set_bit(DEVICE(&s->gic), "has-virtualization-extensions", true); | ||
432 | + sysbus_realize(SYS_BUS_DEVICE(&s->gic), &error_fatal); | ||
433 | + | ||
434 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 0, s->memmap[AW_R40_DEV_GIC_DIST]); | ||
435 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 1, s->memmap[AW_R40_DEV_GIC_CPU]); | ||
436 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 2, s->memmap[AW_R40_DEV_GIC_HYP]); | ||
437 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 3, s->memmap[AW_R40_DEV_GIC_VCPU]); | ||
438 | + | ||
439 | + /* | ||
440 | + * Wire the outputs from each CPU's generic timer and the GICv2 | ||
441 | + * maintenance interrupt signal to the appropriate GIC PPI inputs, | ||
442 | + * and the GIC's IRQ/FIQ/VIRQ/VFIQ interrupt outputs to the CPU's inputs. | ||
443 | + */ | ||
444 | + for (i = 0; i < AW_R40_NUM_CPUS; i++) { | ||
445 | + DeviceState *cpudev = DEVICE(&s->cpus[i]); | ||
446 | + int ppibase = AW_R40_GIC_NUM_SPI + i * GIC_INTERNAL + GIC_NR_SGIS; | ||
447 | + int irq; | ||
448 | + /* | ||
449 | + * Mapping from the output timer irq lines from the CPU to the | ||
450 | + * GIC PPI inputs used for this board. | ||
451 | + */ | ||
452 | + const int timer_irq[] = { | ||
453 | + [GTIMER_PHYS] = AW_R40_GIC_PPI_PHYSTIMER, | ||
454 | + [GTIMER_VIRT] = AW_R40_GIC_PPI_VIRTTIMER, | ||
455 | + [GTIMER_HYP] = AW_R40_GIC_PPI_HYPTIMER, | ||
456 | + [GTIMER_SEC] = AW_R40_GIC_PPI_SECTIMER, | ||
457 | + }; | ||
458 | + | ||
459 | + /* Connect CPU timer outputs to GIC PPI inputs */ | ||
460 | + for (irq = 0; irq < ARRAY_SIZE(timer_irq); irq++) { | ||
461 | + qdev_connect_gpio_out(cpudev, irq, | ||
462 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
463 | + ppibase + timer_irq[irq])); | ||
464 | + } | ||
465 | + | ||
466 | + /* Connect GIC outputs to CPU interrupt inputs */ | ||
467 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i, | ||
468 | + qdev_get_gpio_in(cpudev, ARM_CPU_IRQ)); | ||
469 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + AW_R40_NUM_CPUS, | ||
470 | + qdev_get_gpio_in(cpudev, ARM_CPU_FIQ)); | ||
471 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (2 * AW_R40_NUM_CPUS), | ||
472 | + qdev_get_gpio_in(cpudev, ARM_CPU_VIRQ)); | ||
473 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (3 * AW_R40_NUM_CPUS), | ||
474 | + qdev_get_gpio_in(cpudev, ARM_CPU_VFIQ)); | ||
475 | + | ||
476 | + /* GIC maintenance signal */ | ||
477 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (4 * AW_R40_NUM_CPUS), | ||
478 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
479 | + ppibase + AW_R40_GIC_PPI_MAINT)); | ||
480 | + } | ||
481 | + | ||
482 | + /* Timer */ | ||
483 | + sysbus_realize(SYS_BUS_DEVICE(&s->timer), &error_fatal); | ||
484 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->timer), 0, s->memmap[AW_R40_DEV_PIT]); | ||
485 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer), 0, | ||
486 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
487 | + AW_R40_GIC_SPI_TIMER0)); | ||
488 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer), 1, | ||
489 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
490 | + AW_R40_GIC_SPI_TIMER1)); | ||
491 | + | ||
492 | + /* SRAM */ | ||
493 | + memory_region_init_ram(&s->sram_a1, OBJECT(dev), "sram A1", | ||
494 | + 16 * KiB, &error_abort); | ||
495 | + memory_region_init_ram(&s->sram_a2, OBJECT(dev), "sram A2", | ||
496 | + 16 * KiB, &error_abort); | ||
497 | + memory_region_init_ram(&s->sram_a3, OBJECT(dev), "sram A3", | ||
498 | + 13 * KiB, &error_abort); | ||
499 | + memory_region_init_ram(&s->sram_a4, OBJECT(dev), "sram A4", | ||
500 | + 3 * KiB, &error_abort); | ||
501 | + memory_region_add_subregion(get_system_memory(), | ||
502 | + s->memmap[AW_R40_DEV_SRAM_A1], &s->sram_a1); | ||
503 | + memory_region_add_subregion(get_system_memory(), | ||
504 | + s->memmap[AW_R40_DEV_SRAM_A2], &s->sram_a2); | ||
505 | + memory_region_add_subregion(get_system_memory(), | ||
506 | + s->memmap[AW_R40_DEV_SRAM_A3], &s->sram_a3); | ||
507 | + memory_region_add_subregion(get_system_memory(), | ||
508 | + s->memmap[AW_R40_DEV_SRAM_A4], &s->sram_a4); | ||
509 | + | ||
510 | + /* SD/MMC */ | ||
511 | + for (int i = 0; i < AW_R40_NUM_MMCS; i++) { | ||
512 | + qemu_irq irq = qdev_get_gpio_in(DEVICE(&s->gic), | ||
513 | + AW_R40_GIC_SPI_MMC0 + i); | ||
514 | + const hwaddr addr = s->memmap[AW_R40_DEV_MMC0 + i]; | ||
515 | + | ||
516 | + object_property_set_link(OBJECT(&s->mmc[i]), "dma-memory", | ||
517 | + OBJECT(get_system_memory()), &error_fatal); | ||
518 | + sysbus_realize(SYS_BUS_DEVICE(&s->mmc[i]), &error_fatal); | ||
519 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->mmc[i]), 0, addr); | ||
520 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->mmc[i]), 0, irq); | ||
521 | + } | ||
522 | + | ||
523 | + /* UART0. For future clocktree API: All UARTS are connected to APB2_CLK. */ | ||
524 | + serial_mm_init(get_system_memory(), s->memmap[AW_R40_DEV_UART0], 2, | ||
525 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_UART0), | ||
526 | + 115200, serial_hd(0), DEVICE_NATIVE_ENDIAN); | ||
527 | + | ||
528 | + /* Unimplemented devices */ | ||
529 | + for (i = 0; i < ARRAY_SIZE(r40_unimplemented); i++) { | ||
530 | + create_unimplemented_device(r40_unimplemented[i].device_name, | ||
531 | + r40_unimplemented[i].base, | ||
532 | + r40_unimplemented[i].size); | ||
533 | + } | ||
127 | +} | 534 | +} |
128 | + | 535 | + |
129 | /* | 536 | +static void allwinner_r40_class_init(ObjectClass *oc, void *data) |
130 | *** SVE Compute Vector Address Group | 537 | +{ |
131 | */ | 538 | + DeviceClass *dc = DEVICE_CLASS(oc); |
539 | + | ||
540 | + dc->realize = allwinner_r40_realize; | ||
541 | + /* Reason: uses serial_hd() in realize function */ | ||
542 | + dc->user_creatable = false; | ||
543 | +} | ||
544 | + | ||
545 | +static const TypeInfo allwinner_r40_type_info = { | ||
546 | + .name = TYPE_AW_R40, | ||
547 | + .parent = TYPE_DEVICE, | ||
548 | + .instance_size = sizeof(AwR40State), | ||
549 | + .instance_init = allwinner_r40_init, | ||
550 | + .class_init = allwinner_r40_class_init, | ||
551 | +}; | ||
552 | + | ||
553 | +static void allwinner_r40_register_types(void) | ||
554 | +{ | ||
555 | + type_register_static(&allwinner_r40_type_info); | ||
556 | +} | ||
557 | + | ||
558 | +type_init(allwinner_r40_register_types) | ||
559 | diff --git a/hw/arm/bananapi_m2u.c b/hw/arm/bananapi_m2u.c | ||
560 | new file mode 100644 | ||
561 | index XXXXXXX..XXXXXXX | ||
562 | --- /dev/null | ||
563 | +++ b/hw/arm/bananapi_m2u.c | ||
564 | @@ -XXX,XX +XXX,XX @@ | ||
565 | +/* | ||
566 | + * Bananapi M2U emulation | ||
567 | + * | ||
568 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> | ||
569 | + * | ||
570 | + * This program is free software: you can redistribute it and/or modify | ||
571 | + * it under the terms of the GNU General Public License as published by | ||
572 | + * the Free Software Foundation, either version 2 of the License, or | ||
573 | + * (at your option) any later version. | ||
574 | + * | ||
575 | + * This program is distributed in the hope that it will be useful, | ||
576 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
577 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
578 | + * GNU General Public License for more details. | ||
579 | + * | ||
580 | + * You should have received a copy of the GNU General Public License | ||
581 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
582 | + */ | ||
583 | + | ||
584 | +#include "qemu/osdep.h" | ||
585 | +#include "qemu/units.h" | ||
586 | +#include "exec/address-spaces.h" | ||
587 | +#include "qapi/error.h" | ||
588 | +#include "qemu/error-report.h" | ||
589 | +#include "hw/boards.h" | ||
590 | +#include "hw/qdev-properties.h" | ||
591 | +#include "hw/arm/allwinner-r40.h" | ||
592 | + | ||
593 | +static struct arm_boot_info bpim2u_binfo; | ||
594 | + | ||
595 | +/* | ||
596 | + * R40 can boot from mmc0 and mmc2, and bpim2u has two mmc interface, one is | ||
597 | + * connected to sdcard and another mount an emmc media. | ||
598 | + * Attach the mmc driver and try loading bootloader. | ||
599 | + */ | ||
600 | +static void mmc_attach_drive(AwR40State *s, AwSdHostState *mmc, int unit, | ||
601 | + bool load_bootroom, bool *bootroom_loaded) | ||
602 | +{ | ||
603 | + DriveInfo *di = drive_get(IF_SD, 0, unit); | ||
604 | + BlockBackend *blk = di ? blk_by_legacy_dinfo(di) : NULL; | ||
605 | + BusState *bus; | ||
606 | + DeviceState *carddev; | ||
607 | + | ||
608 | + bus = qdev_get_child_bus(DEVICE(mmc), "sd-bus"); | ||
609 | + if (bus == NULL) { | ||
610 | + error_report("No SD bus found in SOC object"); | ||
611 | + exit(1); | ||
612 | + } | ||
613 | + | ||
614 | + carddev = qdev_new(TYPE_SD_CARD); | ||
615 | + qdev_prop_set_drive_err(carddev, "drive", blk, &error_fatal); | ||
616 | + qdev_realize_and_unref(carddev, bus, &error_fatal); | ||
617 | + | ||
618 | + if (load_bootroom && blk && blk_is_available(blk)) { | ||
619 | + /* Use Boot ROM to copy data from SD card to SRAM */ | ||
620 | + *bootroom_loaded = allwinner_r40_bootrom_setup(s, blk, unit); | ||
621 | + } | ||
622 | +} | ||
623 | + | ||
624 | +static void bpim2u_init(MachineState *machine) | ||
625 | +{ | ||
626 | + bool bootroom_loaded = false; | ||
627 | + AwR40State *r40; | ||
628 | + | ||
629 | + /* BIOS is not supported by this board */ | ||
630 | + if (machine->firmware) { | ||
631 | + error_report("BIOS not supported for this machine"); | ||
632 | + exit(1); | ||
633 | + } | ||
634 | + | ||
635 | + /* Only allow Cortex-A7 for this board */ | ||
636 | + if (strcmp(machine->cpu_type, ARM_CPU_TYPE_NAME("cortex-a7")) != 0) { | ||
637 | + error_report("This board can only be used with cortex-a7 CPU"); | ||
638 | + exit(1); | ||
639 | + } | ||
640 | + | ||
641 | + r40 = AW_R40(object_new(TYPE_AW_R40)); | ||
642 | + object_property_add_child(OBJECT(machine), "soc", OBJECT(r40)); | ||
643 | + object_unref(OBJECT(r40)); | ||
644 | + | ||
645 | + /* Setup timer properties */ | ||
646 | + object_property_set_int(OBJECT(r40), "clk0-freq", 32768, &error_abort); | ||
647 | + object_property_set_int(OBJECT(r40), "clk1-freq", 24 * 1000 * 1000, | ||
648 | + &error_abort); | ||
649 | + | ||
650 | + /* Mark R40 object realized */ | ||
651 | + qdev_realize(DEVICE(r40), NULL, &error_abort); | ||
652 | + | ||
653 | + /* | ||
654 | + * Plug in SD card and try load bootrom, R40 has 4 mmc controllers but can | ||
655 | + * only booting from mmc0 and mmc2. | ||
656 | + */ | ||
657 | + for (int i = 0; i < AW_R40_NUM_MMCS; i++) { | ||
658 | + switch (i) { | ||
659 | + case 0: | ||
660 | + case 2: | ||
661 | + mmc_attach_drive(r40, &r40->mmc[i], i, | ||
662 | + !machine->kernel_filename && !bootroom_loaded, | ||
663 | + &bootroom_loaded); | ||
664 | + break; | ||
665 | + default: | ||
666 | + mmc_attach_drive(r40, &r40->mmc[i], i, false, NULL); | ||
667 | + break; | ||
668 | + } | ||
669 | + } | ||
670 | + | ||
671 | + /* SDRAM */ | ||
672 | + memory_region_add_subregion(get_system_memory(), | ||
673 | + r40->memmap[AW_R40_DEV_SDRAM], machine->ram); | ||
674 | + | ||
675 | + bpim2u_binfo.loader_start = r40->memmap[AW_R40_DEV_SDRAM]; | ||
676 | + bpim2u_binfo.ram_size = machine->ram_size; | ||
677 | + bpim2u_binfo.psci_conduit = QEMU_PSCI_CONDUIT_SMC; | ||
678 | + arm_load_kernel(ARM_CPU(first_cpu), machine, &bpim2u_binfo); | ||
679 | +} | ||
680 | + | ||
681 | +static void bpim2u_machine_init(MachineClass *mc) | ||
682 | +{ | ||
683 | + mc->desc = "Bananapi M2U (Cortex-A7)"; | ||
684 | + mc->init = bpim2u_init; | ||
685 | + mc->min_cpus = AW_R40_NUM_CPUS; | ||
686 | + mc->max_cpus = AW_R40_NUM_CPUS; | ||
687 | + mc->default_cpus = AW_R40_NUM_CPUS; | ||
688 | + mc->default_cpu_type = ARM_CPU_TYPE_NAME("cortex-a7"); | ||
689 | + mc->default_ram_size = 1 * GiB; | ||
690 | + mc->default_ram_id = "bpim2u.ram"; | ||
691 | +} | ||
692 | + | ||
693 | +DEFINE_MACHINE("bpim2u", bpim2u_machine_init) | ||
694 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
695 | index XXXXXXX..XXXXXXX 100644 | ||
696 | --- a/hw/arm/Kconfig | ||
697 | +++ b/hw/arm/Kconfig | ||
698 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_H3 | ||
699 | select USB_EHCI_SYSBUS | ||
700 | select SD | ||
701 | |||
702 | +config ALLWINNER_R40 | ||
703 | + bool | ||
704 | + default y if TCG && ARM | ||
705 | + select ALLWINNER_A10_PIT | ||
706 | + select SERIAL | ||
707 | + select ARM_TIMER | ||
708 | + select ARM_GIC | ||
709 | + select UNIMP | ||
710 | + select SD | ||
711 | + | ||
712 | config RASPI | ||
713 | bool | ||
714 | default y | ||
715 | diff --git a/hw/arm/meson.build b/hw/arm/meson.build | ||
716 | index XXXXXXX..XXXXXXX 100644 | ||
717 | --- a/hw/arm/meson.build | ||
718 | +++ b/hw/arm/meson.build | ||
719 | @@ -XXX,XX +XXX,XX @@ arm_ss.add(when: 'CONFIG_OMAP', if_true: files('omap1.c', 'omap2.c')) | ||
720 | arm_ss.add(when: 'CONFIG_STRONGARM', if_true: files('strongarm.c')) | ||
721 | arm_ss.add(when: 'CONFIG_ALLWINNER_A10', if_true: files('allwinner-a10.c', 'cubieboard.c')) | ||
722 | arm_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3.c', 'orangepi.c')) | ||
723 | +arm_ss.add(when: 'CONFIG_ALLWINNER_R40', if_true: files('allwinner-r40.c', 'bananapi_m2u.c')) | ||
724 | arm_ss.add(when: 'CONFIG_RASPI', if_true: files('bcm2836.c', 'raspi.c')) | ||
725 | arm_ss.add(when: 'CONFIG_STM32F100_SOC', if_true: files('stm32f100_soc.c')) | ||
726 | arm_ss.add(when: 'CONFIG_STM32F205_SOC', if_true: files('stm32f205_soc.c')) | ||
132 | -- | 727 | -- |
133 | 2.25.1 | 728 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | This is an SVE instruction that operates using the SVE vector | 3 | The CCU provides the registers to program the PLLs and the controls |
4 | length but that it is present only if SME is implemented. | 4 | most of the clock generation, division, distribution, synchronization |
5 | and gating. | ||
5 | 6 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | This commit adds support for the Clock Control Unit which emulates |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | a simple read/write register interface. |
8 | Message-id: 20220708151540.18136-29-richard.henderson@linaro.org | 9 | |
10 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> | ||
11 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 13 | --- |
11 | target/arm/sve.decode | 20 +++++++++++++ | 14 | include/hw/arm/allwinner-r40.h | 2 + |
12 | target/arm/translate-sve.c | 57 ++++++++++++++++++++++++++++++++++++++ | 15 | include/hw/misc/allwinner-r40-ccu.h | 65 +++++++++ |
13 | 2 files changed, 77 insertions(+) | 16 | hw/arm/allwinner-r40.c | 8 +- |
17 | hw/misc/allwinner-r40-ccu.c | 209 ++++++++++++++++++++++++++++ | ||
18 | hw/misc/meson.build | 1 + | ||
19 | 5 files changed, 284 insertions(+), 1 deletion(-) | ||
20 | create mode 100644 include/hw/misc/allwinner-r40-ccu.h | ||
21 | create mode 100644 hw/misc/allwinner-r40-ccu.c | ||
14 | 22 | ||
15 | diff --git a/target/arm/sve.decode b/target/arm/sve.decode | 23 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
16 | index XXXXXXX..XXXXXXX 100644 | 24 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sve.decode | 25 | --- a/include/hw/arm/allwinner-r40.h |
18 | +++ b/target/arm/sve.decode | 26 | +++ b/include/hw/arm/allwinner-r40.h |
19 | @@ -XXX,XX +XXX,XX @@ BFMLALT_zzxw 01100100 11 1 ..... 0100.1 ..... ..... @rrxr_3a esz=2 | 27 | @@ -XXX,XX +XXX,XX @@ |
20 | 28 | #include "hw/timer/allwinner-a10-pit.h" | |
21 | ### SVE2 floating-point bfloat16 dot-product (indexed) | 29 | #include "hw/intc/arm_gic.h" |
22 | BFDOT_zzxz 01100100 01 1 ..... 010000 ..... ..... @rrxr_2 esz=2 | 30 | #include "hw/sd/allwinner-sdhost.h" |
23 | + | 31 | +#include "hw/misc/allwinner-r40-ccu.h" |
24 | +### SVE broadcast predicate element | 32 | #include "target/arm/cpu.h" |
25 | + | 33 | #include "sysemu/block-backend.h" |
26 | +&psel esz pd pn pm rv imm | 34 | |
27 | +%psel_rv 16:2 !function=plus_12 | 35 | @@ -XXX,XX +XXX,XX @@ struct AwR40State { |
28 | +%psel_imm_b 22:2 19:2 | 36 | const hwaddr *memmap; |
29 | +%psel_imm_h 22:2 20:1 | 37 | AwA10PITState timer; |
30 | +%psel_imm_s 22:2 | 38 | AwSdHostState mmc[AW_R40_NUM_MMCS]; |
31 | +%psel_imm_d 23:1 | 39 | + AwR40ClockCtlState ccu; |
32 | +@psel ........ .. . ... .. .. pn:4 . pm:4 . pd:4 \ | 40 | GICState gic; |
33 | + &psel rv=%psel_rv | 41 | MemoryRegion sram_a1; |
34 | + | 42 | MemoryRegion sram_a2; |
35 | +PSEL 00100101 .. 1 ..1 .. 01 .... 0 .... 0 .... \ | 43 | diff --git a/include/hw/misc/allwinner-r40-ccu.h b/include/hw/misc/allwinner-r40-ccu.h |
36 | + @psel esz=0 imm=%psel_imm_b | 44 | new file mode 100644 |
37 | +PSEL 00100101 .. 1 .10 .. 01 .... 0 .... 0 .... \ | 45 | index XXXXXXX..XXXXXXX |
38 | + @psel esz=1 imm=%psel_imm_h | 46 | --- /dev/null |
39 | +PSEL 00100101 .. 1 100 .. 01 .... 0 .... 0 .... \ | 47 | +++ b/include/hw/misc/allwinner-r40-ccu.h |
40 | + @psel esz=2 imm=%psel_imm_s | 48 | @@ -XXX,XX +XXX,XX @@ |
41 | +PSEL 00100101 .1 1 000 .. 01 .... 0 .... 0 .... \ | 49 | +/* |
42 | + @psel esz=3 imm=%psel_imm_d | 50 | + * Allwinner R40 Clock Control Unit emulation |
43 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 51 | + * |
52 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> | ||
53 | + * | ||
54 | + * This program is free software: you can redistribute it and/or modify | ||
55 | + * it under the terms of the GNU General Public License as published by | ||
56 | + * the Free Software Foundation, either version 2 of the License, or | ||
57 | + * (at your option) any later version. | ||
58 | + * | ||
59 | + * This program is distributed in the hope that it will be useful, | ||
60 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
61 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
62 | + * GNU General Public License for more details. | ||
63 | + * | ||
64 | + * You should have received a copy of the GNU General Public License | ||
65 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
66 | + */ | ||
67 | + | ||
68 | +#ifndef HW_MISC_ALLWINNER_R40_CCU_H | ||
69 | +#define HW_MISC_ALLWINNER_R40_CCU_H | ||
70 | + | ||
71 | +#include "qom/object.h" | ||
72 | +#include "hw/sysbus.h" | ||
73 | + | ||
74 | +/** | ||
75 | + * @name Constants | ||
76 | + * @{ | ||
77 | + */ | ||
78 | + | ||
79 | +/** Size of register I/O address space used by CCU device */ | ||
80 | +#define AW_R40_CCU_IOSIZE (0x400) | ||
81 | + | ||
82 | +/** Total number of known registers */ | ||
83 | +#define AW_R40_CCU_REGS_NUM (AW_R40_CCU_IOSIZE / sizeof(uint32_t)) | ||
84 | + | ||
85 | +/** @} */ | ||
86 | + | ||
87 | +/** | ||
88 | + * @name Object model | ||
89 | + * @{ | ||
90 | + */ | ||
91 | + | ||
92 | +#define TYPE_AW_R40_CCU "allwinner-r40-ccu" | ||
93 | +OBJECT_DECLARE_SIMPLE_TYPE(AwR40ClockCtlState, AW_R40_CCU) | ||
94 | + | ||
95 | +/** @} */ | ||
96 | + | ||
97 | +/** | ||
98 | + * Allwinner R40 CCU object instance state. | ||
99 | + */ | ||
100 | +struct AwR40ClockCtlState { | ||
101 | + /*< private >*/ | ||
102 | + SysBusDevice parent_obj; | ||
103 | + /*< public >*/ | ||
104 | + | ||
105 | + /** Maps I/O registers in physical memory */ | ||
106 | + MemoryRegion iomem; | ||
107 | + | ||
108 | + /** Array of hardware registers */ | ||
109 | + uint32_t regs[AW_R40_CCU_REGS_NUM]; | ||
110 | + | ||
111 | +}; | ||
112 | + | ||
113 | +#endif /* HW_MISC_ALLWINNER_R40_CCU_H */ | ||
114 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
44 | index XXXXXXX..XXXXXXX 100644 | 115 | index XXXXXXX..XXXXXXX 100644 |
45 | --- a/target/arm/translate-sve.c | 116 | --- a/hw/arm/allwinner-r40.c |
46 | +++ b/target/arm/translate-sve.c | 117 | +++ b/hw/arm/allwinner-r40.c |
47 | @@ -XXX,XX +XXX,XX @@ static bool do_BFMLAL_zzxw(DisasContext *s, arg_rrxr_esz *a, bool sel) | 118 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { |
48 | 119 | [AW_R40_DEV_MMC1] = 0x01c10000, | |
49 | TRANS_FEAT(BFMLALB_zzxw, aa64_sve_bf16, do_BFMLAL_zzxw, a, false) | 120 | [AW_R40_DEV_MMC2] = 0x01c11000, |
50 | TRANS_FEAT(BFMLALT_zzxw, aa64_sve_bf16, do_BFMLAL_zzxw, a, true) | 121 | [AW_R40_DEV_MMC3] = 0x01c12000, |
51 | + | 122 | + [AW_R40_DEV_CCU] = 0x01c20000, |
52 | +static bool trans_PSEL(DisasContext *s, arg_psel *a) | 123 | [AW_R40_DEV_PIT] = 0x01c20c00, |
53 | +{ | 124 | [AW_R40_DEV_UART0] = 0x01c28000, |
54 | + int vl = vec_full_reg_size(s); | 125 | [AW_R40_DEV_GIC_DIST] = 0x01c81000, |
55 | + int pl = pred_gvec_reg_size(s); | 126 | @@ -XXX,XX +XXX,XX @@ static struct AwR40Unimplemented r40_unimplemented[] = { |
56 | + int elements = vl >> a->esz; | 127 | { "usb2-host", 0x01c1c000, 4 * KiB }, |
57 | + TCGv_i64 tmp, didx, dbit; | 128 | { "cs1", 0x01c1d000, 4 * KiB }, |
58 | + TCGv_ptr ptr; | 129 | { "spi3", 0x01c1f000, 4 * KiB }, |
59 | + | 130 | - { "ccu", 0x01c20000, 1 * KiB }, |
60 | + if (!dc_isar_feature(aa64_sme, s)) { | 131 | { "rtc", 0x01c20400, 1 * KiB }, |
61 | + return false; | 132 | { "pio", 0x01c20800, 1 * KiB }, |
133 | { "owa", 0x01c21000, 1 * KiB }, | ||
134 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) | ||
135 | object_property_add_alias(obj, "clk1-freq", OBJECT(&s->timer), | ||
136 | "clk1-freq"); | ||
137 | |||
138 | + object_initialize_child(obj, "ccu", &s->ccu, TYPE_AW_R40_CCU); | ||
139 | + | ||
140 | for (int i = 0; i < AW_R40_NUM_MMCS; i++) { | ||
141 | object_initialize_child(obj, mmc_names[i], &s->mmc[i], | ||
142 | TYPE_AW_SDHOST_SUN5I); | ||
143 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) | ||
144 | memory_region_add_subregion(get_system_memory(), | ||
145 | s->memmap[AW_R40_DEV_SRAM_A4], &s->sram_a4); | ||
146 | |||
147 | + /* Clock Control Unit */ | ||
148 | + sysbus_realize(SYS_BUS_DEVICE(&s->ccu), &error_fatal); | ||
149 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->ccu), 0, s->memmap[AW_R40_DEV_CCU]); | ||
150 | + | ||
151 | /* SD/MMC */ | ||
152 | for (int i = 0; i < AW_R40_NUM_MMCS; i++) { | ||
153 | qemu_irq irq = qdev_get_gpio_in(DEVICE(&s->gic), | ||
154 | diff --git a/hw/misc/allwinner-r40-ccu.c b/hw/misc/allwinner-r40-ccu.c | ||
155 | new file mode 100644 | ||
156 | index XXXXXXX..XXXXXXX | ||
157 | --- /dev/null | ||
158 | +++ b/hw/misc/allwinner-r40-ccu.c | ||
159 | @@ -XXX,XX +XXX,XX @@ | ||
160 | +/* | ||
161 | + * Allwinner R40 Clock Control Unit emulation | ||
162 | + * | ||
163 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> | ||
164 | + * | ||
165 | + * This program is free software: you can redistribute it and/or modify | ||
166 | + * it under the terms of the GNU General Public License as published by | ||
167 | + * the Free Software Foundation, either version 2 of the License, or | ||
168 | + * (at your option) any later version. | ||
169 | + * | ||
170 | + * This program is distributed in the hope that it will be useful, | ||
171 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
172 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
173 | + * GNU General Public License for more details. | ||
174 | + * | ||
175 | + * You should have received a copy of the GNU General Public License | ||
176 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
177 | + */ | ||
178 | + | ||
179 | +#include "qemu/osdep.h" | ||
180 | +#include "qemu/units.h" | ||
181 | +#include "hw/sysbus.h" | ||
182 | +#include "migration/vmstate.h" | ||
183 | +#include "qemu/log.h" | ||
184 | +#include "qemu/module.h" | ||
185 | +#include "hw/misc/allwinner-r40-ccu.h" | ||
186 | + | ||
187 | +/* CCU register offsets */ | ||
188 | +enum { | ||
189 | + REG_PLL_CPUX_CTRL = 0x0000, | ||
190 | + REG_PLL_AUDIO_CTRL = 0x0008, | ||
191 | + REG_PLL_VIDEO0_CTRL = 0x0010, | ||
192 | + REG_PLL_VE_CTRL = 0x0018, | ||
193 | + REG_PLL_DDR0_CTRL = 0x0020, | ||
194 | + REG_PLL_PERIPH0_CTRL = 0x0028, | ||
195 | + REG_PLL_PERIPH1_CTRL = 0x002c, | ||
196 | + REG_PLL_VIDEO1_CTRL = 0x0030, | ||
197 | + REG_PLL_SATA_CTRL = 0x0034, | ||
198 | + REG_PLL_GPU_CTRL = 0x0038, | ||
199 | + REG_PLL_MIPI_CTRL = 0x0040, | ||
200 | + REG_PLL_DE_CTRL = 0x0048, | ||
201 | + REG_PLL_DDR1_CTRL = 0x004c, | ||
202 | + REG_AHB1_APB1_CFG = 0x0054, | ||
203 | + REG_APB2_CFG = 0x0058, | ||
204 | + REG_MMC0_CLK = 0x0088, | ||
205 | + REG_MMC1_CLK = 0x008c, | ||
206 | + REG_MMC2_CLK = 0x0090, | ||
207 | + REG_MMC3_CLK = 0x0094, | ||
208 | + REG_USBPHY_CFG = 0x00cc, | ||
209 | + REG_PLL_DDR_AUX = 0x00f0, | ||
210 | + REG_DRAM_CFG = 0x00f4, | ||
211 | + REG_PLL_DDR1_CFG = 0x00f8, | ||
212 | + REG_DRAM_CLK_GATING = 0x0100, | ||
213 | + REG_GMAC_CLK = 0x0164, | ||
214 | + REG_SYS_32K_CLK = 0x0310, | ||
215 | + REG_PLL_LOCK_CTRL = 0x0320, | ||
216 | +}; | ||
217 | + | ||
218 | +#define REG_INDEX(offset) (offset / sizeof(uint32_t)) | ||
219 | + | ||
220 | +/* CCU register flags */ | ||
221 | +enum { | ||
222 | + REG_PLL_ENABLE = (1 << 31), | ||
223 | + REG_PLL_LOCK = (1 << 28), | ||
224 | +}; | ||
225 | + | ||
226 | +static uint64_t allwinner_r40_ccu_read(void *opaque, hwaddr offset, | ||
227 | + unsigned size) | ||
228 | +{ | ||
229 | + const AwR40ClockCtlState *s = AW_R40_CCU(opaque); | ||
230 | + const uint32_t idx = REG_INDEX(offset); | ||
231 | + | ||
232 | + switch (offset) { | ||
233 | + case 0x324 ... AW_R40_CCU_IOSIZE: | ||
234 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
235 | + __func__, (uint32_t)offset); | ||
236 | + return 0; | ||
62 | + } | 237 | + } |
63 | + if (!sve_access_check(s)) { | 238 | + |
64 | + return true; | 239 | + return s->regs[idx]; |
240 | +} | ||
241 | + | ||
242 | +static void allwinner_r40_ccu_write(void *opaque, hwaddr offset, | ||
243 | + uint64_t val, unsigned size) | ||
244 | +{ | ||
245 | + AwR40ClockCtlState *s = AW_R40_CCU(opaque); | ||
246 | + | ||
247 | + switch (offset) { | ||
248 | + case REG_DRAM_CFG: /* DRAM Configuration(for DDR0) */ | ||
249 | + /* bit16: SDRCLK_UPD (SDRCLK configuration 0 update) */ | ||
250 | + val &= ~(1 << 16); | ||
251 | + break; | ||
252 | + case REG_PLL_DDR1_CTRL: /* DDR1 Control register */ | ||
253 | + /* bit30: SDRPLL_UPD */ | ||
254 | + val &= ~(1 << 30); | ||
255 | + if (val & REG_PLL_ENABLE) { | ||
256 | + val |= REG_PLL_LOCK; | ||
257 | + } | ||
258 | + break; | ||
259 | + case REG_PLL_CPUX_CTRL: | ||
260 | + case REG_PLL_AUDIO_CTRL: | ||
261 | + case REG_PLL_VE_CTRL: | ||
262 | + case REG_PLL_VIDEO0_CTRL: | ||
263 | + case REG_PLL_DDR0_CTRL: | ||
264 | + case REG_PLL_PERIPH0_CTRL: | ||
265 | + case REG_PLL_PERIPH1_CTRL: | ||
266 | + case REG_PLL_VIDEO1_CTRL: | ||
267 | + case REG_PLL_SATA_CTRL: | ||
268 | + case REG_PLL_GPU_CTRL: | ||
269 | + case REG_PLL_MIPI_CTRL: | ||
270 | + case REG_PLL_DE_CTRL: | ||
271 | + if (val & REG_PLL_ENABLE) { | ||
272 | + val |= REG_PLL_LOCK; | ||
273 | + } | ||
274 | + break; | ||
275 | + case 0x324 ... AW_R40_CCU_IOSIZE: | ||
276 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
277 | + __func__, (uint32_t)offset); | ||
278 | + break; | ||
279 | + default: | ||
280 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented write offset 0x%04x\n", | ||
281 | + __func__, (uint32_t)offset); | ||
282 | + break; | ||
65 | + } | 283 | + } |
66 | + | 284 | + |
67 | + tmp = tcg_temp_new_i64(); | 285 | + s->regs[REG_INDEX(offset)] = (uint32_t) val; |
68 | + dbit = tcg_temp_new_i64(); | 286 | +} |
69 | + didx = tcg_temp_new_i64(); | 287 | + |
70 | + ptr = tcg_temp_new_ptr(); | 288 | +static const MemoryRegionOps allwinner_r40_ccu_ops = { |
71 | + | 289 | + .read = allwinner_r40_ccu_read, |
72 | + /* Compute the predicate element. */ | 290 | + .write = allwinner_r40_ccu_write, |
73 | + tcg_gen_addi_i64(tmp, cpu_reg(s, a->rv), a->imm); | 291 | + .endianness = DEVICE_NATIVE_ENDIAN, |
74 | + if (is_power_of_2(elements)) { | 292 | + .valid = { |
75 | + tcg_gen_andi_i64(tmp, tmp, elements - 1); | 293 | + .min_access_size = 4, |
76 | + } else { | 294 | + .max_access_size = 4, |
77 | + tcg_gen_remu_i64(tmp, tmp, tcg_constant_i64(elements)); | 295 | + }, |
296 | + .impl.min_access_size = 4, | ||
297 | +}; | ||
298 | + | ||
299 | +static void allwinner_r40_ccu_reset(DeviceState *dev) | ||
300 | +{ | ||
301 | + AwR40ClockCtlState *s = AW_R40_CCU(dev); | ||
302 | + | ||
303 | + memset(s->regs, 0, sizeof(s->regs)); | ||
304 | + | ||
305 | + /* Set default values for registers */ | ||
306 | + s->regs[REG_INDEX(REG_PLL_CPUX_CTRL)] = 0x00001000; | ||
307 | + s->regs[REG_INDEX(REG_PLL_AUDIO_CTRL)] = 0x00035514; | ||
308 | + s->regs[REG_INDEX(REG_PLL_VIDEO0_CTRL)] = 0x03006207; | ||
309 | + s->regs[REG_INDEX(REG_PLL_VE_CTRL)] = 0x03006207; | ||
310 | + s->regs[REG_INDEX(REG_PLL_DDR0_CTRL)] = 0x00001000, | ||
311 | + s->regs[REG_INDEX(REG_PLL_PERIPH0_CTRL)] = 0x00041811; | ||
312 | + s->regs[REG_INDEX(REG_PLL_PERIPH1_CTRL)] = 0x00041811; | ||
313 | + s->regs[REG_INDEX(REG_PLL_VIDEO1_CTRL)] = 0x03006207; | ||
314 | + s->regs[REG_INDEX(REG_PLL_SATA_CTRL)] = 0x00001811; | ||
315 | + s->regs[REG_INDEX(REG_PLL_GPU_CTRL)] = 0x03006207; | ||
316 | + s->regs[REG_INDEX(REG_PLL_MIPI_CTRL)] = 0x00000515; | ||
317 | + s->regs[REG_INDEX(REG_PLL_DE_CTRL)] = 0x03006207; | ||
318 | + s->regs[REG_INDEX(REG_PLL_DDR1_CTRL)] = 0x00001800; | ||
319 | + s->regs[REG_INDEX(REG_AHB1_APB1_CFG)] = 0x00001010; | ||
320 | + s->regs[REG_INDEX(REG_APB2_CFG)] = 0x01000000; | ||
321 | + s->regs[REG_INDEX(REG_PLL_DDR_AUX)] = 0x00000001; | ||
322 | + s->regs[REG_INDEX(REG_PLL_DDR1_CFG)] = 0x0ccca000; | ||
323 | + s->regs[REG_INDEX(REG_SYS_32K_CLK)] = 0x0000000f; | ||
324 | +} | ||
325 | + | ||
326 | +static void allwinner_r40_ccu_init(Object *obj) | ||
327 | +{ | ||
328 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
329 | + AwR40ClockCtlState *s = AW_R40_CCU(obj); | ||
330 | + | ||
331 | + /* Memory mapping */ | ||
332 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_r40_ccu_ops, s, | ||
333 | + TYPE_AW_R40_CCU, AW_R40_CCU_IOSIZE); | ||
334 | + sysbus_init_mmio(sbd, &s->iomem); | ||
335 | +} | ||
336 | + | ||
337 | +static const VMStateDescription allwinner_r40_ccu_vmstate = { | ||
338 | + .name = "allwinner-r40-ccu", | ||
339 | + .version_id = 1, | ||
340 | + .minimum_version_id = 1, | ||
341 | + .fields = (VMStateField[]) { | ||
342 | + VMSTATE_UINT32_ARRAY(regs, AwR40ClockCtlState, AW_R40_CCU_REGS_NUM), | ||
343 | + VMSTATE_END_OF_LIST() | ||
78 | + } | 344 | + } |
79 | + | 345 | +}; |
80 | + /* Extract the predicate byte and bit indices. */ | 346 | + |
81 | + tcg_gen_shli_i64(tmp, tmp, a->esz); | 347 | +static void allwinner_r40_ccu_class_init(ObjectClass *klass, void *data) |
82 | + tcg_gen_andi_i64(dbit, tmp, 7); | 348 | +{ |
83 | + tcg_gen_shri_i64(didx, tmp, 3); | 349 | + DeviceClass *dc = DEVICE_CLASS(klass); |
84 | + if (HOST_BIG_ENDIAN) { | 350 | + |
85 | + tcg_gen_xori_i64(didx, didx, 7); | 351 | + dc->reset = allwinner_r40_ccu_reset; |
86 | + } | 352 | + dc->vmsd = &allwinner_r40_ccu_vmstate; |
87 | + | 353 | +} |
88 | + /* Load the predicate word. */ | 354 | + |
89 | + tcg_gen_trunc_i64_ptr(ptr, didx); | 355 | +static const TypeInfo allwinner_r40_ccu_info = { |
90 | + tcg_gen_add_ptr(ptr, ptr, cpu_env); | 356 | + .name = TYPE_AW_R40_CCU, |
91 | + tcg_gen_ld8u_i64(tmp, ptr, pred_full_reg_offset(s, a->pm)); | 357 | + .parent = TYPE_SYS_BUS_DEVICE, |
92 | + | 358 | + .instance_init = allwinner_r40_ccu_init, |
93 | + /* Extract the predicate bit and replicate to MO_64. */ | 359 | + .instance_size = sizeof(AwR40ClockCtlState), |
94 | + tcg_gen_shr_i64(tmp, tmp, dbit); | 360 | + .class_init = allwinner_r40_ccu_class_init, |
95 | + tcg_gen_andi_i64(tmp, tmp, 1); | 361 | +}; |
96 | + tcg_gen_neg_i64(tmp, tmp); | 362 | + |
97 | + | 363 | +static void allwinner_r40_ccu_register(void) |
98 | + /* Apply to either copy the source, or write zeros. */ | 364 | +{ |
99 | + tcg_gen_gvec_ands(MO_64, pred_full_reg_offset(s, a->pd), | 365 | + type_register_static(&allwinner_r40_ccu_info); |
100 | + pred_full_reg_offset(s, a->pn), tmp, pl, pl); | 366 | +} |
101 | + | 367 | + |
102 | + tcg_temp_free_i64(tmp); | 368 | +type_init(allwinner_r40_ccu_register) |
103 | + tcg_temp_free_i64(dbit); | 369 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build |
104 | + tcg_temp_free_i64(didx); | 370 | index XXXXXXX..XXXXXXX 100644 |
105 | + tcg_temp_free_ptr(ptr); | 371 | --- a/hw/misc/meson.build |
106 | + return true; | 372 | +++ b/hw/misc/meson.build |
107 | +} | 373 | @@ -XXX,XX +XXX,XX @@ specific_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-cpucfg.c' |
374 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-dramc.c')) | ||
375 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-sysctrl.c')) | ||
376 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-sid.c')) | ||
377 | +softmmu_ss.add(when: 'CONFIG_ALLWINNER_R40', if_true: files('allwinner-r40-ccu.c')) | ||
378 | softmmu_ss.add(when: 'CONFIG_AXP209_PMU', if_true: files('axp209.c')) | ||
379 | softmmu_ss.add(when: 'CONFIG_REALVIEW', if_true: files('arm_sysctl.c')) | ||
380 | softmmu_ss.add(when: 'CONFIG_NSERIES', if_true: files('cbus.c')) | ||
108 | -- | 381 | -- |
109 | 2.25.1 | 382 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | Make sure to zero the currently reserved fields. | 3 | R40 has eight UARTs, support both 16450 and 16550 compatible modes. |
4 | 4 | ||
5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 5 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20220708151540.18136-36-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 7 | --- |
10 | linux-user/aarch64/signal.c | 9 ++++++++- | 8 | include/hw/arm/allwinner-r40.h | 8 ++++++++ |
11 | 1 file changed, 8 insertions(+), 1 deletion(-) | 9 | hw/arm/allwinner-r40.c | 34 +++++++++++++++++++++++++++++++--- |
10 | 2 files changed, 39 insertions(+), 3 deletions(-) | ||
12 | 11 | ||
13 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 12 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
14 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/linux-user/aarch64/signal.c | 14 | --- a/include/hw/arm/allwinner-r40.h |
16 | +++ b/linux-user/aarch64/signal.c | 15 | +++ b/include/hw/arm/allwinner-r40.h |
17 | @@ -XXX,XX +XXX,XX @@ struct target_extra_context { | 16 | @@ -XXX,XX +XXX,XX @@ enum { |
18 | struct target_sve_context { | 17 | AW_R40_DEV_CCU, |
19 | struct target_aarch64_ctx head; | 18 | AW_R40_DEV_PIT, |
20 | uint16_t vl; | 19 | AW_R40_DEV_UART0, |
21 | - uint16_t reserved[3]; | 20 | + AW_R40_DEV_UART1, |
22 | + uint16_t flags; | 21 | + AW_R40_DEV_UART2, |
23 | + uint16_t reserved[2]; | 22 | + AW_R40_DEV_UART3, |
24 | /* The actual SVE data immediately follows. It is laid out | 23 | + AW_R40_DEV_UART4, |
25 | * according to TARGET_SVE_SIG_{Z,P}REG_OFFSET, based off of | 24 | + AW_R40_DEV_UART5, |
26 | * the original struct pointer. | 25 | + AW_R40_DEV_UART6, |
27 | @@ -XXX,XX +XXX,XX @@ struct target_sve_context { | 26 | + AW_R40_DEV_UART7, |
28 | #define TARGET_SVE_SIG_CONTEXT_SIZE(VQ) \ | 27 | AW_R40_DEV_GIC_DIST, |
29 | (TARGET_SVE_SIG_PREG_OFFSET(VQ, 17)) | 28 | AW_R40_DEV_GIC_CPU, |
30 | 29 | AW_R40_DEV_GIC_HYP, | |
31 | +#define TARGET_SVE_SIG_FLAG_SM 1 | 30 | @@ -XXX,XX +XXX,XX @@ OBJECT_DECLARE_SIMPLE_TYPE(AwR40State, AW_R40) |
31 | * which are currently emulated by the R40 SoC code. | ||
32 | */ | ||
33 | #define AW_R40_NUM_MMCS 4 | ||
34 | +#define AW_R40_NUM_UARTS 8 | ||
35 | |||
36 | struct AwR40State { | ||
37 | /*< private >*/ | ||
38 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
39 | index XXXXXXX..XXXXXXX 100644 | ||
40 | --- a/hw/arm/allwinner-r40.c | ||
41 | +++ b/hw/arm/allwinner-r40.c | ||
42 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
43 | [AW_R40_DEV_CCU] = 0x01c20000, | ||
44 | [AW_R40_DEV_PIT] = 0x01c20c00, | ||
45 | [AW_R40_DEV_UART0] = 0x01c28000, | ||
46 | + [AW_R40_DEV_UART1] = 0x01c28400, | ||
47 | + [AW_R40_DEV_UART2] = 0x01c28800, | ||
48 | + [AW_R40_DEV_UART3] = 0x01c28c00, | ||
49 | + [AW_R40_DEV_UART4] = 0x01c29000, | ||
50 | + [AW_R40_DEV_UART5] = 0x01c29400, | ||
51 | + [AW_R40_DEV_UART6] = 0x01c29800, | ||
52 | + [AW_R40_DEV_UART7] = 0x01c29c00, | ||
53 | [AW_R40_DEV_GIC_DIST] = 0x01c81000, | ||
54 | [AW_R40_DEV_GIC_CPU] = 0x01c82000, | ||
55 | [AW_R40_DEV_GIC_HYP] = 0x01c84000, | ||
56 | @@ -XXX,XX +XXX,XX @@ enum { | ||
57 | /* Shared Processor Interrupts */ | ||
58 | enum { | ||
59 | AW_R40_GIC_SPI_UART0 = 1, | ||
60 | + AW_R40_GIC_SPI_UART1 = 2, | ||
61 | + AW_R40_GIC_SPI_UART2 = 3, | ||
62 | + AW_R40_GIC_SPI_UART3 = 4, | ||
63 | + AW_R40_GIC_SPI_UART4 = 17, | ||
64 | + AW_R40_GIC_SPI_UART5 = 18, | ||
65 | + AW_R40_GIC_SPI_UART6 = 19, | ||
66 | + AW_R40_GIC_SPI_UART7 = 20, | ||
67 | AW_R40_GIC_SPI_TIMER0 = 22, | ||
68 | AW_R40_GIC_SPI_TIMER1 = 23, | ||
69 | AW_R40_GIC_SPI_MMC0 = 32, | ||
70 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) | ||
71 | } | ||
72 | |||
73 | /* UART0. For future clocktree API: All UARTS are connected to APB2_CLK. */ | ||
74 | - serial_mm_init(get_system_memory(), s->memmap[AW_R40_DEV_UART0], 2, | ||
75 | - qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_UART0), | ||
76 | - 115200, serial_hd(0), DEVICE_NATIVE_ENDIAN); | ||
77 | + for (int i = 0; i < AW_R40_NUM_UARTS; i++) { | ||
78 | + static const int uart_irqs[AW_R40_NUM_UARTS] = { | ||
79 | + AW_R40_GIC_SPI_UART0, | ||
80 | + AW_R40_GIC_SPI_UART1, | ||
81 | + AW_R40_GIC_SPI_UART2, | ||
82 | + AW_R40_GIC_SPI_UART3, | ||
83 | + AW_R40_GIC_SPI_UART4, | ||
84 | + AW_R40_GIC_SPI_UART5, | ||
85 | + AW_R40_GIC_SPI_UART6, | ||
86 | + AW_R40_GIC_SPI_UART7, | ||
87 | + }; | ||
88 | + const hwaddr addr = s->memmap[AW_R40_DEV_UART0 + i]; | ||
32 | + | 89 | + |
33 | struct target_rt_sigframe { | 90 | + serial_mm_init(get_system_memory(), addr, 2, |
34 | struct target_siginfo info; | 91 | + qdev_get_gpio_in(DEVICE(&s->gic), uart_irqs[i]), |
35 | struct target_ucontext uc; | 92 | + 115200, serial_hd(i), DEVICE_NATIVE_ENDIAN); |
36 | @@ -XXX,XX +XXX,XX @@ static void target_setup_sve_record(struct target_sve_context *sve, | ||
37 | { | ||
38 | int i, j; | ||
39 | |||
40 | + memset(sve, 0, sizeof(*sve)); | ||
41 | __put_user(TARGET_SVE_MAGIC, &sve->head.magic); | ||
42 | __put_user(size, &sve->head.size); | ||
43 | __put_user(vq * TARGET_SVE_VQ_BYTES, &sve->vl); | ||
44 | + if (FIELD_EX64(env->svcr, SVCR, SM)) { | ||
45 | + __put_user(TARGET_SVE_SIG_FLAG_SM, &sve->flags); | ||
46 | + } | 93 | + } |
47 | 94 | ||
48 | /* Note that SVE regs are stored as a byte stream, with each byte element | 95 | /* Unimplemented devices */ |
49 | * at a subsequent address. This corresponds to a little-endian store | 96 | for (i = 0; i < ARRAY_SIZE(r40_unimplemented); i++) { |
50 | -- | 97 | -- |
51 | 2.25.1 | 98 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 3 | TWI(i2c) is designed to be used as an interface between CPU host and the |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 4 | serial 2-Wire bus. It can support all standard 2-Wire transfer, can be |
5 | Message-id: 20220708151540.18136-34-richard.henderson@linaro.org | 5 | operated in standard mode(100kbit/s) or fast-mode, supporting data rate |
6 | up to 400kbit/s. | ||
7 | |||
8 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> | ||
9 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 11 | --- |
8 | linux-user/aarch64/target_cpu.h | 5 ++++- | 12 | include/hw/arm/allwinner-r40.h | 3 +++ |
9 | 1 file changed, 4 insertions(+), 1 deletion(-) | 13 | hw/arm/allwinner-r40.c | 11 ++++++++++- |
14 | 2 files changed, 13 insertions(+), 1 deletion(-) | ||
10 | 15 | ||
11 | diff --git a/linux-user/aarch64/target_cpu.h b/linux-user/aarch64/target_cpu.h | 16 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
12 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/linux-user/aarch64/target_cpu.h | 18 | --- a/include/hw/arm/allwinner-r40.h |
14 | +++ b/linux-user/aarch64/target_cpu.h | 19 | +++ b/include/hw/arm/allwinner-r40.h |
15 | @@ -XXX,XX +XXX,XX @@ static inline void cpu_clone_regs_parent(CPUARMState *env, unsigned flags) | 20 | @@ -XXX,XX +XXX,XX @@ |
16 | 21 | #include "hw/intc/arm_gic.h" | |
17 | static inline void cpu_set_tls(CPUARMState *env, target_ulong newtls) | 22 | #include "hw/sd/allwinner-sdhost.h" |
18 | { | 23 | #include "hw/misc/allwinner-r40-ccu.h" |
19 | - /* Note that AArch64 Linux keeps the TLS pointer in TPIDR; this is | 24 | +#include "hw/i2c/allwinner-i2c.h" |
20 | + /* | 25 | #include "target/arm/cpu.h" |
21 | + * Note that AArch64 Linux keeps the TLS pointer in TPIDR; this is | 26 | #include "sysemu/block-backend.h" |
22 | * different from AArch32 Linux, which uses TPIDRRO. | 27 | |
23 | */ | 28 | @@ -XXX,XX +XXX,XX @@ enum { |
24 | env->cp15.tpidr_el[0] = newtls; | 29 | AW_R40_DEV_UART5, |
25 | + /* TPIDR2_EL0 is cleared with CLONE_SETTLS. */ | 30 | AW_R40_DEV_UART6, |
26 | + env->cp15.tpidr2_el0 = 0; | 31 | AW_R40_DEV_UART7, |
32 | + AW_R40_DEV_TWI0, | ||
33 | AW_R40_DEV_GIC_DIST, | ||
34 | AW_R40_DEV_GIC_CPU, | ||
35 | AW_R40_DEV_GIC_HYP, | ||
36 | @@ -XXX,XX +XXX,XX @@ struct AwR40State { | ||
37 | AwA10PITState timer; | ||
38 | AwSdHostState mmc[AW_R40_NUM_MMCS]; | ||
39 | AwR40ClockCtlState ccu; | ||
40 | + AWI2CState i2c0; | ||
41 | GICState gic; | ||
42 | MemoryRegion sram_a1; | ||
43 | MemoryRegion sram_a2; | ||
44 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
45 | index XXXXXXX..XXXXXXX 100644 | ||
46 | --- a/hw/arm/allwinner-r40.c | ||
47 | +++ b/hw/arm/allwinner-r40.c | ||
48 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
49 | [AW_R40_DEV_UART5] = 0x01c29400, | ||
50 | [AW_R40_DEV_UART6] = 0x01c29800, | ||
51 | [AW_R40_DEV_UART7] = 0x01c29c00, | ||
52 | + [AW_R40_DEV_TWI0] = 0x01c2ac00, | ||
53 | [AW_R40_DEV_GIC_DIST] = 0x01c81000, | ||
54 | [AW_R40_DEV_GIC_CPU] = 0x01c82000, | ||
55 | [AW_R40_DEV_GIC_HYP] = 0x01c84000, | ||
56 | @@ -XXX,XX +XXX,XX @@ static struct AwR40Unimplemented r40_unimplemented[] = { | ||
57 | { "uart7", 0x01c29c00, 1 * KiB }, | ||
58 | { "ps20", 0x01c2a000, 1 * KiB }, | ||
59 | { "ps21", 0x01c2a400, 1 * KiB }, | ||
60 | - { "twi0", 0x01c2ac00, 1 * KiB }, | ||
61 | { "twi1", 0x01c2b000, 1 * KiB }, | ||
62 | { "twi2", 0x01c2b400, 1 * KiB }, | ||
63 | { "twi3", 0x01c2b800, 1 * KiB }, | ||
64 | @@ -XXX,XX +XXX,XX @@ enum { | ||
65 | AW_R40_GIC_SPI_UART1 = 2, | ||
66 | AW_R40_GIC_SPI_UART2 = 3, | ||
67 | AW_R40_GIC_SPI_UART3 = 4, | ||
68 | + AW_R40_GIC_SPI_TWI0 = 7, | ||
69 | AW_R40_GIC_SPI_UART4 = 17, | ||
70 | AW_R40_GIC_SPI_UART5 = 18, | ||
71 | AW_R40_GIC_SPI_UART6 = 19, | ||
72 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) | ||
73 | object_initialize_child(obj, mmc_names[i], &s->mmc[i], | ||
74 | TYPE_AW_SDHOST_SUN5I); | ||
75 | } | ||
76 | + | ||
77 | + object_initialize_child(obj, "twi0", &s->i2c0, TYPE_AW_I2C_SUN6I); | ||
27 | } | 78 | } |
28 | 79 | ||
29 | static inline abi_ulong get_sp_from_cpustate(CPUARMState *state) | 80 | static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
81 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) | ||
82 | 115200, serial_hd(i), DEVICE_NATIVE_ENDIAN); | ||
83 | } | ||
84 | |||
85 | + /* I2C */ | ||
86 | + sysbus_realize(SYS_BUS_DEVICE(&s->i2c0), &error_fatal); | ||
87 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->i2c0), 0, s->memmap[AW_R40_DEV_TWI0]); | ||
88 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->i2c0), 0, | ||
89 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_TWI0)); | ||
90 | + | ||
91 | /* Unimplemented devices */ | ||
92 | for (i = 0; i < ARRAY_SIZE(r40_unimplemented); i++) { | ||
93 | create_unimplemented_device(r40_unimplemented[i].device_name, | ||
30 | -- | 94 | -- |
31 | 2.25.1 | 95 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | Mark ADR as a non-streaming instruction, which should trap | 3 | This patch adds minimal support for AXP-221 PMU and connect it to |
4 | if full a64 support is not enabled in streaming mode. | 4 | bananapi M2U board. |
5 | 5 | ||
6 | Removing entries from sme-fa64.decode is an easy way to see | 6 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
7 | what remains to be done. | ||
8 | |||
9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20220708151540.18136-5-richard.henderson@linaro.org | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
13 | --- | 8 | --- |
14 | target/arm/translate.h | 7 +++++++ | 9 | hw/arm/bananapi_m2u.c | 6 + |
15 | target/arm/sme-fa64.decode | 1 - | 10 | hw/misc/axp209.c | 238 ----------------------------------- |
16 | target/arm/translate-sve.c | 8 ++++---- | 11 | hw/misc/axp2xx.c | 283 ++++++++++++++++++++++++++++++++++++++++++ |
17 | 3 files changed, 11 insertions(+), 5 deletions(-) | 12 | hw/arm/Kconfig | 3 +- |
13 | hw/misc/Kconfig | 2 +- | ||
14 | hw/misc/meson.build | 2 +- | ||
15 | hw/misc/trace-events | 8 +- | ||
16 | 7 files changed, 297 insertions(+), 245 deletions(-) | ||
17 | delete mode 100644 hw/misc/axp209.c | ||
18 | create mode 100644 hw/misc/axp2xx.c | ||
18 | 19 | ||
19 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 20 | diff --git a/hw/arm/bananapi_m2u.c b/hw/arm/bananapi_m2u.c |
20 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
21 | --- a/target/arm/translate.h | 22 | --- a/hw/arm/bananapi_m2u.c |
22 | +++ b/target/arm/translate.h | 23 | +++ b/hw/arm/bananapi_m2u.c |
23 | @@ -XXX,XX +XXX,XX @@ uint64_t asimd_imm_const(uint32_t imm, int cmode, int op); | 24 | @@ -XXX,XX +XXX,XX @@ |
24 | static bool trans_##NAME(DisasContext *s, arg_##NAME *a) \ | 25 | #include "qapi/error.h" |
25 | { return dc_isar_feature(FEAT, s) && FUNC(s, __VA_ARGS__); } | 26 | #include "qemu/error-report.h" |
26 | 27 | #include "hw/boards.h" | |
27 | +#define TRANS_FEAT_NONSTREAMING(NAME, FEAT, FUNC, ...) \ | 28 | +#include "hw/i2c/i2c.h" |
28 | + static bool trans_##NAME(DisasContext *s, arg_##NAME *a) \ | 29 | #include "hw/qdev-properties.h" |
29 | + { \ | 30 | #include "hw/arm/allwinner-r40.h" |
30 | + s->is_nonstreaming = true; \ | 31 | |
31 | + return dc_isar_feature(FEAT, s) && FUNC(s, __VA_ARGS__); \ | 32 | @@ -XXX,XX +XXX,XX @@ static void bpim2u_init(MachineState *machine) |
33 | { | ||
34 | bool bootroom_loaded = false; | ||
35 | AwR40State *r40; | ||
36 | + I2CBus *i2c; | ||
37 | |||
38 | /* BIOS is not supported by this board */ | ||
39 | if (machine->firmware) { | ||
40 | @@ -XXX,XX +XXX,XX @@ static void bpim2u_init(MachineState *machine) | ||
41 | } | ||
42 | } | ||
43 | |||
44 | + /* Connect AXP221 */ | ||
45 | + i2c = I2C_BUS(qdev_get_child_bus(DEVICE(&r40->i2c0), "i2c")); | ||
46 | + i2c_slave_create_simple(i2c, "axp221_pmu", 0x34); | ||
47 | + | ||
48 | /* SDRAM */ | ||
49 | memory_region_add_subregion(get_system_memory(), | ||
50 | r40->memmap[AW_R40_DEV_SDRAM], machine->ram); | ||
51 | diff --git a/hw/misc/axp209.c b/hw/misc/axp209.c | ||
52 | deleted file mode 100644 | ||
53 | index XXXXXXX..XXXXXXX | ||
54 | --- a/hw/misc/axp209.c | ||
55 | +++ /dev/null | ||
56 | @@ -XXX,XX +XXX,XX @@ | ||
57 | -/* | ||
58 | - * AXP-209 PMU Emulation | ||
59 | - * | ||
60 | - * Copyright (C) 2022 Strahinja Jankovic <strahinja.p.jankovic@gmail.com> | ||
61 | - * | ||
62 | - * Permission is hereby granted, free of charge, to any person obtaining a | ||
63 | - * copy of this software and associated documentation files (the "Software"), | ||
64 | - * to deal in the Software without restriction, including without limitation | ||
65 | - * the rights to use, copy, modify, merge, publish, distribute, sublicense, | ||
66 | - * and/or sell copies of the Software, and to permit persons to whom the | ||
67 | - * Software is furnished to do so, subject to the following conditions: | ||
68 | - * | ||
69 | - * The above copyright notice and this permission notice shall be included in | ||
70 | - * all copies or substantial portions of the Software. | ||
71 | - * | ||
72 | - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
73 | - * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
74 | - * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||
75 | - * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
76 | - * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING | ||
77 | - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER | ||
78 | - * DEALINGS IN THE SOFTWARE. | ||
79 | - * | ||
80 | - * SPDX-License-Identifier: MIT | ||
81 | - */ | ||
82 | - | ||
83 | -#include "qemu/osdep.h" | ||
84 | -#include "qemu/log.h" | ||
85 | -#include "trace.h" | ||
86 | -#include "hw/i2c/i2c.h" | ||
87 | -#include "migration/vmstate.h" | ||
88 | - | ||
89 | -#define TYPE_AXP209_PMU "axp209_pmu" | ||
90 | - | ||
91 | -#define AXP209(obj) \ | ||
92 | - OBJECT_CHECK(AXP209I2CState, (obj), TYPE_AXP209_PMU) | ||
93 | - | ||
94 | -/* registers */ | ||
95 | -enum { | ||
96 | - REG_POWER_STATUS = 0x0u, | ||
97 | - REG_OPERATING_MODE, | ||
98 | - REG_OTG_VBUS_STATUS, | ||
99 | - REG_CHIP_VERSION, | ||
100 | - REG_DATA_CACHE_0, | ||
101 | - REG_DATA_CACHE_1, | ||
102 | - REG_DATA_CACHE_2, | ||
103 | - REG_DATA_CACHE_3, | ||
104 | - REG_DATA_CACHE_4, | ||
105 | - REG_DATA_CACHE_5, | ||
106 | - REG_DATA_CACHE_6, | ||
107 | - REG_DATA_CACHE_7, | ||
108 | - REG_DATA_CACHE_8, | ||
109 | - REG_DATA_CACHE_9, | ||
110 | - REG_DATA_CACHE_A, | ||
111 | - REG_DATA_CACHE_B, | ||
112 | - REG_POWER_OUTPUT_CTRL = 0x12u, | ||
113 | - REG_DC_DC2_OUT_V_CTRL = 0x23u, | ||
114 | - REG_DC_DC2_DVS_CTRL = 0x25u, | ||
115 | - REG_DC_DC3_OUT_V_CTRL = 0x27u, | ||
116 | - REG_LDO2_4_OUT_V_CTRL, | ||
117 | - REG_LDO3_OUT_V_CTRL, | ||
118 | - REG_VBUS_CH_MGMT = 0x30u, | ||
119 | - REG_SHUTDOWN_V_CTRL, | ||
120 | - REG_SHUTDOWN_CTRL, | ||
121 | - REG_CHARGE_CTRL_1, | ||
122 | - REG_CHARGE_CTRL_2, | ||
123 | - REG_SPARE_CHARGE_CTRL, | ||
124 | - REG_PEK_KEY_CTRL, | ||
125 | - REG_DC_DC_FREQ_SET, | ||
126 | - REG_CHR_TEMP_TH_SET, | ||
127 | - REG_CHR_HIGH_TEMP_TH_CTRL, | ||
128 | - REG_IPSOUT_WARN_L1, | ||
129 | - REG_IPSOUT_WARN_L2, | ||
130 | - REG_DISCHR_TEMP_TH_SET, | ||
131 | - REG_DISCHR_HIGH_TEMP_TH_CTRL, | ||
132 | - REG_IRQ_BANK_1_CTRL = 0x40u, | ||
133 | - REG_IRQ_BANK_2_CTRL, | ||
134 | - REG_IRQ_BANK_3_CTRL, | ||
135 | - REG_IRQ_BANK_4_CTRL, | ||
136 | - REG_IRQ_BANK_5_CTRL, | ||
137 | - REG_IRQ_BANK_1_STAT = 0x48u, | ||
138 | - REG_IRQ_BANK_2_STAT, | ||
139 | - REG_IRQ_BANK_3_STAT, | ||
140 | - REG_IRQ_BANK_4_STAT, | ||
141 | - REG_IRQ_BANK_5_STAT, | ||
142 | - REG_ADC_ACIN_V_H = 0x56u, | ||
143 | - REG_ADC_ACIN_V_L, | ||
144 | - REG_ADC_ACIN_CURR_H, | ||
145 | - REG_ADC_ACIN_CURR_L, | ||
146 | - REG_ADC_VBUS_V_H, | ||
147 | - REG_ADC_VBUS_V_L, | ||
148 | - REG_ADC_VBUS_CURR_H, | ||
149 | - REG_ADC_VBUS_CURR_L, | ||
150 | - REG_ADC_INT_TEMP_H, | ||
151 | - REG_ADC_INT_TEMP_L, | ||
152 | - REG_ADC_TEMP_SENS_V_H = 0x62u, | ||
153 | - REG_ADC_TEMP_SENS_V_L, | ||
154 | - REG_ADC_BAT_V_H = 0x78u, | ||
155 | - REG_ADC_BAT_V_L, | ||
156 | - REG_ADC_BAT_DISCHR_CURR_H, | ||
157 | - REG_ADC_BAT_DISCHR_CURR_L, | ||
158 | - REG_ADC_BAT_CHR_CURR_H, | ||
159 | - REG_ADC_BAT_CHR_CURR_L, | ||
160 | - REG_ADC_IPSOUT_V_H, | ||
161 | - REG_ADC_IPSOUT_V_L, | ||
162 | - REG_DC_DC_MOD_SEL = 0x80u, | ||
163 | - REG_ADC_EN_1, | ||
164 | - REG_ADC_EN_2, | ||
165 | - REG_ADC_SR_CTRL, | ||
166 | - REG_ADC_IN_RANGE, | ||
167 | - REG_GPIO1_ADC_IRQ_RISING_TH, | ||
168 | - REG_GPIO1_ADC_IRQ_FALLING_TH, | ||
169 | - REG_TIMER_CTRL = 0x8au, | ||
170 | - REG_VBUS_CTRL_MON_SRP, | ||
171 | - REG_OVER_TEMP_SHUTDOWN = 0x8fu, | ||
172 | - REG_GPIO0_FEAT_SET, | ||
173 | - REG_GPIO_OUT_HIGH_SET, | ||
174 | - REG_GPIO1_FEAT_SET, | ||
175 | - REG_GPIO2_FEAT_SET, | ||
176 | - REG_GPIO_SIG_STATE_SET_MON, | ||
177 | - REG_GPIO3_SET, | ||
178 | - REG_COULOMB_CNTR_CTRL = 0xb8u, | ||
179 | - REG_POWER_MEAS_RES, | ||
180 | - NR_REGS | ||
181 | -}; | ||
182 | - | ||
183 | -#define AXP209_CHIP_VERSION_ID (0x01) | ||
184 | -#define AXP209_DC_DC2_OUT_V_CTRL_RESET (0x16) | ||
185 | -#define AXP209_IRQ_BANK_1_CTRL_RESET (0xd8) | ||
186 | - | ||
187 | -/* A simple I2C slave which returns values of ID or CNT register. */ | ||
188 | -typedef struct AXP209I2CState { | ||
189 | - /*< private >*/ | ||
190 | - I2CSlave i2c; | ||
191 | - /*< public >*/ | ||
192 | - uint8_t regs[NR_REGS]; /* peripheral registers */ | ||
193 | - uint8_t ptr; /* current register index */ | ||
194 | - uint8_t count; /* counter used for tx/rx */ | ||
195 | -} AXP209I2CState; | ||
196 | - | ||
197 | -/* Reset all counters and load ID register */ | ||
198 | -static void axp209_reset_enter(Object *obj, ResetType type) | ||
199 | -{ | ||
200 | - AXP209I2CState *s = AXP209(obj); | ||
201 | - | ||
202 | - memset(s->regs, 0, NR_REGS); | ||
203 | - s->ptr = 0; | ||
204 | - s->count = 0; | ||
205 | - s->regs[REG_CHIP_VERSION] = AXP209_CHIP_VERSION_ID; | ||
206 | - s->regs[REG_DC_DC2_OUT_V_CTRL] = AXP209_DC_DC2_OUT_V_CTRL_RESET; | ||
207 | - s->regs[REG_IRQ_BANK_1_CTRL] = AXP209_IRQ_BANK_1_CTRL_RESET; | ||
208 | -} | ||
209 | - | ||
210 | -/* Handle events from master. */ | ||
211 | -static int axp209_event(I2CSlave *i2c, enum i2c_event event) | ||
212 | -{ | ||
213 | - AXP209I2CState *s = AXP209(i2c); | ||
214 | - | ||
215 | - s->count = 0; | ||
216 | - | ||
217 | - return 0; | ||
218 | -} | ||
219 | - | ||
220 | -/* Called when master requests read */ | ||
221 | -static uint8_t axp209_rx(I2CSlave *i2c) | ||
222 | -{ | ||
223 | - AXP209I2CState *s = AXP209(i2c); | ||
224 | - uint8_t ret = 0xff; | ||
225 | - | ||
226 | - if (s->ptr < NR_REGS) { | ||
227 | - ret = s->regs[s->ptr++]; | ||
228 | - } | ||
229 | - | ||
230 | - trace_axp209_rx(s->ptr - 1, ret); | ||
231 | - | ||
232 | - return ret; | ||
233 | -} | ||
234 | - | ||
235 | -/* | ||
236 | - * Called when master sends write. | ||
237 | - * Update ptr with byte 0, then perform write with second byte. | ||
238 | - */ | ||
239 | -static int axp209_tx(I2CSlave *i2c, uint8_t data) | ||
240 | -{ | ||
241 | - AXP209I2CState *s = AXP209(i2c); | ||
242 | - | ||
243 | - if (s->count == 0) { | ||
244 | - /* Store register address */ | ||
245 | - s->ptr = data; | ||
246 | - s->count++; | ||
247 | - trace_axp209_select(data); | ||
248 | - } else { | ||
249 | - trace_axp209_tx(s->ptr, data); | ||
250 | - if (s->ptr == REG_DC_DC2_OUT_V_CTRL) { | ||
251 | - s->regs[s->ptr++] = data; | ||
252 | - } | ||
253 | - } | ||
254 | - | ||
255 | - return 0; | ||
256 | -} | ||
257 | - | ||
258 | -static const VMStateDescription vmstate_axp209 = { | ||
259 | - .name = TYPE_AXP209_PMU, | ||
260 | - .version_id = 1, | ||
261 | - .fields = (VMStateField[]) { | ||
262 | - VMSTATE_UINT8_ARRAY(regs, AXP209I2CState, NR_REGS), | ||
263 | - VMSTATE_UINT8(count, AXP209I2CState), | ||
264 | - VMSTATE_UINT8(ptr, AXP209I2CState), | ||
265 | - VMSTATE_END_OF_LIST() | ||
266 | - } | ||
267 | -}; | ||
268 | - | ||
269 | -static void axp209_class_init(ObjectClass *oc, void *data) | ||
270 | -{ | ||
271 | - DeviceClass *dc = DEVICE_CLASS(oc); | ||
272 | - I2CSlaveClass *isc = I2C_SLAVE_CLASS(oc); | ||
273 | - ResettableClass *rc = RESETTABLE_CLASS(oc); | ||
274 | - | ||
275 | - rc->phases.enter = axp209_reset_enter; | ||
276 | - dc->vmsd = &vmstate_axp209; | ||
277 | - isc->event = axp209_event; | ||
278 | - isc->recv = axp209_rx; | ||
279 | - isc->send = axp209_tx; | ||
280 | -} | ||
281 | - | ||
282 | -static const TypeInfo axp209_info = { | ||
283 | - .name = TYPE_AXP209_PMU, | ||
284 | - .parent = TYPE_I2C_SLAVE, | ||
285 | - .instance_size = sizeof(AXP209I2CState), | ||
286 | - .class_init = axp209_class_init | ||
287 | -}; | ||
288 | - | ||
289 | -static void axp209_register_devices(void) | ||
290 | -{ | ||
291 | - type_register_static(&axp209_info); | ||
292 | -} | ||
293 | - | ||
294 | -type_init(axp209_register_devices); | ||
295 | diff --git a/hw/misc/axp2xx.c b/hw/misc/axp2xx.c | ||
296 | new file mode 100644 | ||
297 | index XXXXXXX..XXXXXXX | ||
298 | --- /dev/null | ||
299 | +++ b/hw/misc/axp2xx.c | ||
300 | @@ -XXX,XX +XXX,XX @@ | ||
301 | +/* | ||
302 | + * AXP-2XX PMU Emulation, supported lists: | ||
303 | + * AXP209 | ||
304 | + * AXP221 | ||
305 | + * | ||
306 | + * Copyright (C) 2022 Strahinja Jankovic <strahinja.p.jankovic@gmail.com> | ||
307 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> | ||
308 | + * | ||
309 | + * Permission is hereby granted, free of charge, to any person obtaining a | ||
310 | + * copy of this software and associated documentation files (the "Software"), | ||
311 | + * to deal in the Software without restriction, including without limitation | ||
312 | + * the rights to use, copy, modify, merge, publish, distribute, sublicense, | ||
313 | + * and/or sell copies of the Software, and to permit persons to whom the | ||
314 | + * Software is furnished to do so, subject to the following conditions: | ||
315 | + * | ||
316 | + * The above copyright notice and this permission notice shall be included in | ||
317 | + * all copies or substantial portions of the Software. | ||
318 | + * | ||
319 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
320 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
321 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||
322 | + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
323 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING | ||
324 | + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER | ||
325 | + * DEALINGS IN THE SOFTWARE. | ||
326 | + * | ||
327 | + * SPDX-License-Identifier: MIT | ||
328 | + */ | ||
329 | + | ||
330 | +#include "qemu/osdep.h" | ||
331 | +#include "qemu/log.h" | ||
332 | +#include "qom/object.h" | ||
333 | +#include "trace.h" | ||
334 | +#include "hw/i2c/i2c.h" | ||
335 | +#include "migration/vmstate.h" | ||
336 | + | ||
337 | +#define TYPE_AXP2XX "axp2xx_pmu" | ||
338 | +#define TYPE_AXP209_PMU "axp209_pmu" | ||
339 | +#define TYPE_AXP221_PMU "axp221_pmu" | ||
340 | + | ||
341 | +OBJECT_DECLARE_TYPE(AXP2xxI2CState, AXP2xxClass, AXP2XX) | ||
342 | + | ||
343 | +#define NR_REGS (0xff) | ||
344 | + | ||
345 | +/* A simple I2C slave which returns values of ID or CNT register. */ | ||
346 | +typedef struct AXP2xxI2CState { | ||
347 | + /*< private >*/ | ||
348 | + I2CSlave i2c; | ||
349 | + /*< public >*/ | ||
350 | + uint8_t regs[NR_REGS]; /* peripheral registers */ | ||
351 | + uint8_t ptr; /* current register index */ | ||
352 | + uint8_t count; /* counter used for tx/rx */ | ||
353 | +} AXP2xxI2CState; | ||
354 | + | ||
355 | +typedef struct AXP2xxClass { | ||
356 | + /*< private >*/ | ||
357 | + I2CSlaveClass parent_class; | ||
358 | + /*< public >*/ | ||
359 | + void (*reset_enter)(AXP2xxI2CState *s, ResetType type); | ||
360 | +} AXP2xxClass; | ||
361 | + | ||
362 | +#define AXP209_CHIP_VERSION_ID (0x01) | ||
363 | +#define AXP209_DC_DC2_OUT_V_CTRL_RESET (0x16) | ||
364 | + | ||
365 | +/* Reset all counters and load ID register */ | ||
366 | +static void axp209_reset_enter(AXP2xxI2CState *s, ResetType type) | ||
367 | +{ | ||
368 | + memset(s->regs, 0, NR_REGS); | ||
369 | + s->ptr = 0; | ||
370 | + s->count = 0; | ||
371 | + | ||
372 | + s->regs[0x03] = AXP209_CHIP_VERSION_ID; | ||
373 | + s->regs[0x23] = AXP209_DC_DC2_OUT_V_CTRL_RESET; | ||
374 | + | ||
375 | + s->regs[0x30] = 0x60; | ||
376 | + s->regs[0x32] = 0x46; | ||
377 | + s->regs[0x34] = 0x41; | ||
378 | + s->regs[0x35] = 0x22; | ||
379 | + s->regs[0x36] = 0x5d; | ||
380 | + s->regs[0x37] = 0x08; | ||
381 | + s->regs[0x38] = 0xa5; | ||
382 | + s->regs[0x39] = 0x1f; | ||
383 | + s->regs[0x3a] = 0x68; | ||
384 | + s->regs[0x3b] = 0x5f; | ||
385 | + s->regs[0x3c] = 0xfc; | ||
386 | + s->regs[0x3d] = 0x16; | ||
387 | + s->regs[0x40] = 0xd8; | ||
388 | + s->regs[0x42] = 0xff; | ||
389 | + s->regs[0x43] = 0x3b; | ||
390 | + s->regs[0x80] = 0xe0; | ||
391 | + s->regs[0x82] = 0x83; | ||
392 | + s->regs[0x83] = 0x80; | ||
393 | + s->regs[0x84] = 0x32; | ||
394 | + s->regs[0x86] = 0xff; | ||
395 | + s->regs[0x90] = 0x07; | ||
396 | + s->regs[0x91] = 0xa0; | ||
397 | + s->regs[0x92] = 0x07; | ||
398 | + s->regs[0x93] = 0x07; | ||
399 | +} | ||
400 | + | ||
401 | +#define AXP221_PWR_STATUS_ACIN_PRESENT BIT(7) | ||
402 | +#define AXP221_PWR_STATUS_ACIN_AVAIL BIT(6) | ||
403 | +#define AXP221_PWR_STATUS_VBUS_PRESENT BIT(5) | ||
404 | +#define AXP221_PWR_STATUS_VBUS_USED BIT(4) | ||
405 | +#define AXP221_PWR_STATUS_BAT_CHARGING BIT(2) | ||
406 | +#define AXP221_PWR_STATUS_ACIN_VBUS_POWERED BIT(1) | ||
407 | + | ||
408 | +/* Reset all counters and load ID register */ | ||
409 | +static void axp221_reset_enter(AXP2xxI2CState *s, ResetType type) | ||
410 | +{ | ||
411 | + memset(s->regs, 0, NR_REGS); | ||
412 | + s->ptr = 0; | ||
413 | + s->count = 0; | ||
414 | + | ||
415 | + /* input power status register */ | ||
416 | + s->regs[0x00] = AXP221_PWR_STATUS_ACIN_PRESENT | ||
417 | + | AXP221_PWR_STATUS_ACIN_AVAIL | ||
418 | + | AXP221_PWR_STATUS_ACIN_VBUS_POWERED; | ||
419 | + | ||
420 | + s->regs[0x01] = 0x00; /* no battery is connected */ | ||
421 | + | ||
422 | + /* | ||
423 | + * CHIPID register, no documented on datasheet, but it is checked in | ||
424 | + * u-boot spl. I had read it from AXP221s and got 0x06 value. | ||
425 | + * So leave 06h here. | ||
426 | + */ | ||
427 | + s->regs[0x03] = 0x06; | ||
428 | + | ||
429 | + s->regs[0x10] = 0xbf; | ||
430 | + s->regs[0x13] = 0x01; | ||
431 | + s->regs[0x30] = 0x60; | ||
432 | + s->regs[0x31] = 0x03; | ||
433 | + s->regs[0x32] = 0x43; | ||
434 | + s->regs[0x33] = 0xc6; | ||
435 | + s->regs[0x34] = 0x45; | ||
436 | + s->regs[0x35] = 0x0e; | ||
437 | + s->regs[0x36] = 0x5d; | ||
438 | + s->regs[0x37] = 0x08; | ||
439 | + s->regs[0x38] = 0xa5; | ||
440 | + s->regs[0x39] = 0x1f; | ||
441 | + s->regs[0x3c] = 0xfc; | ||
442 | + s->regs[0x3d] = 0x16; | ||
443 | + s->regs[0x80] = 0x80; | ||
444 | + s->regs[0x82] = 0xe0; | ||
445 | + s->regs[0x84] = 0x32; | ||
446 | + s->regs[0x8f] = 0x01; | ||
447 | + | ||
448 | + s->regs[0x90] = 0x07; | ||
449 | + s->regs[0x91] = 0x1f; | ||
450 | + s->regs[0x92] = 0x07; | ||
451 | + s->regs[0x93] = 0x1f; | ||
452 | + | ||
453 | + s->regs[0x40] = 0xd8; | ||
454 | + s->regs[0x41] = 0xff; | ||
455 | + s->regs[0x42] = 0x03; | ||
456 | + s->regs[0x43] = 0x03; | ||
457 | + | ||
458 | + s->regs[0xb8] = 0xc0; | ||
459 | + s->regs[0xb9] = 0x64; | ||
460 | + s->regs[0xe6] = 0xa0; | ||
461 | +} | ||
462 | + | ||
463 | +static void axp2xx_reset_enter(Object *obj, ResetType type) | ||
464 | +{ | ||
465 | + AXP2xxI2CState *s = AXP2XX(obj); | ||
466 | + AXP2xxClass *sc = AXP2XX_GET_CLASS(s); | ||
467 | + | ||
468 | + sc->reset_enter(s, type); | ||
469 | +} | ||
470 | + | ||
471 | +/* Handle events from master. */ | ||
472 | +static int axp2xx_event(I2CSlave *i2c, enum i2c_event event) | ||
473 | +{ | ||
474 | + AXP2xxI2CState *s = AXP2XX(i2c); | ||
475 | + | ||
476 | + s->count = 0; | ||
477 | + | ||
478 | + return 0; | ||
479 | +} | ||
480 | + | ||
481 | +/* Called when master requests read */ | ||
482 | +static uint8_t axp2xx_rx(I2CSlave *i2c) | ||
483 | +{ | ||
484 | + AXP2xxI2CState *s = AXP2XX(i2c); | ||
485 | + uint8_t ret = 0xff; | ||
486 | + | ||
487 | + if (s->ptr < NR_REGS) { | ||
488 | + ret = s->regs[s->ptr++]; | ||
32 | + } | 489 | + } |
33 | + | 490 | + |
34 | #endif /* TARGET_ARM_TRANSLATE_H */ | 491 | + trace_axp2xx_rx(s->ptr - 1, ret); |
35 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 492 | + |
493 | + return ret; | ||
494 | +} | ||
495 | + | ||
496 | +/* | ||
497 | + * Called when master sends write. | ||
498 | + * Update ptr with byte 0, then perform write with second byte. | ||
499 | + */ | ||
500 | +static int axp2xx_tx(I2CSlave *i2c, uint8_t data) | ||
501 | +{ | ||
502 | + AXP2xxI2CState *s = AXP2XX(i2c); | ||
503 | + | ||
504 | + if (s->count == 0) { | ||
505 | + /* Store register address */ | ||
506 | + s->ptr = data; | ||
507 | + s->count++; | ||
508 | + trace_axp2xx_select(data); | ||
509 | + } else { | ||
510 | + trace_axp2xx_tx(s->ptr, data); | ||
511 | + s->regs[s->ptr++] = data; | ||
512 | + } | ||
513 | + | ||
514 | + return 0; | ||
515 | +} | ||
516 | + | ||
517 | +static const VMStateDescription vmstate_axp2xx = { | ||
518 | + .name = TYPE_AXP2XX, | ||
519 | + .version_id = 1, | ||
520 | + .fields = (VMStateField[]) { | ||
521 | + VMSTATE_UINT8_ARRAY(regs, AXP2xxI2CState, NR_REGS), | ||
522 | + VMSTATE_UINT8(ptr, AXP2xxI2CState), | ||
523 | + VMSTATE_UINT8(count, AXP2xxI2CState), | ||
524 | + VMSTATE_END_OF_LIST() | ||
525 | + } | ||
526 | +}; | ||
527 | + | ||
528 | +static void axp2xx_class_init(ObjectClass *oc, void *data) | ||
529 | +{ | ||
530 | + DeviceClass *dc = DEVICE_CLASS(oc); | ||
531 | + I2CSlaveClass *isc = I2C_SLAVE_CLASS(oc); | ||
532 | + ResettableClass *rc = RESETTABLE_CLASS(oc); | ||
533 | + | ||
534 | + rc->phases.enter = axp2xx_reset_enter; | ||
535 | + dc->vmsd = &vmstate_axp2xx; | ||
536 | + isc->event = axp2xx_event; | ||
537 | + isc->recv = axp2xx_rx; | ||
538 | + isc->send = axp2xx_tx; | ||
539 | +} | ||
540 | + | ||
541 | +static const TypeInfo axp2xx_info = { | ||
542 | + .name = TYPE_AXP2XX, | ||
543 | + .parent = TYPE_I2C_SLAVE, | ||
544 | + .instance_size = sizeof(AXP2xxI2CState), | ||
545 | + .class_size = sizeof(AXP2xxClass), | ||
546 | + .class_init = axp2xx_class_init, | ||
547 | + .abstract = true, | ||
548 | +}; | ||
549 | + | ||
550 | +static void axp209_class_init(ObjectClass *oc, void *data) | ||
551 | +{ | ||
552 | + AXP2xxClass *sc = AXP2XX_CLASS(oc); | ||
553 | + | ||
554 | + sc->reset_enter = axp209_reset_enter; | ||
555 | +} | ||
556 | + | ||
557 | +static const TypeInfo axp209_info = { | ||
558 | + .name = TYPE_AXP209_PMU, | ||
559 | + .parent = TYPE_AXP2XX, | ||
560 | + .class_init = axp209_class_init | ||
561 | +}; | ||
562 | + | ||
563 | +static void axp221_class_init(ObjectClass *oc, void *data) | ||
564 | +{ | ||
565 | + AXP2xxClass *sc = AXP2XX_CLASS(oc); | ||
566 | + | ||
567 | + sc->reset_enter = axp221_reset_enter; | ||
568 | +} | ||
569 | + | ||
570 | +static const TypeInfo axp221_info = { | ||
571 | + .name = TYPE_AXP221_PMU, | ||
572 | + .parent = TYPE_AXP2XX, | ||
573 | + .class_init = axp221_class_init, | ||
574 | +}; | ||
575 | + | ||
576 | +static void axp2xx_register_devices(void) | ||
577 | +{ | ||
578 | + type_register_static(&axp2xx_info); | ||
579 | + type_register_static(&axp209_info); | ||
580 | + type_register_static(&axp221_info); | ||
581 | +} | ||
582 | + | ||
583 | +type_init(axp2xx_register_devices); | ||
584 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
36 | index XXXXXXX..XXXXXXX 100644 | 585 | index XXXXXXX..XXXXXXX 100644 |
37 | --- a/target/arm/sme-fa64.decode | 586 | --- a/hw/arm/Kconfig |
38 | +++ b/target/arm/sme-fa64.decode | 587 | +++ b/hw/arm/Kconfig |
39 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 588 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_A10 |
40 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 589 | select ALLWINNER_WDT |
41 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 590 | select ALLWINNER_EMAC |
42 | 591 | select ALLWINNER_I2C | |
43 | -FAIL 0000 0100 --1- ---- 1010 ---- ---- ---- # ADR | 592 | - select AXP209_PMU |
44 | FAIL 0000 0100 --1- ---- 1011 -0-- ---- ---- # FTSSEL, FEXPA | 593 | + select AXP2XX_PMU |
45 | FAIL 0000 0101 --10 0001 100- ---- ---- ---- # COMPACT | 594 | select SERIAL |
46 | FAIL 0010 0101 --01 100- 1111 000- ---0 ---- # RDFFR, RDFFRS | 595 | select UNIMP |
47 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 596 | |
597 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_R40 | ||
598 | bool | ||
599 | default y if TCG && ARM | ||
600 | select ALLWINNER_A10_PIT | ||
601 | + select AXP2XX_PMU | ||
602 | select SERIAL | ||
603 | select ARM_TIMER | ||
604 | select ARM_GIC | ||
605 | diff --git a/hw/misc/Kconfig b/hw/misc/Kconfig | ||
48 | index XXXXXXX..XXXXXXX 100644 | 606 | index XXXXXXX..XXXXXXX 100644 |
49 | --- a/target/arm/translate-sve.c | 607 | --- a/hw/misc/Kconfig |
50 | +++ b/target/arm/translate-sve.c | 608 | +++ b/hw/misc/Kconfig |
51 | @@ -XXX,XX +XXX,XX @@ static bool do_adr(DisasContext *s, arg_rrri *a, gen_helper_gvec_3 *fn) | 609 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_A10_CCM |
52 | return gen_gvec_ool_zzz(s, fn, a->rd, a->rn, a->rm, a->imm); | 610 | config ALLWINNER_A10_DRAMC |
53 | } | 611 | bool |
54 | 612 | ||
55 | -TRANS_FEAT(ADR_p32, aa64_sve, do_adr, a, gen_helper_sve_adr_p32) | 613 | -config AXP209_PMU |
56 | -TRANS_FEAT(ADR_p64, aa64_sve, do_adr, a, gen_helper_sve_adr_p64) | 614 | +config AXP2XX_PMU |
57 | -TRANS_FEAT(ADR_s32, aa64_sve, do_adr, a, gen_helper_sve_adr_s32) | 615 | bool |
58 | -TRANS_FEAT(ADR_u32, aa64_sve, do_adr, a, gen_helper_sve_adr_u32) | 616 | depends on I2C |
59 | +TRANS_FEAT_NONSTREAMING(ADR_p32, aa64_sve, do_adr, a, gen_helper_sve_adr_p32) | 617 | |
60 | +TRANS_FEAT_NONSTREAMING(ADR_p64, aa64_sve, do_adr, a, gen_helper_sve_adr_p64) | 618 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build |
61 | +TRANS_FEAT_NONSTREAMING(ADR_s32, aa64_sve, do_adr, a, gen_helper_sve_adr_s32) | 619 | index XXXXXXX..XXXXXXX 100644 |
62 | +TRANS_FEAT_NONSTREAMING(ADR_u32, aa64_sve, do_adr, a, gen_helper_sve_adr_u32) | 620 | --- a/hw/misc/meson.build |
63 | 621 | +++ b/hw/misc/meson.build | |
64 | /* | 622 | @@ -XXX,XX +XXX,XX @@ softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-dramc.c |
65 | *** SVE Integer Misc - Unpredicated Group | 623 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-sysctrl.c')) |
624 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-sid.c')) | ||
625 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_R40', if_true: files('allwinner-r40-ccu.c')) | ||
626 | -softmmu_ss.add(when: 'CONFIG_AXP209_PMU', if_true: files('axp209.c')) | ||
627 | +softmmu_ss.add(when: 'CONFIG_AXP2XX_PMU', if_true: files('axp2xx.c')) | ||
628 | softmmu_ss.add(when: 'CONFIG_REALVIEW', if_true: files('arm_sysctl.c')) | ||
629 | softmmu_ss.add(when: 'CONFIG_NSERIES', if_true: files('cbus.c')) | ||
630 | softmmu_ss.add(when: 'CONFIG_ECCMEMCTL', if_true: files('eccmemctl.c')) | ||
631 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events | ||
632 | index XXXXXXX..XXXXXXX 100644 | ||
633 | --- a/hw/misc/trace-events | ||
634 | +++ b/hw/misc/trace-events | ||
635 | @@ -XXX,XX +XXX,XX @@ allwinner_sid_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" | ||
636 | avr_power_read(uint8_t value) "power_reduc read value:%u" | ||
637 | avr_power_write(uint8_t value) "power_reduc write value:%u" | ||
638 | |||
639 | -# axp209.c | ||
640 | -axp209_rx(uint8_t reg, uint8_t data) "Read reg 0x%" PRIx8 " : 0x%" PRIx8 | ||
641 | -axp209_select(uint8_t reg) "Accessing reg 0x%" PRIx8 | ||
642 | -axp209_tx(uint8_t reg, uint8_t data) "Write reg 0x%" PRIx8 " : 0x%" PRIx8 | ||
643 | +# axp2xx | ||
644 | +axp2xx_rx(uint8_t reg, uint8_t data) "Read reg 0x%" PRIx8 " : 0x%" PRIx8 | ||
645 | +axp2xx_select(uint8_t reg) "Accessing reg 0x%" PRIx8 | ||
646 | +axp2xx_tx(uint8_t reg, uint8_t data) "Write reg 0x%" PRIx8 " : 0x%" PRIx8 | ||
647 | |||
648 | # eccmemctl.c | ||
649 | ecc_mem_writel_mer(uint32_t val) "Write memory enable 0x%08x" | ||
66 | -- | 650 | -- |
67 | 2.25.1 | 651 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | This includes the build rules for the decoder, and the | 3 | Types of memory that the SDRAM controller supports are DDR2/DDR3 |
4 | new file for translation, but excludes any instructions. | 4 | and capacities of up to 2GiB. This commit adds emulation support |
5 | of the Allwinner R40 SDRAM controller. | ||
5 | 6 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | This driver only support 256M, 512M and 1024M memory now. |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | |
8 | Message-id: 20220708151540.18136-3-richard.henderson@linaro.org | 9 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | target/arm/translate-a64.h | 1 + | 12 | include/hw/arm/allwinner-r40.h | 13 +- |
12 | target/arm/sme.decode | 20 ++++++++++++++++++++ | 13 | include/hw/misc/allwinner-r40-dramc.h | 108 ++++++ |
13 | target/arm/translate-a64.c | 7 ++++++- | 14 | hw/arm/allwinner-r40.c | 21 +- |
14 | target/arm/translate-sme.c | 35 +++++++++++++++++++++++++++++++++++ | 15 | hw/arm/bananapi_m2u.c | 7 + |
15 | target/arm/meson.build | 2 ++ | 16 | hw/misc/allwinner-r40-dramc.c | 513 ++++++++++++++++++++++++++ |
16 | 5 files changed, 64 insertions(+), 1 deletion(-) | 17 | hw/misc/meson.build | 1 + |
17 | create mode 100644 target/arm/sme.decode | 18 | hw/misc/trace-events | 14 + |
18 | create mode 100644 target/arm/translate-sme.c | 19 | 7 files changed, 674 insertions(+), 3 deletions(-) |
20 | create mode 100644 include/hw/misc/allwinner-r40-dramc.h | ||
21 | create mode 100644 hw/misc/allwinner-r40-dramc.c | ||
19 | 22 | ||
20 | diff --git a/target/arm/translate-a64.h b/target/arm/translate-a64.h | 23 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
21 | index XXXXXXX..XXXXXXX 100644 | 24 | index XXXXXXX..XXXXXXX 100644 |
22 | --- a/target/arm/translate-a64.h | 25 | --- a/include/hw/arm/allwinner-r40.h |
23 | +++ b/target/arm/translate-a64.h | 26 | +++ b/include/hw/arm/allwinner-r40.h |
24 | @@ -XXX,XX +XXX,XX @@ static inline int pred_gvec_reg_size(DisasContext *s) | 27 | @@ -XXX,XX +XXX,XX @@ |
25 | } | 28 | #include "hw/intc/arm_gic.h" |
26 | 29 | #include "hw/sd/allwinner-sdhost.h" | |
27 | bool disas_sve(DisasContext *, uint32_t); | 30 | #include "hw/misc/allwinner-r40-ccu.h" |
28 | +bool disas_sme(DisasContext *, uint32_t); | 31 | +#include "hw/misc/allwinner-r40-dramc.h" |
29 | 32 | #include "hw/i2c/allwinner-i2c.h" | |
30 | void gen_gvec_rax1(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs, | 33 | #include "target/arm/cpu.h" |
31 | uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz); | 34 | #include "sysemu/block-backend.h" |
32 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | 35 | @@ -XXX,XX +XXX,XX @@ enum { |
36 | AW_R40_DEV_GIC_CPU, | ||
37 | AW_R40_DEV_GIC_HYP, | ||
38 | AW_R40_DEV_GIC_VCPU, | ||
39 | - AW_R40_DEV_SDRAM | ||
40 | + AW_R40_DEV_SDRAM, | ||
41 | + AW_R40_DEV_DRAMCOM, | ||
42 | + AW_R40_DEV_DRAMCTL, | ||
43 | + AW_R40_DEV_DRAMPHY, | ||
44 | }; | ||
45 | |||
46 | #define AW_R40_NUM_CPUS (4) | ||
47 | @@ -XXX,XX +XXX,XX @@ struct AwR40State { | ||
48 | DeviceState parent_obj; | ||
49 | /*< public >*/ | ||
50 | |||
51 | + /** Physical base address for start of RAM */ | ||
52 | + hwaddr ram_addr; | ||
53 | + | ||
54 | + /** Total RAM size in megabytes */ | ||
55 | + uint32_t ram_size; | ||
56 | + | ||
57 | ARMCPU cpus[AW_R40_NUM_CPUS]; | ||
58 | const hwaddr *memmap; | ||
59 | AwA10PITState timer; | ||
60 | AwSdHostState mmc[AW_R40_NUM_MMCS]; | ||
61 | AwR40ClockCtlState ccu; | ||
62 | + AwR40DramCtlState dramc; | ||
63 | AWI2CState i2c0; | ||
64 | GICState gic; | ||
65 | MemoryRegion sram_a1; | ||
66 | diff --git a/include/hw/misc/allwinner-r40-dramc.h b/include/hw/misc/allwinner-r40-dramc.h | ||
33 | new file mode 100644 | 67 | new file mode 100644 |
34 | index XXXXXXX..XXXXXXX | 68 | index XXXXXXX..XXXXXXX |
35 | --- /dev/null | 69 | --- /dev/null |
36 | +++ b/target/arm/sme.decode | 70 | +++ b/include/hw/misc/allwinner-r40-dramc.h |
37 | @@ -XXX,XX +XXX,XX @@ | 71 | @@ -XXX,XX +XXX,XX @@ |
38 | +# AArch64 SME instruction descriptions | 72 | +/* |
39 | +# | 73 | + * Allwinner R40 SDRAM Controller emulation |
40 | +# Copyright (c) 2022 Linaro, Ltd | 74 | + * |
41 | +# | 75 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> |
42 | +# This library is free software; you can redistribute it and/or | 76 | + * |
43 | +# modify it under the terms of the GNU Lesser General Public | 77 | + * This program is free software: you can redistribute it and/or modify |
44 | +# License as published by the Free Software Foundation; either | 78 | + * it under the terms of the GNU General Public License as published by |
45 | +# version 2.1 of the License, or (at your option) any later version. | 79 | + * the Free Software Foundation, either version 2 of the License, or |
46 | +# | 80 | + * (at your option) any later version. |
47 | +# This library is distributed in the hope that it will be useful, | 81 | + * |
48 | +# but WITHOUT ANY WARRANTY; without even the implied warranty of | 82 | + * This program is distributed in the hope that it will be useful, |
49 | +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | 83 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of |
50 | +# Lesser General Public License for more details. | 84 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
51 | +# | 85 | + * GNU General Public License for more details. |
52 | +# You should have received a copy of the GNU Lesser General Public | 86 | + * |
53 | +# License along with this library; if not, see <http://www.gnu.org/licenses/>. | 87 | + * You should have received a copy of the GNU General Public License |
54 | + | 88 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. |
55 | +# | 89 | + */ |
56 | +# This file is processed by scripts/decodetree.py | 90 | + |
57 | +# | 91 | +#ifndef HW_MISC_ALLWINNER_R40_DRAMC_H |
58 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 92 | +#define HW_MISC_ALLWINNER_R40_DRAMC_H |
93 | + | ||
94 | +#include "qom/object.h" | ||
95 | +#include "hw/sysbus.h" | ||
96 | +#include "exec/hwaddr.h" | ||
97 | + | ||
98 | +/** | ||
99 | + * Constants | ||
100 | + * @{ | ||
101 | + */ | ||
102 | + | ||
103 | +/** Highest register address used by DRAMCOM module */ | ||
104 | +#define AW_R40_DRAMCOM_REGS_MAXADDR (0x804) | ||
105 | + | ||
106 | +/** Total number of known DRAMCOM registers */ | ||
107 | +#define AW_R40_DRAMCOM_REGS_NUM (AW_R40_DRAMCOM_REGS_MAXADDR / \ | ||
108 | + sizeof(uint32_t)) | ||
109 | + | ||
110 | +/** Highest register address used by DRAMCTL module */ | ||
111 | +#define AW_R40_DRAMCTL_REGS_MAXADDR (0x88c) | ||
112 | + | ||
113 | +/** Total number of known DRAMCTL registers */ | ||
114 | +#define AW_R40_DRAMCTL_REGS_NUM (AW_R40_DRAMCTL_REGS_MAXADDR / \ | ||
115 | + sizeof(uint32_t)) | ||
116 | + | ||
117 | +/** Highest register address used by DRAMPHY module */ | ||
118 | +#define AW_R40_DRAMPHY_REGS_MAXADDR (0x4) | ||
119 | + | ||
120 | +/** Total number of known DRAMPHY registers */ | ||
121 | +#define AW_R40_DRAMPHY_REGS_NUM (AW_R40_DRAMPHY_REGS_MAXADDR / \ | ||
122 | + sizeof(uint32_t)) | ||
123 | + | ||
124 | +/** @} */ | ||
125 | + | ||
126 | +/** | ||
127 | + * Object model | ||
128 | + * @{ | ||
129 | + */ | ||
130 | + | ||
131 | +#define TYPE_AW_R40_DRAMC "allwinner-r40-dramc" | ||
132 | +OBJECT_DECLARE_SIMPLE_TYPE(AwR40DramCtlState, AW_R40_DRAMC) | ||
133 | + | ||
134 | +/** @} */ | ||
135 | + | ||
136 | +/** | ||
137 | + * Allwinner R40 SDRAM Controller object instance state. | ||
138 | + */ | ||
139 | +struct AwR40DramCtlState { | ||
140 | + /*< private >*/ | ||
141 | + SysBusDevice parent_obj; | ||
142 | + /*< public >*/ | ||
143 | + | ||
144 | + /** Physical base address for start of RAM */ | ||
145 | + hwaddr ram_addr; | ||
146 | + | ||
147 | + /** Total RAM size in megabytes */ | ||
148 | + uint32_t ram_size; | ||
149 | + | ||
150 | + uint8_t set_row_bits; | ||
151 | + uint8_t set_bank_bits; | ||
152 | + uint8_t set_col_bits; | ||
153 | + | ||
154 | + /** | ||
155 | + * @name Memory Regions | ||
156 | + * @{ | ||
157 | + */ | ||
158 | + MemoryRegion dramcom_iomem; /**< DRAMCOM module I/O registers */ | ||
159 | + MemoryRegion dramctl_iomem; /**< DRAMCTL module I/O registers */ | ||
160 | + MemoryRegion dramphy_iomem; /**< DRAMPHY module I/O registers */ | ||
161 | + MemoryRegion dram_high; /**< The high 1G dram for dualrank detect */ | ||
162 | + MemoryRegion detect_cells; /**< DRAM memory cells for auto detect */ | ||
163 | + | ||
164 | + /** @} */ | ||
165 | + | ||
166 | + /** | ||
167 | + * @name Hardware Registers | ||
168 | + * @{ | ||
169 | + */ | ||
170 | + | ||
171 | + uint32_t dramcom[AW_R40_DRAMCOM_REGS_NUM]; /**< DRAMCOM registers */ | ||
172 | + uint32_t dramctl[AW_R40_DRAMCTL_REGS_NUM]; /**< DRAMCTL registers */ | ||
173 | + uint32_t dramphy[AW_R40_DRAMPHY_REGS_NUM] ;/**< DRAMPHY registers */ | ||
174 | + | ||
175 | + /** @} */ | ||
176 | + | ||
177 | +}; | ||
178 | + | ||
179 | +#endif /* HW_MISC_ALLWINNER_R40_DRAMC_H */ | ||
180 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
59 | index XXXXXXX..XXXXXXX 100644 | 181 | index XXXXXXX..XXXXXXX 100644 |
60 | --- a/target/arm/translate-a64.c | 182 | --- a/hw/arm/allwinner-r40.c |
61 | +++ b/target/arm/translate-a64.c | 183 | +++ b/hw/arm/allwinner-r40.c |
62 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_translate_insn(DisasContextBase *dcbase, CPUState *cpu) | 184 | @@ -XXX,XX +XXX,XX @@ |
185 | #include "hw/loader.h" | ||
186 | #include "sysemu/sysemu.h" | ||
187 | #include "hw/arm/allwinner-r40.h" | ||
188 | +#include "hw/misc/allwinner-r40-dramc.h" | ||
189 | |||
190 | /* Memory map */ | ||
191 | const hwaddr allwinner_r40_memmap[] = { | ||
192 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
193 | [AW_R40_DEV_UART6] = 0x01c29800, | ||
194 | [AW_R40_DEV_UART7] = 0x01c29c00, | ||
195 | [AW_R40_DEV_TWI0] = 0x01c2ac00, | ||
196 | + [AW_R40_DEV_DRAMCOM] = 0x01c62000, | ||
197 | + [AW_R40_DEV_DRAMCTL] = 0x01c63000, | ||
198 | + [AW_R40_DEV_DRAMPHY] = 0x01c65000, | ||
199 | [AW_R40_DEV_GIC_DIST] = 0x01c81000, | ||
200 | [AW_R40_DEV_GIC_CPU] = 0x01c82000, | ||
201 | [AW_R40_DEV_GIC_HYP] = 0x01c84000, | ||
202 | @@ -XXX,XX +XXX,XX @@ static struct AwR40Unimplemented r40_unimplemented[] = { | ||
203 | { "gpu", 0x01c40000, 64 * KiB }, | ||
204 | { "gmac", 0x01c50000, 64 * KiB }, | ||
205 | { "hstmr", 0x01c60000, 4 * KiB }, | ||
206 | - { "dram-com", 0x01c62000, 4 * KiB }, | ||
207 | - { "dram-ctl", 0x01c63000, 4 * KiB }, | ||
208 | { "tcon-top", 0x01c70000, 4 * KiB }, | ||
209 | { "lcd0", 0x01c71000, 4 * KiB }, | ||
210 | { "lcd1", 0x01c72000, 4 * KiB }, | ||
211 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) | ||
63 | } | 212 | } |
64 | 213 | ||
65 | switch (extract32(insn, 25, 4)) { | 214 | object_initialize_child(obj, "twi0", &s->i2c0, TYPE_AW_I2C_SUN6I); |
66 | - case 0x0: case 0x1: case 0x3: /* UNALLOCATED */ | 215 | + |
67 | + case 0x0: | 216 | + object_initialize_child(obj, "dramc", &s->dramc, TYPE_AW_R40_DRAMC); |
68 | + if (!extract32(insn, 31, 1) || !disas_sme(s, insn)) { | 217 | + object_property_add_alias(obj, "ram-addr", OBJECT(&s->dramc), |
69 | + unallocated_encoding(s); | 218 | + "ram-addr"); |
70 | + } | 219 | + object_property_add_alias(obj, "ram-size", OBJECT(&s->dramc), |
71 | + break; | 220 | + "ram-size"); |
72 | + case 0x1: case 0x3: /* UNALLOCATED */ | 221 | } |
73 | unallocated_encoding(s); | 222 | |
74 | break; | 223 | static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
75 | case 0x2: | 224 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
76 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 225 | sysbus_connect_irq(SYS_BUS_DEVICE(&s->i2c0), 0, |
226 | qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_TWI0)); | ||
227 | |||
228 | + /* DRAMC */ | ||
229 | + sysbus_realize(SYS_BUS_DEVICE(&s->dramc), &error_fatal); | ||
230 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 0, | ||
231 | + s->memmap[AW_R40_DEV_DRAMCOM]); | ||
232 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 1, | ||
233 | + s->memmap[AW_R40_DEV_DRAMCTL]); | ||
234 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 2, | ||
235 | + s->memmap[AW_R40_DEV_DRAMPHY]); | ||
236 | + | ||
237 | /* Unimplemented devices */ | ||
238 | for (i = 0; i < ARRAY_SIZE(r40_unimplemented); i++) { | ||
239 | create_unimplemented_device(r40_unimplemented[i].device_name, | ||
240 | diff --git a/hw/arm/bananapi_m2u.c b/hw/arm/bananapi_m2u.c | ||
241 | index XXXXXXX..XXXXXXX 100644 | ||
242 | --- a/hw/arm/bananapi_m2u.c | ||
243 | +++ b/hw/arm/bananapi_m2u.c | ||
244 | @@ -XXX,XX +XXX,XX @@ static void bpim2u_init(MachineState *machine) | ||
245 | object_property_set_int(OBJECT(r40), "clk1-freq", 24 * 1000 * 1000, | ||
246 | &error_abort); | ||
247 | |||
248 | + /* DRAMC */ | ||
249 | + r40->ram_size = machine->ram_size / MiB; | ||
250 | + object_property_set_uint(OBJECT(r40), "ram-addr", | ||
251 | + r40->memmap[AW_R40_DEV_SDRAM], &error_abort); | ||
252 | + object_property_set_int(OBJECT(r40), "ram-size", | ||
253 | + r40->ram_size, &error_abort); | ||
254 | + | ||
255 | /* Mark R40 object realized */ | ||
256 | qdev_realize(DEVICE(r40), NULL, &error_abort); | ||
257 | |||
258 | diff --git a/hw/misc/allwinner-r40-dramc.c b/hw/misc/allwinner-r40-dramc.c | ||
77 | new file mode 100644 | 259 | new file mode 100644 |
78 | index XXXXXXX..XXXXXXX | 260 | index XXXXXXX..XXXXXXX |
79 | --- /dev/null | 261 | --- /dev/null |
80 | +++ b/target/arm/translate-sme.c | 262 | +++ b/hw/misc/allwinner-r40-dramc.c |
81 | @@ -XXX,XX +XXX,XX @@ | 263 | @@ -XXX,XX +XXX,XX @@ |
82 | +/* | 264 | +/* |
83 | + * AArch64 SME translation | 265 | + * Allwinner R40 SDRAM Controller emulation |
84 | + * | 266 | + * |
85 | + * Copyright (c) 2022 Linaro, Ltd | 267 | + * CCopyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> |
86 | + * | 268 | + * |
87 | + * This library is free software; you can redistribute it and/or | 269 | + * This program is free software: you can redistribute it and/or modify |
88 | + * modify it under the terms of the GNU Lesser General Public | 270 | + * it under the terms of the GNU General Public License as published by |
89 | + * License as published by the Free Software Foundation; either | 271 | + * the Free Software Foundation, either version 2 of the License, or |
90 | + * version 2.1 of the License, or (at your option) any later version. | 272 | + * (at your option) any later version. |
91 | + * | 273 | + * |
92 | + * This library is distributed in the hope that it will be useful, | 274 | + * This program is distributed in the hope that it will be useful, |
93 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | 275 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of |
94 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | 276 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
95 | + * Lesser General Public License for more details. | 277 | + * GNU General Public License for more details. |
96 | + * | 278 | + * |
97 | + * You should have received a copy of the GNU Lesser General Public | 279 | + * You should have received a copy of the GNU General Public License |
98 | + * License along with this library; if not, see <http://www.gnu.org/licenses/>. | 280 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. |
99 | + */ | 281 | + */ |
100 | + | 282 | + |
101 | +#include "qemu/osdep.h" | 283 | +#include "qemu/osdep.h" |
102 | +#include "cpu.h" | 284 | +#include "qemu/units.h" |
103 | +#include "tcg/tcg-op.h" | 285 | +#include "qemu/error-report.h" |
104 | +#include "tcg/tcg-op-gvec.h" | 286 | +#include "hw/sysbus.h" |
105 | +#include "tcg/tcg-gvec-desc.h" | 287 | +#include "migration/vmstate.h" |
106 | +#include "translate.h" | 288 | +#include "qemu/log.h" |
107 | +#include "exec/helper-gen.h" | 289 | +#include "qemu/module.h" |
108 | +#include "translate-a64.h" | 290 | +#include "exec/address-spaces.h" |
109 | +#include "fpu/softfloat.h" | 291 | +#include "hw/qdev-properties.h" |
110 | + | 292 | +#include "qapi/error.h" |
293 | +#include "qemu/bitops.h" | ||
294 | +#include "hw/misc/allwinner-r40-dramc.h" | ||
295 | +#include "trace.h" | ||
296 | + | ||
297 | +#define REG_INDEX(offset) (offset / sizeof(uint32_t)) | ||
298 | + | ||
299 | +/* DRAMCOM register offsets */ | ||
300 | +enum { | ||
301 | + REG_DRAMCOM_CR = 0x0000, /* Control Register */ | ||
302 | +}; | ||
303 | + | ||
304 | +/* DRAMCOMM register flags */ | ||
305 | +enum { | ||
306 | + REG_DRAMCOM_CR_DUAL_RANK = (1 << 0), | ||
307 | +}; | ||
308 | + | ||
309 | +/* DRAMCTL register offsets */ | ||
310 | +enum { | ||
311 | + REG_DRAMCTL_PIR = 0x0000, /* PHY Initialization Register */ | ||
312 | + REG_DRAMCTL_PGSR = 0x0010, /* PHY General Status Register */ | ||
313 | + REG_DRAMCTL_STATR = 0x0018, /* Status Register */ | ||
314 | + REG_DRAMCTL_PGCR = 0x0100, /* PHY general configuration registers */ | ||
315 | +}; | ||
316 | + | ||
317 | +/* DRAMCTL register flags */ | ||
318 | +enum { | ||
319 | + REG_DRAMCTL_PGSR_INITDONE = (1 << 0), | ||
320 | + REG_DRAMCTL_PGSR_READ_TIMEOUT = (1 << 13), | ||
321 | + REG_DRAMCTL_PGCR_ENABLE_READ_TIMEOUT = (1 << 25), | ||
322 | +}; | ||
323 | + | ||
324 | +enum { | ||
325 | + REG_DRAMCTL_STATR_ACTIVE = (1 << 0), | ||
326 | +}; | ||
327 | + | ||
328 | +#define DRAM_MAX_ROW_BITS 16 | ||
329 | +#define DRAM_MAX_COL_BITS 13 /* 8192 */ | ||
330 | +#define DRAM_MAX_BANK 3 | ||
331 | + | ||
332 | +static uint64_t dram_autodetect_cells[DRAM_MAX_ROW_BITS] | ||
333 | + [DRAM_MAX_BANK] | ||
334 | + [DRAM_MAX_COL_BITS]; | ||
335 | +struct VirtualDDRChip { | ||
336 | + uint32_t ram_size; | ||
337 | + uint8_t bank_bits; | ||
338 | + uint8_t row_bits; | ||
339 | + uint8_t col_bits; | ||
340 | +}; | ||
111 | + | 341 | + |
112 | +/* | 342 | +/* |
113 | + * Include the generated decoder. | 343 | + * Only power of 2 RAM sizes from 256MiB up to 2048MiB are supported, |
344 | + * 2GiB memory is not supported due to dual rank feature. | ||
114 | + */ | 345 | + */ |
115 | + | 346 | +static const struct VirtualDDRChip dummy_ddr_chips[] = { |
116 | +#include "decode-sme.c.inc" | 347 | + { |
117 | diff --git a/target/arm/meson.build b/target/arm/meson.build | 348 | + .ram_size = 256, |
349 | + .bank_bits = 3, | ||
350 | + .row_bits = 12, | ||
351 | + .col_bits = 13, | ||
352 | + }, { | ||
353 | + .ram_size = 512, | ||
354 | + .bank_bits = 3, | ||
355 | + .row_bits = 13, | ||
356 | + .col_bits = 13, | ||
357 | + }, { | ||
358 | + .ram_size = 1024, | ||
359 | + .bank_bits = 3, | ||
360 | + .row_bits = 14, | ||
361 | + .col_bits = 13, | ||
362 | + }, { | ||
363 | + 0 | ||
364 | + } | ||
365 | +}; | ||
366 | + | ||
367 | +static const struct VirtualDDRChip *get_match_ddr(uint32_t ram_size) | ||
368 | +{ | ||
369 | + const struct VirtualDDRChip *ddr; | ||
370 | + | ||
371 | + for (ddr = &dummy_ddr_chips[0]; ddr->ram_size; ddr++) { | ||
372 | + if (ddr->ram_size == ram_size) { | ||
373 | + return ddr; | ||
374 | + } | ||
375 | + } | ||
376 | + | ||
377 | + return NULL; | ||
378 | +} | ||
379 | + | ||
380 | +static uint64_t *address_to_autodetect_cells(AwR40DramCtlState *s, | ||
381 | + const struct VirtualDDRChip *ddr, | ||
382 | + uint32_t offset) | ||
383 | +{ | ||
384 | + int row_index = 0, bank_index = 0, col_index = 0; | ||
385 | + uint32_t row_addr, bank_addr, col_addr; | ||
386 | + | ||
387 | + row_addr = extract32(offset, s->set_col_bits + s->set_bank_bits, | ||
388 | + s->set_row_bits); | ||
389 | + bank_addr = extract32(offset, s->set_col_bits, s->set_bank_bits); | ||
390 | + col_addr = extract32(offset, 0, s->set_col_bits); | ||
391 | + | ||
392 | + for (int i = 0; i < ddr->row_bits; i++) { | ||
393 | + if (row_addr & BIT(i)) { | ||
394 | + row_index = i; | ||
395 | + } | ||
396 | + } | ||
397 | + | ||
398 | + for (int i = 0; i < ddr->bank_bits; i++) { | ||
399 | + if (bank_addr & BIT(i)) { | ||
400 | + bank_index = i; | ||
401 | + } | ||
402 | + } | ||
403 | + | ||
404 | + for (int i = 0; i < ddr->col_bits; i++) { | ||
405 | + if (col_addr & BIT(i)) { | ||
406 | + col_index = i; | ||
407 | + } | ||
408 | + } | ||
409 | + | ||
410 | + trace_allwinner_r40_dramc_offset_to_cell(offset, row_index, bank_index, | ||
411 | + col_index); | ||
412 | + return &dram_autodetect_cells[row_index][bank_index][col_index]; | ||
413 | +} | ||
414 | + | ||
415 | +static void allwinner_r40_dramc_map_rows(AwR40DramCtlState *s, uint8_t row_bits, | ||
416 | + uint8_t bank_bits, uint8_t col_bits) | ||
417 | +{ | ||
418 | + const struct VirtualDDRChip *ddr = get_match_ddr(s->ram_size); | ||
419 | + bool enable_detect_cells; | ||
420 | + | ||
421 | + trace_allwinner_r40_dramc_map_rows(row_bits, bank_bits, col_bits); | ||
422 | + | ||
423 | + if (!ddr) { | ||
424 | + return; | ||
425 | + } | ||
426 | + | ||
427 | + s->set_row_bits = row_bits; | ||
428 | + s->set_bank_bits = bank_bits; | ||
429 | + s->set_col_bits = col_bits; | ||
430 | + | ||
431 | + enable_detect_cells = ddr->bank_bits != bank_bits | ||
432 | + || ddr->row_bits != row_bits | ||
433 | + || ddr->col_bits != col_bits; | ||
434 | + | ||
435 | + if (enable_detect_cells) { | ||
436 | + trace_allwinner_r40_dramc_detect_cells_enable(); | ||
437 | + } else { | ||
438 | + trace_allwinner_r40_dramc_detect_cells_disable(); | ||
439 | + } | ||
440 | + | ||
441 | + memory_region_set_enabled(&s->detect_cells, enable_detect_cells); | ||
442 | +} | ||
443 | + | ||
444 | +static uint64_t allwinner_r40_dramcom_read(void *opaque, hwaddr offset, | ||
445 | + unsigned size) | ||
446 | +{ | ||
447 | + const AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
448 | + const uint32_t idx = REG_INDEX(offset); | ||
449 | + | ||
450 | + if (idx >= AW_R40_DRAMCOM_REGS_NUM) { | ||
451 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
452 | + __func__, (uint32_t)offset); | ||
453 | + return 0; | ||
454 | + } | ||
455 | + | ||
456 | + trace_allwinner_r40_dramcom_read(offset, s->dramcom[idx], size); | ||
457 | + return s->dramcom[idx]; | ||
458 | +} | ||
459 | + | ||
460 | +static void allwinner_r40_dramcom_write(void *opaque, hwaddr offset, | ||
461 | + uint64_t val, unsigned size) | ||
462 | +{ | ||
463 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
464 | + const uint32_t idx = REG_INDEX(offset); | ||
465 | + | ||
466 | + trace_allwinner_r40_dramcom_write(offset, val, size); | ||
467 | + | ||
468 | + if (idx >= AW_R40_DRAMCOM_REGS_NUM) { | ||
469 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
470 | + __func__, (uint32_t)offset); | ||
471 | + return; | ||
472 | + } | ||
473 | + | ||
474 | + switch (offset) { | ||
475 | + case REG_DRAMCOM_CR: /* Control Register */ | ||
476 | + if (!(val & REG_DRAMCOM_CR_DUAL_RANK)) { | ||
477 | + allwinner_r40_dramc_map_rows(s, ((val >> 4) & 0xf) + 1, | ||
478 | + ((val >> 2) & 0x1) + 2, | ||
479 | + (((val >> 8) & 0xf) + 3)); | ||
480 | + } | ||
481 | + break; | ||
482 | + }; | ||
483 | + | ||
484 | + s->dramcom[idx] = (uint32_t) val; | ||
485 | +} | ||
486 | + | ||
487 | +static uint64_t allwinner_r40_dramctl_read(void *opaque, hwaddr offset, | ||
488 | + unsigned size) | ||
489 | +{ | ||
490 | + const AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
491 | + const uint32_t idx = REG_INDEX(offset); | ||
492 | + | ||
493 | + if (idx >= AW_R40_DRAMCTL_REGS_NUM) { | ||
494 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
495 | + __func__, (uint32_t)offset); | ||
496 | + return 0; | ||
497 | + } | ||
498 | + | ||
499 | + trace_allwinner_r40_dramctl_read(offset, s->dramctl[idx], size); | ||
500 | + return s->dramctl[idx]; | ||
501 | +} | ||
502 | + | ||
503 | +static void allwinner_r40_dramctl_write(void *opaque, hwaddr offset, | ||
504 | + uint64_t val, unsigned size) | ||
505 | +{ | ||
506 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
507 | + const uint32_t idx = REG_INDEX(offset); | ||
508 | + | ||
509 | + trace_allwinner_r40_dramctl_write(offset, val, size); | ||
510 | + | ||
511 | + if (idx >= AW_R40_DRAMCTL_REGS_NUM) { | ||
512 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
513 | + __func__, (uint32_t)offset); | ||
514 | + return; | ||
515 | + } | ||
516 | + | ||
517 | + switch (offset) { | ||
518 | + case REG_DRAMCTL_PIR: /* PHY Initialization Register */ | ||
519 | + s->dramctl[REG_INDEX(REG_DRAMCTL_PGSR)] |= REG_DRAMCTL_PGSR_INITDONE; | ||
520 | + s->dramctl[REG_INDEX(REG_DRAMCTL_STATR)] |= REG_DRAMCTL_STATR_ACTIVE; | ||
521 | + break; | ||
522 | + } | ||
523 | + | ||
524 | + s->dramctl[idx] = (uint32_t) val; | ||
525 | +} | ||
526 | + | ||
527 | +static uint64_t allwinner_r40_dramphy_read(void *opaque, hwaddr offset, | ||
528 | + unsigned size) | ||
529 | +{ | ||
530 | + const AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
531 | + const uint32_t idx = REG_INDEX(offset); | ||
532 | + | ||
533 | + if (idx >= AW_R40_DRAMPHY_REGS_NUM) { | ||
534 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
535 | + __func__, (uint32_t)offset); | ||
536 | + return 0; | ||
537 | + } | ||
538 | + | ||
539 | + trace_allwinner_r40_dramphy_read(offset, s->dramphy[idx], size); | ||
540 | + return s->dramphy[idx]; | ||
541 | +} | ||
542 | + | ||
543 | +static void allwinner_r40_dramphy_write(void *opaque, hwaddr offset, | ||
544 | + uint64_t val, unsigned size) | ||
545 | +{ | ||
546 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
547 | + const uint32_t idx = REG_INDEX(offset); | ||
548 | + | ||
549 | + trace_allwinner_r40_dramphy_write(offset, val, size); | ||
550 | + | ||
551 | + if (idx >= AW_R40_DRAMPHY_REGS_NUM) { | ||
552 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
553 | + __func__, (uint32_t)offset); | ||
554 | + return; | ||
555 | + } | ||
556 | + | ||
557 | + s->dramphy[idx] = (uint32_t) val; | ||
558 | +} | ||
559 | + | ||
560 | +static const MemoryRegionOps allwinner_r40_dramcom_ops = { | ||
561 | + .read = allwinner_r40_dramcom_read, | ||
562 | + .write = allwinner_r40_dramcom_write, | ||
563 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
564 | + .valid = { | ||
565 | + .min_access_size = 4, | ||
566 | + .max_access_size = 4, | ||
567 | + }, | ||
568 | + .impl.min_access_size = 4, | ||
569 | +}; | ||
570 | + | ||
571 | +static const MemoryRegionOps allwinner_r40_dramctl_ops = { | ||
572 | + .read = allwinner_r40_dramctl_read, | ||
573 | + .write = allwinner_r40_dramctl_write, | ||
574 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
575 | + .valid = { | ||
576 | + .min_access_size = 4, | ||
577 | + .max_access_size = 4, | ||
578 | + }, | ||
579 | + .impl.min_access_size = 4, | ||
580 | +}; | ||
581 | + | ||
582 | +static const MemoryRegionOps allwinner_r40_dramphy_ops = { | ||
583 | + .read = allwinner_r40_dramphy_read, | ||
584 | + .write = allwinner_r40_dramphy_write, | ||
585 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
586 | + .valid = { | ||
587 | + .min_access_size = 4, | ||
588 | + .max_access_size = 4, | ||
589 | + }, | ||
590 | + .impl.min_access_size = 4, | ||
591 | +}; | ||
592 | + | ||
593 | +static uint64_t allwinner_r40_detect_read(void *opaque, hwaddr offset, | ||
594 | + unsigned size) | ||
595 | +{ | ||
596 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
597 | + const struct VirtualDDRChip *ddr = get_match_ddr(s->ram_size); | ||
598 | + uint64_t data = 0; | ||
599 | + | ||
600 | + if (ddr) { | ||
601 | + data = *address_to_autodetect_cells(s, ddr, (uint32_t)offset); | ||
602 | + } | ||
603 | + | ||
604 | + trace_allwinner_r40_dramc_detect_cell_read(offset, data); | ||
605 | + return data; | ||
606 | +} | ||
607 | + | ||
608 | +static void allwinner_r40_detect_write(void *opaque, hwaddr offset, | ||
609 | + uint64_t data, unsigned size) | ||
610 | +{ | ||
611 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
612 | + const struct VirtualDDRChip *ddr = get_match_ddr(s->ram_size); | ||
613 | + | ||
614 | + if (ddr) { | ||
615 | + uint64_t *cell = address_to_autodetect_cells(s, ddr, (uint32_t)offset); | ||
616 | + trace_allwinner_r40_dramc_detect_cell_write(offset, data); | ||
617 | + *cell = data; | ||
618 | + } | ||
619 | +} | ||
620 | + | ||
621 | +static const MemoryRegionOps allwinner_r40_detect_ops = { | ||
622 | + .read = allwinner_r40_detect_read, | ||
623 | + .write = allwinner_r40_detect_write, | ||
624 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
625 | + .valid = { | ||
626 | + .min_access_size = 4, | ||
627 | + .max_access_size = 4, | ||
628 | + }, | ||
629 | + .impl.min_access_size = 4, | ||
630 | +}; | ||
631 | + | ||
632 | +/* | ||
633 | + * mctl_r40_detect_rank_count in u-boot will write the high 1G of DDR | ||
634 | + * to detect wether the board support dual_rank or not. Create a virtual memory | ||
635 | + * if the board's ram_size less or equal than 1G, and set read time out flag of | ||
636 | + * REG_DRAMCTL_PGSR when the user touch this high dram. | ||
637 | + */ | ||
638 | +static uint64_t allwinner_r40_dualrank_detect_read(void *opaque, hwaddr offset, | ||
639 | + unsigned size) | ||
640 | +{ | ||
641 | + AwR40DramCtlState *s = AW_R40_DRAMC(opaque); | ||
642 | + uint32_t reg; | ||
643 | + | ||
644 | + reg = s->dramctl[REG_INDEX(REG_DRAMCTL_PGCR)]; | ||
645 | + if (reg & REG_DRAMCTL_PGCR_ENABLE_READ_TIMEOUT) { /* Enable read time out */ | ||
646 | + /* | ||
647 | + * this driver only support one rank, mark READ_TIMEOUT when try | ||
648 | + * read the second rank. | ||
649 | + */ | ||
650 | + s->dramctl[REG_INDEX(REG_DRAMCTL_PGSR)] | ||
651 | + |= REG_DRAMCTL_PGSR_READ_TIMEOUT; | ||
652 | + } | ||
653 | + | ||
654 | + return 0; | ||
655 | +} | ||
656 | + | ||
657 | +static const MemoryRegionOps allwinner_r40_dualrank_detect_ops = { | ||
658 | + .read = allwinner_r40_dualrank_detect_read, | ||
659 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
660 | + .valid = { | ||
661 | + .min_access_size = 4, | ||
662 | + .max_access_size = 4, | ||
663 | + }, | ||
664 | + .impl.min_access_size = 4, | ||
665 | +}; | ||
666 | + | ||
667 | +static void allwinner_r40_dramc_reset(DeviceState *dev) | ||
668 | +{ | ||
669 | + AwR40DramCtlState *s = AW_R40_DRAMC(dev); | ||
670 | + | ||
671 | + /* Set default values for registers */ | ||
672 | + memset(&s->dramcom, 0, sizeof(s->dramcom)); | ||
673 | + memset(&s->dramctl, 0, sizeof(s->dramctl)); | ||
674 | + memset(&s->dramphy, 0, sizeof(s->dramphy)); | ||
675 | +} | ||
676 | + | ||
677 | +static void allwinner_r40_dramc_realize(DeviceState *dev, Error **errp) | ||
678 | +{ | ||
679 | + AwR40DramCtlState *s = AW_R40_DRAMC(dev); | ||
680 | + | ||
681 | + if (!get_match_ddr(s->ram_size)) { | ||
682 | + error_report("%s: ram-size %u MiB is not supported", | ||
683 | + __func__, s->ram_size); | ||
684 | + exit(1); | ||
685 | + } | ||
686 | + | ||
687 | + /* detect_cells */ | ||
688 | + sysbus_mmio_map_overlap(SYS_BUS_DEVICE(s), 3, s->ram_addr, 10); | ||
689 | + memory_region_set_enabled(&s->detect_cells, false); | ||
690 | + | ||
691 | + /* | ||
692 | + * We only support DRAM size up to 1G now, so prepare a high memory page | ||
693 | + * after 1G for dualrank detect. index = 4 | ||
694 | + */ | ||
695 | + memory_region_init_io(&s->dram_high, OBJECT(s), | ||
696 | + &allwinner_r40_dualrank_detect_ops, s, | ||
697 | + "DRAMHIGH", KiB); | ||
698 | + sysbus_init_mmio(SYS_BUS_DEVICE(s), &s->dram_high); | ||
699 | + sysbus_mmio_map(SYS_BUS_DEVICE(s), 4, s->ram_addr + GiB); | ||
700 | +} | ||
701 | + | ||
702 | +static void allwinner_r40_dramc_init(Object *obj) | ||
703 | +{ | ||
704 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
705 | + AwR40DramCtlState *s = AW_R40_DRAMC(obj); | ||
706 | + | ||
707 | + /* DRAMCOM registers, index 0 */ | ||
708 | + memory_region_init_io(&s->dramcom_iomem, OBJECT(s), | ||
709 | + &allwinner_r40_dramcom_ops, s, | ||
710 | + "DRAMCOM", 4 * KiB); | ||
711 | + sysbus_init_mmio(sbd, &s->dramcom_iomem); | ||
712 | + | ||
713 | + /* DRAMCTL registers, index 1 */ | ||
714 | + memory_region_init_io(&s->dramctl_iomem, OBJECT(s), | ||
715 | + &allwinner_r40_dramctl_ops, s, | ||
716 | + "DRAMCTL", 4 * KiB); | ||
717 | + sysbus_init_mmio(sbd, &s->dramctl_iomem); | ||
718 | + | ||
719 | + /* DRAMPHY registers. index 2 */ | ||
720 | + memory_region_init_io(&s->dramphy_iomem, OBJECT(s), | ||
721 | + &allwinner_r40_dramphy_ops, s, | ||
722 | + "DRAMPHY", 4 * KiB); | ||
723 | + sysbus_init_mmio(sbd, &s->dramphy_iomem); | ||
724 | + | ||
725 | + /* R40 support max 2G memory but we only support up to 1G now. index 3 */ | ||
726 | + memory_region_init_io(&s->detect_cells, OBJECT(s), | ||
727 | + &allwinner_r40_detect_ops, s, | ||
728 | + "DRAMCELLS", 1 * GiB); | ||
729 | + sysbus_init_mmio(sbd, &s->detect_cells); | ||
730 | +} | ||
731 | + | ||
732 | +static Property allwinner_r40_dramc_properties[] = { | ||
733 | + DEFINE_PROP_UINT64("ram-addr", AwR40DramCtlState, ram_addr, 0x0), | ||
734 | + DEFINE_PROP_UINT32("ram-size", AwR40DramCtlState, ram_size, 256), /* MiB */ | ||
735 | + DEFINE_PROP_END_OF_LIST() | ||
736 | +}; | ||
737 | + | ||
738 | +static const VMStateDescription allwinner_r40_dramc_vmstate = { | ||
739 | + .name = "allwinner-r40-dramc", | ||
740 | + .version_id = 1, | ||
741 | + .minimum_version_id = 1, | ||
742 | + .fields = (VMStateField[]) { | ||
743 | + VMSTATE_UINT32_ARRAY(dramcom, AwR40DramCtlState, | ||
744 | + AW_R40_DRAMCOM_REGS_NUM), | ||
745 | + VMSTATE_UINT32_ARRAY(dramctl, AwR40DramCtlState, | ||
746 | + AW_R40_DRAMCTL_REGS_NUM), | ||
747 | + VMSTATE_UINT32_ARRAY(dramphy, AwR40DramCtlState, | ||
748 | + AW_R40_DRAMPHY_REGS_NUM), | ||
749 | + VMSTATE_END_OF_LIST() | ||
750 | + } | ||
751 | +}; | ||
752 | + | ||
753 | +static void allwinner_r40_dramc_class_init(ObjectClass *klass, void *data) | ||
754 | +{ | ||
755 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
756 | + | ||
757 | + dc->reset = allwinner_r40_dramc_reset; | ||
758 | + dc->vmsd = &allwinner_r40_dramc_vmstate; | ||
759 | + dc->realize = allwinner_r40_dramc_realize; | ||
760 | + device_class_set_props(dc, allwinner_r40_dramc_properties); | ||
761 | +} | ||
762 | + | ||
763 | +static const TypeInfo allwinner_r40_dramc_info = { | ||
764 | + .name = TYPE_AW_R40_DRAMC, | ||
765 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
766 | + .instance_init = allwinner_r40_dramc_init, | ||
767 | + .instance_size = sizeof(AwR40DramCtlState), | ||
768 | + .class_init = allwinner_r40_dramc_class_init, | ||
769 | +}; | ||
770 | + | ||
771 | +static void allwinner_r40_dramc_register(void) | ||
772 | +{ | ||
773 | + type_register_static(&allwinner_r40_dramc_info); | ||
774 | +} | ||
775 | + | ||
776 | +type_init(allwinner_r40_dramc_register) | ||
777 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build | ||
118 | index XXXXXXX..XXXXXXX 100644 | 778 | index XXXXXXX..XXXXXXX 100644 |
119 | --- a/target/arm/meson.build | 779 | --- a/hw/misc/meson.build |
120 | +++ b/target/arm/meson.build | 780 | +++ b/hw/misc/meson.build |
121 | @@ -XXX,XX +XXX,XX @@ | 781 | @@ -XXX,XX +XXX,XX @@ softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-dramc.c |
122 | gen = [ | 782 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-sysctrl.c')) |
123 | decodetree.process('sve.decode', extra_args: '--decode=disas_sve'), | 783 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-sid.c')) |
124 | + decodetree.process('sme.decode', extra_args: '--decode=disas_sme'), | 784 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_R40', if_true: files('allwinner-r40-ccu.c')) |
125 | decodetree.process('neon-shared.decode', extra_args: '--decode=disas_neon_shared'), | 785 | +softmmu_ss.add(when: 'CONFIG_ALLWINNER_R40', if_true: files('allwinner-r40-dramc.c')) |
126 | decodetree.process('neon-dp.decode', extra_args: '--decode=disas_neon_dp'), | 786 | softmmu_ss.add(when: 'CONFIG_AXP2XX_PMU', if_true: files('axp2xx.c')) |
127 | decodetree.process('neon-ls.decode', extra_args: '--decode=disas_neon_ls'), | 787 | softmmu_ss.add(when: 'CONFIG_REALVIEW', if_true: files('arm_sysctl.c')) |
128 | @@ -XXX,XX +XXX,XX @@ arm_ss.add(when: 'TARGET_AARCH64', if_true: files( | 788 | softmmu_ss.add(when: 'CONFIG_NSERIES', if_true: files('cbus.c')) |
129 | 'sme_helper.c', | 789 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events |
130 | 'translate-a64.c', | 790 | index XXXXXXX..XXXXXXX 100644 |
131 | 'translate-sve.c', | 791 | --- a/hw/misc/trace-events |
132 | + 'translate-sme.c', | 792 | +++ b/hw/misc/trace-events |
133 | )) | 793 | @@ -XXX,XX +XXX,XX @@ allwinner_h3_dramctl_write(uint64_t offset, uint64_t data, unsigned size) "Write |
134 | 794 | allwinner_h3_dramphy_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | |
135 | arm_softmmu_ss = ss.source_set() | 795 | allwinner_h3_dramphy_write(uint64_t offset, uint64_t data, unsigned size) "write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 |
796 | |||
797 | +# allwinner-r40-dramc.c | ||
798 | +allwinner_r40_dramc_detect_cells_disable(void) "Disable detect cells" | ||
799 | +allwinner_r40_dramc_detect_cells_enable(void) "Enable detect cells" | ||
800 | +allwinner_r40_dramc_map_rows(uint8_t row_bits, uint8_t bank_bits, uint8_t col_bits) "DRAM layout: row_bits %d, bank_bits %d, col_bits %d" | ||
801 | +allwinner_r40_dramc_offset_to_cell(uint64_t offset, int row, int bank, int col) "offset 0x%" PRIx64 " row %d bank %d col %d" | ||
802 | +allwinner_r40_dramc_detect_cell_write(uint64_t offset, uint64_t data) "offset 0x%" PRIx64 " data 0x%" PRIx64 "" | ||
803 | +allwinner_r40_dramc_detect_cell_read(uint64_t offset, uint64_t data) "offset 0x%" PRIx64 " data 0x%" PRIx64 "" | ||
804 | +allwinner_r40_dramcom_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
805 | +allwinner_r40_dramcom_write(uint64_t offset, uint64_t data, unsigned size) "Write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
806 | +allwinner_r40_dramctl_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
807 | +allwinner_r40_dramctl_write(uint64_t offset, uint64_t data, unsigned size) "Write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
808 | +allwinner_r40_dramphy_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
809 | +allwinner_r40_dramphy_write(uint64_t offset, uint64_t data, unsigned size) "write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
810 | + | ||
811 | # allwinner-sid.c | ||
812 | allwinner_sid_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
813 | allwinner_sid_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
136 | -- | 814 | -- |
137 | 2.25.1 | 815 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | This is an SVE instruction that operates using the SVE vector | 3 | A64's sd register was similar to H3, and it introduced a new register |
4 | length but that it is present only if SME is implemented. | 4 | named SAMP_DL_REG location at 0x144. The dma descriptor buffer size of |
5 | 5 | mmc2 is only 8K and the other mmc controllers has 64K. | |
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Also fix allwinner-r40's mmc controller type. |
8 | Message-id: 20220708151540.18136-31-richard.henderson@linaro.org | 8 | |
9 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | target/arm/helper.h | 18 +++++++ | 12 | include/hw/sd/allwinner-sdhost.h | 9 ++++ |
12 | target/arm/sve.decode | 5 ++ | 13 | hw/arm/allwinner-r40.c | 2 +- |
13 | target/arm/translate-sve.c | 102 +++++++++++++++++++++++++++++++++++++ | 14 | hw/sd/allwinner-sdhost.c | 72 ++++++++++++++++++++++++++++++-- |
14 | target/arm/vec_helper.c | 24 +++++++++ | 15 | 3 files changed, 79 insertions(+), 4 deletions(-) |
15 | 4 files changed, 149 insertions(+) | 16 | |
16 | 17 | diff --git a/include/hw/sd/allwinner-sdhost.h b/include/hw/sd/allwinner-sdhost.h | |
17 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
18 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/helper.h | 19 | --- a/include/hw/sd/allwinner-sdhost.h |
20 | +++ b/target/arm/helper.h | 20 | +++ b/include/hw/sd/allwinner-sdhost.h |
21 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_6(gvec_bfmlal, TCG_CALL_NO_RWG, | 21 | @@ -XXX,XX +XXX,XX @@ |
22 | DEF_HELPER_FLAGS_6(gvec_bfmlal_idx, TCG_CALL_NO_RWG, | 22 | /** Allwinner sun5i family and newer (A13, H2+, H3, etc) */ |
23 | void, ptr, ptr, ptr, ptr, ptr, i32) | 23 | #define TYPE_AW_SDHOST_SUN5I TYPE_AW_SDHOST "-sun5i" |
24 | 24 | ||
25 | +DEF_HELPER_FLAGS_5(gvec_sclamp_b, TCG_CALL_NO_RWG, | 25 | +/** Allwinner sun50i-a64 */ |
26 | + void, ptr, ptr, ptr, ptr, i32) | 26 | +#define TYPE_AW_SDHOST_SUN50I_A64 TYPE_AW_SDHOST "-sun50i-a64" |
27 | +DEF_HELPER_FLAGS_5(gvec_sclamp_h, TCG_CALL_NO_RWG, | 27 | + |
28 | + void, ptr, ptr, ptr, ptr, i32) | 28 | +/** Allwinner sun50i-a64 emmc */ |
29 | +DEF_HELPER_FLAGS_5(gvec_sclamp_s, TCG_CALL_NO_RWG, | 29 | +#define TYPE_AW_SDHOST_SUN50I_A64_EMMC TYPE_AW_SDHOST "-sun50i-a64-emmc" |
30 | + void, ptr, ptr, ptr, ptr, i32) | 30 | + |
31 | +DEF_HELPER_FLAGS_5(gvec_sclamp_d, TCG_CALL_NO_RWG, | 31 | /** @} */ |
32 | + void, ptr, ptr, ptr, ptr, i32) | 32 | |
33 | + | 33 | /** |
34 | +DEF_HELPER_FLAGS_5(gvec_uclamp_b, TCG_CALL_NO_RWG, | 34 | @@ -XXX,XX +XXX,XX @@ struct AwSdHostState { |
35 | + void, ptr, ptr, ptr, ptr, i32) | 35 | uint32_t startbit_detect; /**< eMMC DDR Start Bit Detection Control */ |
36 | +DEF_HELPER_FLAGS_5(gvec_uclamp_h, TCG_CALL_NO_RWG, | 36 | uint32_t response_crc; /**< Response CRC */ |
37 | + void, ptr, ptr, ptr, ptr, i32) | 37 | uint32_t data_crc[8]; /**< Data CRC */ |
38 | +DEF_HELPER_FLAGS_5(gvec_uclamp_s, TCG_CALL_NO_RWG, | 38 | + uint32_t sample_delay; /**< Sample delay control */ |
39 | + void, ptr, ptr, ptr, ptr, i32) | 39 | uint32_t status_crc; /**< Status CRC */ |
40 | +DEF_HELPER_FLAGS_5(gvec_uclamp_d, TCG_CALL_NO_RWG, | 40 | |
41 | + void, ptr, ptr, ptr, ptr, i32) | 41 | /** @} */ |
42 | + | 42 | @@ -XXX,XX +XXX,XX @@ struct AwSdHostClass { |
43 | #ifdef TARGET_AARCH64 | 43 | size_t max_desc_size; |
44 | #include "helper-a64.h" | 44 | bool is_sun4i; |
45 | #include "helper-sve.h" | 45 | |
46 | diff --git a/target/arm/sve.decode b/target/arm/sve.decode | 46 | + /** does the IP block support autocalibration? */ |
47 | + bool can_calibrate; | ||
48 | }; | ||
49 | |||
50 | #endif /* HW_SD_ALLWINNER_SDHOST_H */ | ||
51 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
47 | index XXXXXXX..XXXXXXX 100644 | 52 | index XXXXXXX..XXXXXXX 100644 |
48 | --- a/target/arm/sve.decode | 53 | --- a/hw/arm/allwinner-r40.c |
49 | +++ b/target/arm/sve.decode | 54 | +++ b/hw/arm/allwinner-r40.c |
50 | @@ -XXX,XX +XXX,XX @@ PSEL 00100101 .. 1 100 .. 01 .... 0 .... 0 .... \ | 55 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) |
51 | @psel esz=2 imm=%psel_imm_s | 56 | |
52 | PSEL 00100101 .1 1 000 .. 01 .... 0 .... 0 .... \ | 57 | for (int i = 0; i < AW_R40_NUM_MMCS; i++) { |
53 | @psel esz=3 imm=%psel_imm_d | 58 | object_initialize_child(obj, mmc_names[i], &s->mmc[i], |
54 | + | 59 | - TYPE_AW_SDHOST_SUN5I); |
55 | +### SVE clamp | 60 | + TYPE_AW_SDHOST_SUN50I_A64); |
56 | + | 61 | } |
57 | +SCLAMP 01000100 .. 0 ..... 110000 ..... ..... @rda_rn_rm | 62 | |
58 | +UCLAMP 01000100 .. 0 ..... 110001 ..... ..... @rda_rn_rm | 63 | object_initialize_child(obj, "twi0", &s->i2c0, TYPE_AW_I2C_SUN6I); |
59 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 64 | diff --git a/hw/sd/allwinner-sdhost.c b/hw/sd/allwinner-sdhost.c |
60 | index XXXXXXX..XXXXXXX 100644 | 65 | index XXXXXXX..XXXXXXX 100644 |
61 | --- a/target/arm/translate-sve.c | 66 | --- a/hw/sd/allwinner-sdhost.c |
62 | +++ b/target/arm/translate-sve.c | 67 | +++ b/hw/sd/allwinner-sdhost.c |
63 | @@ -XXX,XX +XXX,XX @@ static bool trans_PSEL(DisasContext *s, arg_psel *a) | 68 | @@ -XXX,XX +XXX,XX @@ enum { |
64 | tcg_temp_free_ptr(ptr); | 69 | REG_SD_DATA1_CRC = 0x12C, /* CRC Data 1 from card/eMMC */ |
65 | return true; | 70 | REG_SD_DATA0_CRC = 0x130, /* CRC Data 0 from card/eMMC */ |
66 | } | 71 | REG_SD_CRC_STA = 0x134, /* CRC status from card/eMMC during write */ |
67 | + | 72 | + REG_SD_SAMP_DL = 0x144, /* Sample Delay Control (sun50i-a64) */ |
68 | +static void gen_sclamp_i32(TCGv_i32 d, TCGv_i32 n, TCGv_i32 m, TCGv_i32 a) | 73 | REG_SD_FIFO = 0x200, /* Read/Write FIFO */ |
74 | }; | ||
75 | |||
76 | @@ -XXX,XX +XXX,XX @@ enum { | ||
77 | REG_SD_RES_CRC_RST = 0x0, | ||
78 | REG_SD_DATA_CRC_RST = 0x0, | ||
79 | REG_SD_CRC_STA_RST = 0x0, | ||
80 | + REG_SD_SAMPLE_DL_RST = 0x00002000, | ||
81 | REG_SD_FIFO_RST = 0x0, | ||
82 | }; | ||
83 | |||
84 | @@ -XXX,XX +XXX,XX @@ static uint64_t allwinner_sdhost_read(void *opaque, hwaddr offset, | ||
85 | { | ||
86 | AwSdHostState *s = AW_SDHOST(opaque); | ||
87 | AwSdHostClass *sc = AW_SDHOST_GET_CLASS(s); | ||
88 | + bool out_of_bounds = false; | ||
89 | uint32_t res = 0; | ||
90 | |||
91 | switch (offset) { | ||
92 | @@ -XXX,XX +XXX,XX @@ static uint64_t allwinner_sdhost_read(void *opaque, hwaddr offset, | ||
93 | case REG_SD_FIFO: /* Read/Write FIFO */ | ||
94 | res = allwinner_sdhost_fifo_read(s); | ||
95 | break; | ||
96 | + case REG_SD_SAMP_DL: /* Sample Delay */ | ||
97 | + if (sc->can_calibrate) { | ||
98 | + res = s->sample_delay; | ||
99 | + } else { | ||
100 | + out_of_bounds = true; | ||
101 | + } | ||
102 | + break; | ||
103 | default: | ||
104 | - qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset %" | ||
105 | - HWADDR_PRIx"\n", __func__, offset); | ||
106 | + out_of_bounds = true; | ||
107 | res = 0; | ||
108 | break; | ||
109 | } | ||
110 | |||
111 | + if (out_of_bounds) { | ||
112 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset %" | ||
113 | + HWADDR_PRIx"\n", __func__, offset); | ||
114 | + } | ||
115 | + | ||
116 | trace_allwinner_sdhost_read(offset, res, size); | ||
117 | return res; | ||
118 | } | ||
119 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_write(void *opaque, hwaddr offset, | ||
120 | { | ||
121 | AwSdHostState *s = AW_SDHOST(opaque); | ||
122 | AwSdHostClass *sc = AW_SDHOST_GET_CLASS(s); | ||
123 | + bool out_of_bounds = false; | ||
124 | |||
125 | trace_allwinner_sdhost_write(offset, value, size); | ||
126 | |||
127 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_write(void *opaque, hwaddr offset, | ||
128 | case REG_SD_DATA0_CRC: /* CRC Data 0 from card/eMMC */ | ||
129 | case REG_SD_CRC_STA: /* CRC status from card/eMMC in write operation */ | ||
130 | break; | ||
131 | + case REG_SD_SAMP_DL: /* Sample delay control */ | ||
132 | + if (sc->can_calibrate) { | ||
133 | + s->sample_delay = value; | ||
134 | + } else { | ||
135 | + out_of_bounds = true; | ||
136 | + } | ||
137 | + break; | ||
138 | default: | ||
139 | + out_of_bounds = true; | ||
140 | + break; | ||
141 | + } | ||
142 | + | ||
143 | + if (out_of_bounds) { | ||
144 | qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset %" | ||
145 | HWADDR_PRIx"\n", __func__, offset); | ||
146 | - break; | ||
147 | } | ||
148 | } | ||
149 | |||
150 | @@ -XXX,XX +XXX,XX @@ static const VMStateDescription vmstate_allwinner_sdhost = { | ||
151 | VMSTATE_UINT32(response_crc, AwSdHostState), | ||
152 | VMSTATE_UINT32_ARRAY(data_crc, AwSdHostState, 8), | ||
153 | VMSTATE_UINT32(status_crc, AwSdHostState), | ||
154 | + VMSTATE_UINT32(sample_delay, AwSdHostState), | ||
155 | VMSTATE_END_OF_LIST() | ||
156 | } | ||
157 | }; | ||
158 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_realize(DeviceState *dev, Error **errp) | ||
159 | static void allwinner_sdhost_reset(DeviceState *dev) | ||
160 | { | ||
161 | AwSdHostState *s = AW_SDHOST(dev); | ||
162 | + AwSdHostClass *sc = AW_SDHOST_GET_CLASS(s); | ||
163 | |||
164 | s->global_ctl = REG_SD_GCTL_RST; | ||
165 | s->clock_ctl = REG_SD_CKCR_RST; | ||
166 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_reset(DeviceState *dev) | ||
167 | } | ||
168 | |||
169 | s->status_crc = REG_SD_CRC_STA_RST; | ||
170 | + | ||
171 | + if (sc->can_calibrate) { | ||
172 | + s->sample_delay = REG_SD_SAMPLE_DL_RST; | ||
173 | + } | ||
174 | } | ||
175 | |||
176 | static void allwinner_sdhost_bus_class_init(ObjectClass *klass, void *data) | ||
177 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_sun4i_class_init(ObjectClass *klass, void *data) | ||
178 | AwSdHostClass *sc = AW_SDHOST_CLASS(klass); | ||
179 | sc->max_desc_size = 8 * KiB; | ||
180 | sc->is_sun4i = true; | ||
181 | + sc->can_calibrate = false; | ||
182 | } | ||
183 | |||
184 | static void allwinner_sdhost_sun5i_class_init(ObjectClass *klass, void *data) | ||
185 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_sun5i_class_init(ObjectClass *klass, void *data) | ||
186 | AwSdHostClass *sc = AW_SDHOST_CLASS(klass); | ||
187 | sc->max_desc_size = 64 * KiB; | ||
188 | sc->is_sun4i = false; | ||
189 | + sc->can_calibrate = false; | ||
190 | +} | ||
191 | + | ||
192 | +static void allwinner_sdhost_sun50i_a64_class_init(ObjectClass *klass, | ||
193 | + void *data) | ||
69 | +{ | 194 | +{ |
70 | + tcg_gen_smax_i32(d, a, n); | 195 | + AwSdHostClass *sc = AW_SDHOST_CLASS(klass); |
71 | + tcg_gen_smin_i32(d, d, m); | 196 | + sc->max_desc_size = 64 * KiB; |
197 | + sc->is_sun4i = false; | ||
198 | + sc->can_calibrate = true; | ||
72 | +} | 199 | +} |
73 | + | 200 | + |
74 | +static void gen_sclamp_i64(TCGv_i64 d, TCGv_i64 n, TCGv_i64 m, TCGv_i64 a) | 201 | +static void allwinner_sdhost_sun50i_a64_emmc_class_init(ObjectClass *klass, |
202 | + void *data) | ||
75 | +{ | 203 | +{ |
76 | + tcg_gen_smax_i64(d, a, n); | 204 | + AwSdHostClass *sc = AW_SDHOST_CLASS(klass); |
77 | + tcg_gen_smin_i64(d, d, m); | 205 | + sc->max_desc_size = 8 * KiB; |
78 | +} | 206 | + sc->is_sun4i = false; |
79 | + | 207 | + sc->can_calibrate = true; |
80 | +static void gen_sclamp_vec(unsigned vece, TCGv_vec d, TCGv_vec n, | 208 | } |
81 | + TCGv_vec m, TCGv_vec a) | 209 | |
82 | +{ | 210 | static const TypeInfo allwinner_sdhost_info = { |
83 | + tcg_gen_smax_vec(vece, d, a, n); | 211 | @@ -XXX,XX +XXX,XX @@ static const TypeInfo allwinner_sdhost_sun5i_info = { |
84 | + tcg_gen_smin_vec(vece, d, d, m); | 212 | .class_init = allwinner_sdhost_sun5i_class_init, |
85 | +} | 213 | }; |
86 | + | 214 | |
87 | +static void gen_sclamp(unsigned vece, uint32_t d, uint32_t n, uint32_t m, | 215 | +static const TypeInfo allwinner_sdhost_sun50i_a64_info = { |
88 | + uint32_t a, uint32_t oprsz, uint32_t maxsz) | 216 | + .name = TYPE_AW_SDHOST_SUN50I_A64, |
89 | +{ | 217 | + .parent = TYPE_AW_SDHOST, |
90 | + static const TCGOpcode vecop[] = { | 218 | + .class_init = allwinner_sdhost_sun50i_a64_class_init, |
91 | + INDEX_op_smin_vec, INDEX_op_smax_vec, 0 | 219 | +}; |
92 | + }; | 220 | + |
93 | + static const GVecGen4 ops[4] = { | 221 | +static const TypeInfo allwinner_sdhost_sun50i_a64_emmc_info = { |
94 | + { .fniv = gen_sclamp_vec, | 222 | + .name = TYPE_AW_SDHOST_SUN50I_A64_EMMC, |
95 | + .fno = gen_helper_gvec_sclamp_b, | 223 | + .parent = TYPE_AW_SDHOST, |
96 | + .opt_opc = vecop, | 224 | + .class_init = allwinner_sdhost_sun50i_a64_emmc_class_init, |
97 | + .vece = MO_8 }, | 225 | +}; |
98 | + { .fniv = gen_sclamp_vec, | 226 | + |
99 | + .fno = gen_helper_gvec_sclamp_h, | 227 | static const TypeInfo allwinner_sdhost_bus_info = { |
100 | + .opt_opc = vecop, | 228 | .name = TYPE_AW_SDHOST_BUS, |
101 | + .vece = MO_16 }, | 229 | .parent = TYPE_SD_BUS, |
102 | + { .fni4 = gen_sclamp_i32, | 230 | @@ -XXX,XX +XXX,XX @@ static void allwinner_sdhost_register_types(void) |
103 | + .fniv = gen_sclamp_vec, | 231 | type_register_static(&allwinner_sdhost_info); |
104 | + .fno = gen_helper_gvec_sclamp_s, | 232 | type_register_static(&allwinner_sdhost_sun4i_info); |
105 | + .opt_opc = vecop, | 233 | type_register_static(&allwinner_sdhost_sun5i_info); |
106 | + .vece = MO_32 }, | 234 | + type_register_static(&allwinner_sdhost_sun50i_a64_info); |
107 | + { .fni8 = gen_sclamp_i64, | 235 | + type_register_static(&allwinner_sdhost_sun50i_a64_emmc_info); |
108 | + .fniv = gen_sclamp_vec, | 236 | type_register_static(&allwinner_sdhost_bus_info); |
109 | + .fno = gen_helper_gvec_sclamp_d, | 237 | } |
110 | + .opt_opc = vecop, | 238 | |
111 | + .vece = MO_64, | ||
112 | + .prefer_i64 = TCG_TARGET_REG_BITS == 64 } | ||
113 | + }; | ||
114 | + tcg_gen_gvec_4(d, n, m, a, oprsz, maxsz, &ops[vece]); | ||
115 | +} | ||
116 | + | ||
117 | +TRANS_FEAT(SCLAMP, aa64_sme, gen_gvec_fn_arg_zzzz, gen_sclamp, a) | ||
118 | + | ||
119 | +static void gen_uclamp_i32(TCGv_i32 d, TCGv_i32 n, TCGv_i32 m, TCGv_i32 a) | ||
120 | +{ | ||
121 | + tcg_gen_umax_i32(d, a, n); | ||
122 | + tcg_gen_umin_i32(d, d, m); | ||
123 | +} | ||
124 | + | ||
125 | +static void gen_uclamp_i64(TCGv_i64 d, TCGv_i64 n, TCGv_i64 m, TCGv_i64 a) | ||
126 | +{ | ||
127 | + tcg_gen_umax_i64(d, a, n); | ||
128 | + tcg_gen_umin_i64(d, d, m); | ||
129 | +} | ||
130 | + | ||
131 | +static void gen_uclamp_vec(unsigned vece, TCGv_vec d, TCGv_vec n, | ||
132 | + TCGv_vec m, TCGv_vec a) | ||
133 | +{ | ||
134 | + tcg_gen_umax_vec(vece, d, a, n); | ||
135 | + tcg_gen_umin_vec(vece, d, d, m); | ||
136 | +} | ||
137 | + | ||
138 | +static void gen_uclamp(unsigned vece, uint32_t d, uint32_t n, uint32_t m, | ||
139 | + uint32_t a, uint32_t oprsz, uint32_t maxsz) | ||
140 | +{ | ||
141 | + static const TCGOpcode vecop[] = { | ||
142 | + INDEX_op_umin_vec, INDEX_op_umax_vec, 0 | ||
143 | + }; | ||
144 | + static const GVecGen4 ops[4] = { | ||
145 | + { .fniv = gen_uclamp_vec, | ||
146 | + .fno = gen_helper_gvec_uclamp_b, | ||
147 | + .opt_opc = vecop, | ||
148 | + .vece = MO_8 }, | ||
149 | + { .fniv = gen_uclamp_vec, | ||
150 | + .fno = gen_helper_gvec_uclamp_h, | ||
151 | + .opt_opc = vecop, | ||
152 | + .vece = MO_16 }, | ||
153 | + { .fni4 = gen_uclamp_i32, | ||
154 | + .fniv = gen_uclamp_vec, | ||
155 | + .fno = gen_helper_gvec_uclamp_s, | ||
156 | + .opt_opc = vecop, | ||
157 | + .vece = MO_32 }, | ||
158 | + { .fni8 = gen_uclamp_i64, | ||
159 | + .fniv = gen_uclamp_vec, | ||
160 | + .fno = gen_helper_gvec_uclamp_d, | ||
161 | + .opt_opc = vecop, | ||
162 | + .vece = MO_64, | ||
163 | + .prefer_i64 = TCG_TARGET_REG_BITS == 64 } | ||
164 | + }; | ||
165 | + tcg_gen_gvec_4(d, n, m, a, oprsz, maxsz, &ops[vece]); | ||
166 | +} | ||
167 | + | ||
168 | +TRANS_FEAT(UCLAMP, aa64_sme, gen_gvec_fn_arg_zzzz, gen_uclamp, a) | ||
169 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
170 | index XXXXXXX..XXXXXXX 100644 | ||
171 | --- a/target/arm/vec_helper.c | ||
172 | +++ b/target/arm/vec_helper.c | ||
173 | @@ -XXX,XX +XXX,XX @@ void HELPER(gvec_bfmlal_idx)(void *vd, void *vn, void *vm, | ||
174 | } | ||
175 | clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
176 | } | ||
177 | + | ||
178 | +#define DO_CLAMP(NAME, TYPE) \ | ||
179 | +void HELPER(NAME)(void *d, void *n, void *m, void *a, uint32_t desc) \ | ||
180 | +{ \ | ||
181 | + intptr_t i, opr_sz = simd_oprsz(desc); \ | ||
182 | + for (i = 0; i < opr_sz; i += sizeof(TYPE)) { \ | ||
183 | + TYPE aa = *(TYPE *)(a + i); \ | ||
184 | + TYPE nn = *(TYPE *)(n + i); \ | ||
185 | + TYPE mm = *(TYPE *)(m + i); \ | ||
186 | + TYPE dd = MIN(MAX(aa, nn), mm); \ | ||
187 | + *(TYPE *)(d + i) = dd; \ | ||
188 | + } \ | ||
189 | + clear_tail(d, opr_sz, simd_maxsz(desc)); \ | ||
190 | +} | ||
191 | + | ||
192 | +DO_CLAMP(gvec_sclamp_b, int8_t) | ||
193 | +DO_CLAMP(gvec_sclamp_h, int16_t) | ||
194 | +DO_CLAMP(gvec_sclamp_s, int32_t) | ||
195 | +DO_CLAMP(gvec_sclamp_d, int64_t) | ||
196 | + | ||
197 | +DO_CLAMP(gvec_uclamp_b, uint8_t) | ||
198 | +DO_CLAMP(gvec_uclamp_h, uint16_t) | ||
199 | +DO_CLAMP(gvec_uclamp_s, uint32_t) | ||
200 | +DO_CLAMP(gvec_uclamp_d, uint64_t) | ||
201 | -- | 239 | -- |
202 | 2.25.1 | 240 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | This is an SVE instruction that operates using the SVE vector | 3 | R40 has two ethernet controllers named as emac and gmac. The emac is |
4 | length but that it is present only if SME is implemented. | 4 | compatibled with A10, and the GMAC is compatibled with H3. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20220708151540.18136-30-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 8 | --- |
11 | target/arm/helper-sve.h | 2 ++ | 9 | include/hw/arm/allwinner-r40.h | 6 ++++ |
12 | target/arm/sve.decode | 1 + | 10 | hw/arm/allwinner-r40.c | 50 ++++++++++++++++++++++++++++++++-- |
13 | target/arm/sve_helper.c | 16 ++++++++++++++++ | 11 | hw/arm/bananapi_m2u.c | 3 ++ |
14 | target/arm/translate-sve.c | 2 ++ | 12 | 3 files changed, 57 insertions(+), 2 deletions(-) |
15 | 4 files changed, 21 insertions(+) | ||
16 | 13 | ||
17 | diff --git a/target/arm/helper-sve.h b/target/arm/helper-sve.h | 14 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
18 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/helper-sve.h | 16 | --- a/include/hw/arm/allwinner-r40.h |
20 | +++ b/target/arm/helper-sve.h | 17 | +++ b/include/hw/arm/allwinner-r40.h |
21 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(sve_revh_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 18 | @@ -XXX,XX +XXX,XX @@ |
22 | 19 | #include "hw/misc/allwinner-r40-ccu.h" | |
23 | DEF_HELPER_FLAGS_4(sve_revw_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 20 | #include "hw/misc/allwinner-r40-dramc.h" |
24 | 21 | #include "hw/i2c/allwinner-i2c.h" | |
25 | +DEF_HELPER_FLAGS_4(sme_revd_q, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 22 | +#include "hw/net/allwinner_emac.h" |
23 | +#include "hw/net/allwinner-sun8i-emac.h" | ||
24 | #include "target/arm/cpu.h" | ||
25 | #include "sysemu/block-backend.h" | ||
26 | |||
27 | @@ -XXX,XX +XXX,XX @@ enum { | ||
28 | AW_R40_DEV_SRAM_A2, | ||
29 | AW_R40_DEV_SRAM_A3, | ||
30 | AW_R40_DEV_SRAM_A4, | ||
31 | + AW_R40_DEV_EMAC, | ||
32 | AW_R40_DEV_MMC0, | ||
33 | AW_R40_DEV_MMC1, | ||
34 | AW_R40_DEV_MMC2, | ||
35 | @@ -XXX,XX +XXX,XX @@ enum { | ||
36 | AW_R40_DEV_UART6, | ||
37 | AW_R40_DEV_UART7, | ||
38 | AW_R40_DEV_TWI0, | ||
39 | + AW_R40_DEV_GMAC, | ||
40 | AW_R40_DEV_GIC_DIST, | ||
41 | AW_R40_DEV_GIC_CPU, | ||
42 | AW_R40_DEV_GIC_HYP, | ||
43 | @@ -XXX,XX +XXX,XX @@ struct AwR40State { | ||
44 | AwR40ClockCtlState ccu; | ||
45 | AwR40DramCtlState dramc; | ||
46 | AWI2CState i2c0; | ||
47 | + AwEmacState emac; | ||
48 | + AwSun8iEmacState gmac; | ||
49 | GICState gic; | ||
50 | MemoryRegion sram_a1; | ||
51 | MemoryRegion sram_a2; | ||
52 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
53 | index XXXXXXX..XXXXXXX 100644 | ||
54 | --- a/hw/arm/allwinner-r40.c | ||
55 | +++ b/hw/arm/allwinner-r40.c | ||
56 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
57 | [AW_R40_DEV_SRAM_A2] = 0x00004000, | ||
58 | [AW_R40_DEV_SRAM_A3] = 0x00008000, | ||
59 | [AW_R40_DEV_SRAM_A4] = 0x0000b400, | ||
60 | + [AW_R40_DEV_EMAC] = 0x01c0b000, | ||
61 | [AW_R40_DEV_MMC0] = 0x01c0f000, | ||
62 | [AW_R40_DEV_MMC1] = 0x01c10000, | ||
63 | [AW_R40_DEV_MMC2] = 0x01c11000, | ||
64 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
65 | [AW_R40_DEV_UART6] = 0x01c29800, | ||
66 | [AW_R40_DEV_UART7] = 0x01c29c00, | ||
67 | [AW_R40_DEV_TWI0] = 0x01c2ac00, | ||
68 | + [AW_R40_DEV_GMAC] = 0x01c50000, | ||
69 | [AW_R40_DEV_DRAMCOM] = 0x01c62000, | ||
70 | [AW_R40_DEV_DRAMCTL] = 0x01c63000, | ||
71 | [AW_R40_DEV_DRAMPHY] = 0x01c65000, | ||
72 | @@ -XXX,XX +XXX,XX @@ static struct AwR40Unimplemented r40_unimplemented[] = { | ||
73 | { "spi1", 0x01c06000, 4 * KiB }, | ||
74 | { "cs0", 0x01c09000, 4 * KiB }, | ||
75 | { "keymem", 0x01c0a000, 4 * KiB }, | ||
76 | - { "emac", 0x01c0b000, 4 * KiB }, | ||
77 | { "usb0-otg", 0x01c13000, 4 * KiB }, | ||
78 | { "usb0-host", 0x01c14000, 4 * KiB }, | ||
79 | { "crypto", 0x01c15000, 4 * KiB }, | ||
80 | @@ -XXX,XX +XXX,XX @@ static struct AwR40Unimplemented r40_unimplemented[] = { | ||
81 | { "tvd2", 0x01c33000, 4 * KiB }, | ||
82 | { "tvd3", 0x01c34000, 4 * KiB }, | ||
83 | { "gpu", 0x01c40000, 64 * KiB }, | ||
84 | - { "gmac", 0x01c50000, 64 * KiB }, | ||
85 | { "hstmr", 0x01c60000, 4 * KiB }, | ||
86 | { "tcon-top", 0x01c70000, 4 * KiB }, | ||
87 | { "lcd0", 0x01c71000, 4 * KiB }, | ||
88 | @@ -XXX,XX +XXX,XX @@ enum { | ||
89 | AW_R40_GIC_SPI_MMC1 = 33, | ||
90 | AW_R40_GIC_SPI_MMC2 = 34, | ||
91 | AW_R40_GIC_SPI_MMC3 = 35, | ||
92 | + AW_R40_GIC_SPI_EMAC = 55, | ||
93 | + AW_R40_GIC_SPI_GMAC = 85, | ||
94 | }; | ||
95 | |||
96 | /* Allwinner R40 general constants */ | ||
97 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) | ||
98 | |||
99 | object_initialize_child(obj, "twi0", &s->i2c0, TYPE_AW_I2C_SUN6I); | ||
100 | |||
101 | + object_initialize_child(obj, "emac", &s->emac, TYPE_AW_EMAC); | ||
102 | + object_initialize_child(obj, "gmac", &s->gmac, TYPE_AW_SUN8I_EMAC); | ||
103 | + object_property_add_alias(obj, "gmac-phy-addr", | ||
104 | + OBJECT(&s->gmac), "phy-addr"); | ||
26 | + | 105 | + |
27 | DEF_HELPER_FLAGS_4(sve_rbit_b, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 106 | object_initialize_child(obj, "dramc", &s->dramc, TYPE_AW_R40_DRAMC); |
28 | DEF_HELPER_FLAGS_4(sve_rbit_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 107 | object_property_add_alias(obj, "ram-addr", OBJECT(&s->dramc), |
29 | DEF_HELPER_FLAGS_4(sve_rbit_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 108 | "ram-addr"); |
30 | diff --git a/target/arm/sve.decode b/target/arm/sve.decode | 109 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) |
31 | index XXXXXXX..XXXXXXX 100644 | 110 | |
32 | --- a/target/arm/sve.decode | 111 | static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
33 | +++ b/target/arm/sve.decode | 112 | { |
34 | @@ -XXX,XX +XXX,XX @@ REVB 00000101 .. 1001 00 100 ... ..... ..... @rd_pg_rn | 113 | + const char *r40_nic_models[] = { "gmac", "emac", NULL }; |
35 | REVH 00000101 .. 1001 01 100 ... ..... ..... @rd_pg_rn | 114 | AwR40State *s = AW_R40(dev); |
36 | REVW 00000101 .. 1001 10 100 ... ..... ..... @rd_pg_rn | 115 | unsigned i; |
37 | RBIT 00000101 .. 1001 11 100 ... ..... ..... @rd_pg_rn | 116 | |
38 | +REVD 00000101 00 1011 10 100 ... ..... ..... @rd_pg_rn_e0 | 117 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
39 | 118 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 2, | |
40 | # SVE vector splice (predicated, destructive) | 119 | s->memmap[AW_R40_DEV_DRAMPHY]); |
41 | SPLICE 00000101 .. 101 100 100 ... ..... ..... @rdn_pg_rm | 120 | |
42 | diff --git a/target/arm/sve_helper.c b/target/arm/sve_helper.c | 121 | + /* nic support gmac and emac */ |
43 | index XXXXXXX..XXXXXXX 100644 | 122 | + for (int i = 0; i < ARRAY_SIZE(r40_nic_models) - 1; i++) { |
44 | --- a/target/arm/sve_helper.c | 123 | + NICInfo *nic = &nd_table[i]; |
45 | +++ b/target/arm/sve_helper.c | ||
46 | @@ -XXX,XX +XXX,XX @@ DO_ZPZ_D(sve_revh_d, uint64_t, hswap64) | ||
47 | |||
48 | DO_ZPZ_D(sve_revw_d, uint64_t, wswap64) | ||
49 | |||
50 | +void HELPER(sme_revd_q)(void *vd, void *vn, void *vg, uint32_t desc) | ||
51 | +{ | ||
52 | + intptr_t i, opr_sz = simd_oprsz(desc) / 8; | ||
53 | + uint64_t *d = vd, *n = vn; | ||
54 | + uint8_t *pg = vg; | ||
55 | + | 124 | + |
56 | + for (i = 0; i < opr_sz; i += 2) { | 125 | + if (!nic->used) { |
57 | + if (pg[H1(i)] & 1) { | 126 | + continue; |
58 | + uint64_t n0 = n[i + 0]; | 127 | + } |
59 | + uint64_t n1 = n[i + 1]; | 128 | + if (qemu_show_nic_models(nic->model, r40_nic_models)) { |
60 | + d[i + 0] = n1; | 129 | + exit(0); |
61 | + d[i + 1] = n0; | 130 | + } |
131 | + | ||
132 | + switch (qemu_find_nic_model(nic, r40_nic_models, r40_nic_models[0])) { | ||
133 | + case 0: /* gmac */ | ||
134 | + qdev_set_nic_properties(DEVICE(&s->gmac), nic); | ||
135 | + break; | ||
136 | + case 1: /* emac */ | ||
137 | + qdev_set_nic_properties(DEVICE(&s->emac), nic); | ||
138 | + break; | ||
139 | + default: | ||
140 | + exit(1); | ||
141 | + break; | ||
62 | + } | 142 | + } |
63 | + } | 143 | + } |
64 | +} | ||
65 | + | 144 | + |
66 | DO_ZPZ(sve_rbit_b, uint8_t, H1, revbit8) | 145 | + /* GMAC */ |
67 | DO_ZPZ(sve_rbit_h, uint16_t, H1_2, revbit16) | 146 | + object_property_set_link(OBJECT(&s->gmac), "dma-memory", |
68 | DO_ZPZ(sve_rbit_s, uint32_t, H1_4, revbit32) | 147 | + OBJECT(get_system_memory()), &error_fatal); |
69 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 148 | + sysbus_realize(SYS_BUS_DEVICE(&s->gmac), &error_fatal); |
149 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gmac), 0, s->memmap[AW_R40_DEV_GMAC]); | ||
150 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gmac), 0, | ||
151 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_GMAC)); | ||
152 | + | ||
153 | + /* EMAC */ | ||
154 | + sysbus_realize(SYS_BUS_DEVICE(&s->emac), &error_fatal); | ||
155 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->emac), 0, s->memmap[AW_R40_DEV_EMAC]); | ||
156 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->emac), 0, | ||
157 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_R40_GIC_SPI_EMAC)); | ||
158 | + | ||
159 | /* Unimplemented devices */ | ||
160 | for (i = 0; i < ARRAY_SIZE(r40_unimplemented); i++) { | ||
161 | create_unimplemented_device(r40_unimplemented[i].device_name, | ||
162 | diff --git a/hw/arm/bananapi_m2u.c b/hw/arm/bananapi_m2u.c | ||
70 | index XXXXXXX..XXXXXXX 100644 | 163 | index XXXXXXX..XXXXXXX 100644 |
71 | --- a/target/arm/translate-sve.c | 164 | --- a/hw/arm/bananapi_m2u.c |
72 | +++ b/target/arm/translate-sve.c | 165 | +++ b/hw/arm/bananapi_m2u.c |
73 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(REVH, aa64_sve, gen_gvec_ool_arg_zpz, revh_fns[a->esz], a, 0) | 166 | @@ -XXX,XX +XXX,XX @@ static void bpim2u_init(MachineState *machine) |
74 | TRANS_FEAT(REVW, aa64_sve, gen_gvec_ool_arg_zpz, | 167 | object_property_set_int(OBJECT(r40), "ram-size", |
75 | a->esz == 3 ? gen_helper_sve_revw_d : NULL, a, 0) | 168 | r40->ram_size, &error_abort); |
76 | 169 | ||
77 | +TRANS_FEAT(REVD, aa64_sme, gen_gvec_ool_arg_zpz, gen_helper_sme_revd_q, a, 0) | 170 | + /* GMAC PHY */ |
171 | + object_property_set_uint(OBJECT(r40), "gmac-phy-addr", 1, &error_abort); | ||
78 | + | 172 | + |
79 | TRANS_FEAT(SPLICE, aa64_sve, gen_gvec_ool_arg_zpzz, | 173 | /* Mark R40 object realized */ |
80 | gen_helper_sve_splice, a, a->esz) | 174 | qdev_realize(DEVICE(r40), NULL, &error_abort); |
81 | 175 | ||
82 | -- | 176 | -- |
83 | 2.25.1 | 177 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | We can reuse the SVE functions for implementing moves to/from | 3 | Only a few important registers are added, especially the SRAM_VER |
4 | horizontal tile slices, but we need new ones for moves to/from | 4 | register. |
5 | vertical tile slices. | ||
6 | 5 | ||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> |
9 | Message-id: 20220708151540.18136-20-richard.henderson@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 9 | --- |
12 | target/arm/helper-sme.h | 12 +++ | 10 | include/hw/arm/allwinner-r40.h | 3 + |
13 | target/arm/helper-sve.h | 2 + | 11 | include/hw/misc/allwinner-sramc.h | 69 +++++++++++ |
14 | target/arm/translate-a64.h | 8 ++ | 12 | hw/arm/allwinner-r40.c | 7 +- |
15 | target/arm/translate.h | 5 ++ | 13 | hw/misc/allwinner-sramc.c | 184 ++++++++++++++++++++++++++++++ |
16 | target/arm/sme.decode | 15 ++++ | 14 | hw/arm/Kconfig | 1 + |
17 | target/arm/sme_helper.c | 151 ++++++++++++++++++++++++++++++++++++- | 15 | hw/misc/Kconfig | 3 + |
18 | target/arm/sve_helper.c | 12 +++ | 16 | hw/misc/meson.build | 1 + |
19 | target/arm/translate-sme.c | 127 +++++++++++++++++++++++++++++++ | 17 | hw/misc/trace-events | 4 + |
20 | 8 files changed, 331 insertions(+), 1 deletion(-) | 18 | 8 files changed, 271 insertions(+), 1 deletion(-) |
19 | create mode 100644 include/hw/misc/allwinner-sramc.h | ||
20 | create mode 100644 hw/misc/allwinner-sramc.c | ||
21 | 21 | ||
22 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 22 | diff --git a/include/hw/arm/allwinner-r40.h b/include/hw/arm/allwinner-r40.h |
23 | index XXXXXXX..XXXXXXX 100644 | 23 | index XXXXXXX..XXXXXXX 100644 |
24 | --- a/target/arm/helper-sme.h | 24 | --- a/include/hw/arm/allwinner-r40.h |
25 | +++ b/target/arm/helper-sme.h | 25 | +++ b/include/hw/arm/allwinner-r40.h |
26 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_2(set_pstate_sm, TCG_CALL_NO_RWG, void, env, i32) | 26 | @@ -XXX,XX +XXX,XX @@ |
27 | DEF_HELPER_FLAGS_2(set_pstate_za, TCG_CALL_NO_RWG, void, env, i32) | 27 | #include "hw/sd/allwinner-sdhost.h" |
28 | 28 | #include "hw/misc/allwinner-r40-ccu.h" | |
29 | DEF_HELPER_FLAGS_3(sme_zero, TCG_CALL_NO_RWG, void, env, i32, i32) | 29 | #include "hw/misc/allwinner-r40-dramc.h" |
30 | + | 30 | +#include "hw/misc/allwinner-sramc.h" |
31 | +/* Move to/from vertical array slices, i.e. columns, so 'c'. */ | 31 | #include "hw/i2c/allwinner-i2c.h" |
32 | +DEF_HELPER_FLAGS_4(sme_mova_cz_b, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 32 | #include "hw/net/allwinner_emac.h" |
33 | +DEF_HELPER_FLAGS_4(sme_mova_zc_b, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 33 | #include "hw/net/allwinner-sun8i-emac.h" |
34 | +DEF_HELPER_FLAGS_4(sme_mova_cz_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 34 | @@ -XXX,XX +XXX,XX @@ enum { |
35 | +DEF_HELPER_FLAGS_4(sme_mova_zc_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 35 | AW_R40_DEV_SRAM_A2, |
36 | +DEF_HELPER_FLAGS_4(sme_mova_cz_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 36 | AW_R40_DEV_SRAM_A3, |
37 | +DEF_HELPER_FLAGS_4(sme_mova_zc_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 37 | AW_R40_DEV_SRAM_A4, |
38 | +DEF_HELPER_FLAGS_4(sme_mova_cz_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 38 | + AW_R40_DEV_SRAMC, |
39 | +DEF_HELPER_FLAGS_4(sme_mova_zc_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 39 | AW_R40_DEV_EMAC, |
40 | +DEF_HELPER_FLAGS_4(sme_mova_cz_q, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 40 | AW_R40_DEV_MMC0, |
41 | +DEF_HELPER_FLAGS_4(sme_mova_zc_q, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | 41 | AW_R40_DEV_MMC1, |
42 | diff --git a/target/arm/helper-sve.h b/target/arm/helper-sve.h | 42 | @@ -XXX,XX +XXX,XX @@ struct AwR40State { |
43 | index XXXXXXX..XXXXXXX 100644 | 43 | |
44 | --- a/target/arm/helper-sve.h | 44 | ARMCPU cpus[AW_R40_NUM_CPUS]; |
45 | +++ b/target/arm/helper-sve.h | 45 | const hwaddr *memmap; |
46 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(sve_sel_zpzz_s, TCG_CALL_NO_RWG, | 46 | + AwSRAMCState sramc; |
47 | void, ptr, ptr, ptr, ptr, i32) | 47 | AwA10PITState timer; |
48 | DEF_HELPER_FLAGS_5(sve_sel_zpzz_d, TCG_CALL_NO_RWG, | 48 | AwSdHostState mmc[AW_R40_NUM_MMCS]; |
49 | void, ptr, ptr, ptr, ptr, i32) | 49 | AwR40ClockCtlState ccu; |
50 | +DEF_HELPER_FLAGS_5(sve_sel_zpzz_q, TCG_CALL_NO_RWG, | 50 | diff --git a/include/hw/misc/allwinner-sramc.h b/include/hw/misc/allwinner-sramc.h |
51 | + void, ptr, ptr, ptr, ptr, i32) | 51 | new file mode 100644 |
52 | 52 | index XXXXXXX..XXXXXXX | |
53 | DEF_HELPER_FLAGS_5(sve2_addp_zpzz_b, TCG_CALL_NO_RWG, | 53 | --- /dev/null |
54 | void, ptr, ptr, ptr, ptr, i32) | 54 | +++ b/include/hw/misc/allwinner-sramc.h |
55 | diff --git a/target/arm/translate-a64.h b/target/arm/translate-a64.h | 55 | @@ -XXX,XX +XXX,XX @@ |
56 | index XXXXXXX..XXXXXXX 100644 | 56 | +/* |
57 | --- a/target/arm/translate-a64.h | 57 | + * Allwinner SRAM controller emulation |
58 | +++ b/target/arm/translate-a64.h | 58 | + * |
59 | @@ -XXX,XX +XXX,XX @@ static inline int pred_gvec_reg_size(DisasContext *s) | 59 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> |
60 | return size_for_gvec(pred_full_reg_size(s)); | 60 | + * |
61 | + * This program is free software: you can redistribute it and/or modify | ||
62 | + * it under the terms of the GNU General Public License as published by | ||
63 | + * the Free Software Foundation, either version 2 of the License, or | ||
64 | + * (at your option) any later version. | ||
65 | + * | ||
66 | + * This program is distributed in the hope that it will be useful, | ||
67 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
68 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
69 | + * GNU General Public License for more details. | ||
70 | + * | ||
71 | + * You should have received a copy of the GNU General Public License | ||
72 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
73 | + */ | ||
74 | + | ||
75 | +#ifndef HW_MISC_ALLWINNER_SRAMC_H | ||
76 | +#define HW_MISC_ALLWINNER_SRAMC_H | ||
77 | + | ||
78 | +#include "qom/object.h" | ||
79 | +#include "hw/sysbus.h" | ||
80 | +#include "qemu/uuid.h" | ||
81 | + | ||
82 | +/** | ||
83 | + * Object model | ||
84 | + * @{ | ||
85 | + */ | ||
86 | +#define TYPE_AW_SRAMC "allwinner-sramc" | ||
87 | +#define TYPE_AW_SRAMC_SUN8I_R40 TYPE_AW_SRAMC "-sun8i-r40" | ||
88 | +OBJECT_DECLARE_TYPE(AwSRAMCState, AwSRAMCClass, AW_SRAMC) | ||
89 | + | ||
90 | +/** @} */ | ||
91 | + | ||
92 | +/** | ||
93 | + * Allwinner SRAMC object instance state | ||
94 | + */ | ||
95 | +struct AwSRAMCState { | ||
96 | + /*< private >*/ | ||
97 | + SysBusDevice parent_obj; | ||
98 | + /*< public >*/ | ||
99 | + | ||
100 | + /** Maps I/O registers in physical memory */ | ||
101 | + MemoryRegion iomem; | ||
102 | + | ||
103 | + /* registers */ | ||
104 | + uint32_t sram_ctl1; | ||
105 | + uint32_t sram_ver; | ||
106 | + uint32_t sram_soft_entry_reg0; | ||
107 | +}; | ||
108 | + | ||
109 | +/** | ||
110 | + * Allwinner SRAM Controller class-level struct. | ||
111 | + * | ||
112 | + * This struct is filled by each sunxi device specific code | ||
113 | + * such that the generic code can use this struct to support | ||
114 | + * all devices. | ||
115 | + */ | ||
116 | +struct AwSRAMCClass { | ||
117 | + /*< private >*/ | ||
118 | + SysBusDeviceClass parent_class; | ||
119 | + /*< public >*/ | ||
120 | + | ||
121 | + uint32_t sram_version_code; | ||
122 | +}; | ||
123 | + | ||
124 | +#endif /* HW_MISC_ALLWINNER_SRAMC_H */ | ||
125 | diff --git a/hw/arm/allwinner-r40.c b/hw/arm/allwinner-r40.c | ||
126 | index XXXXXXX..XXXXXXX 100644 | ||
127 | --- a/hw/arm/allwinner-r40.c | ||
128 | +++ b/hw/arm/allwinner-r40.c | ||
129 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_r40_memmap[] = { | ||
130 | [AW_R40_DEV_SRAM_A2] = 0x00004000, | ||
131 | [AW_R40_DEV_SRAM_A3] = 0x00008000, | ||
132 | [AW_R40_DEV_SRAM_A4] = 0x0000b400, | ||
133 | + [AW_R40_DEV_SRAMC] = 0x01c00000, | ||
134 | [AW_R40_DEV_EMAC] = 0x01c0b000, | ||
135 | [AW_R40_DEV_MMC0] = 0x01c0f000, | ||
136 | [AW_R40_DEV_MMC1] = 0x01c10000, | ||
137 | @@ -XXX,XX +XXX,XX @@ struct AwR40Unimplemented { | ||
138 | static struct AwR40Unimplemented r40_unimplemented[] = { | ||
139 | { "d-engine", 0x01000000, 4 * MiB }, | ||
140 | { "d-inter", 0x01400000, 128 * KiB }, | ||
141 | - { "sram-c", 0x01c00000, 4 * KiB }, | ||
142 | { "dma", 0x01c02000, 4 * KiB }, | ||
143 | { "nfdc", 0x01c03000, 4 * KiB }, | ||
144 | { "ts", 0x01c04000, 4 * KiB }, | ||
145 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_init(Object *obj) | ||
146 | "ram-addr"); | ||
147 | object_property_add_alias(obj, "ram-size", OBJECT(&s->dramc), | ||
148 | "ram-size"); | ||
149 | + | ||
150 | + object_initialize_child(obj, "sramc", &s->sramc, TYPE_AW_SRAMC_SUN8I_R40); | ||
61 | } | 151 | } |
62 | 152 | ||
63 | +/* Return a newly allocated pointer to the predicate register. */ | 153 | static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
64 | +static inline TCGv_ptr pred_full_reg_ptr(DisasContext *s, int regno) | 154 | @@ -XXX,XX +XXX,XX @@ static void allwinner_r40_realize(DeviceState *dev, Error **errp) |
65 | +{ | 155 | AW_R40_GIC_SPI_TIMER1)); |
66 | + TCGv_ptr ret = tcg_temp_new_ptr(); | 156 | |
67 | + tcg_gen_addi_ptr(ret, cpu_env, pred_full_reg_offset(s, regno)); | 157 | /* SRAM */ |
68 | + return ret; | 158 | + sysbus_realize(SYS_BUS_DEVICE(&s->sramc), &error_fatal); |
69 | +} | 159 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->sramc), 0, s->memmap[AW_R40_DEV_SRAMC]); |
70 | + | 160 | + |
71 | bool disas_sve(DisasContext *, uint32_t); | 161 | memory_region_init_ram(&s->sram_a1, OBJECT(dev), "sram A1", |
72 | bool disas_sme(DisasContext *, uint32_t); | 162 | 16 * KiB, &error_abort); |
73 | 163 | memory_region_init_ram(&s->sram_a2, OBJECT(dev), "sram A2", | |
74 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 164 | diff --git a/hw/misc/allwinner-sramc.c b/hw/misc/allwinner-sramc.c |
75 | index XXXXXXX..XXXXXXX 100644 | 165 | new file mode 100644 |
76 | --- a/target/arm/translate.h | 166 | index XXXXXXX..XXXXXXX |
77 | +++ b/target/arm/translate.h | 167 | --- /dev/null |
78 | @@ -XXX,XX +XXX,XX @@ static inline int plus_2(DisasContext *s, int x) | 168 | +++ b/hw/misc/allwinner-sramc.c |
79 | return x + 2; | ||
80 | } | ||
81 | |||
82 | +static inline int plus_12(DisasContext *s, int x) | ||
83 | +{ | ||
84 | + return x + 12; | ||
85 | +} | ||
86 | + | ||
87 | static inline int times_2(DisasContext *s, int x) | ||
88 | { | ||
89 | return x * 2; | ||
90 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | ||
91 | index XXXXXXX..XXXXXXX 100644 | ||
92 | --- a/target/arm/sme.decode | ||
93 | +++ b/target/arm/sme.decode | ||
94 | @@ -XXX,XX +XXX,XX @@ | 169 | @@ -XXX,XX +XXX,XX @@ |
95 | ### SME Misc | ||
96 | |||
97 | ZERO 11000000 00 001 00000000000 imm:8 | ||
98 | + | ||
99 | +### SME Move into/from Array | ||
100 | + | ||
101 | +%mova_rs 13:2 !function=plus_12 | ||
102 | +&mova esz rs pg zr za_imm v:bool to_vec:bool | ||
103 | + | ||
104 | +MOVA 11000000 esz:2 00000 0 v:1 .. pg:3 zr:5 0 za_imm:4 \ | ||
105 | + &mova to_vec=0 rs=%mova_rs | ||
106 | +MOVA 11000000 11 00000 1 v:1 .. pg:3 zr:5 0 za_imm:4 \ | ||
107 | + &mova to_vec=0 rs=%mova_rs esz=4 | ||
108 | + | ||
109 | +MOVA 11000000 esz:2 00001 0 v:1 .. pg:3 0 za_imm:4 zr:5 \ | ||
110 | + &mova to_vec=1 rs=%mova_rs | ||
111 | +MOVA 11000000 11 00001 1 v:1 .. pg:3 0 za_imm:4 zr:5 \ | ||
112 | + &mova to_vec=1 rs=%mova_rs esz=4 | ||
113 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | ||
114 | index XXXXXXX..XXXXXXX 100644 | ||
115 | --- a/target/arm/sme_helper.c | ||
116 | +++ b/target/arm/sme_helper.c | ||
117 | @@ -XXX,XX +XXX,XX @@ | ||
118 | |||
119 | #include "qemu/osdep.h" | ||
120 | #include "cpu.h" | ||
121 | -#include "internals.h" | ||
122 | +#include "tcg/tcg-gvec-desc.h" | ||
123 | #include "exec/helper-proto.h" | ||
124 | +#include "qemu/int128.h" | ||
125 | +#include "vec_internal.h" | ||
126 | |||
127 | /* ResetSVEState */ | ||
128 | void arm_reset_sve_state(CPUARMState *env) | ||
129 | @@ -XXX,XX +XXX,XX @@ void helper_sme_zero(CPUARMState *env, uint32_t imm, uint32_t svl) | ||
130 | } | ||
131 | } | ||
132 | } | ||
133 | + | ||
134 | + | ||
135 | +/* | 170 | +/* |
136 | + * When considering the ZA storage as an array of elements of | 171 | + * Allwinner R40 SRAM controller emulation |
137 | + * type T, the index within that array of the Nth element of | 172 | + * |
138 | + * a vertical slice of a tile can be calculated like this, | 173 | + * Copyright (C) 2023 qianfan Zhao <qianfanguijin@163.com> |
139 | + * regardless of the size of type T. This is because the tiles | 174 | + * |
140 | + * are interleaved, so if type T is size N bytes then row 1 of | 175 | + * This program is free software: you can redistribute it and/or modify |
141 | + * the tile is N rows away from row 0. The division by N to | 176 | + * it under the terms of the GNU General Public License as published by |
142 | + * convert a byte offset into an array index and the multiplication | 177 | + * the Free Software Foundation, either version 2 of the License, or |
143 | + * by N to convert from vslice-index-within-the-tile to | 178 | + * (at your option) any later version. |
144 | + * the index within the ZA storage cancel out. | 179 | + * |
145 | + */ | 180 | + * This program is distributed in the hope that it will be useful, |
146 | +#define tile_vslice_index(i) ((i) * sizeof(ARMVectorReg)) | 181 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of |
182 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
183 | + * GNU General Public License for more details. | ||
184 | + * | ||
185 | + * You should have received a copy of the GNU General Public License | ||
186 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
187 | + */ | ||
188 | + | ||
189 | +#include "qemu/osdep.h" | ||
190 | +#include "qemu/units.h" | ||
191 | +#include "hw/sysbus.h" | ||
192 | +#include "migration/vmstate.h" | ||
193 | +#include "qemu/log.h" | ||
194 | +#include "qemu/module.h" | ||
195 | +#include "qapi/error.h" | ||
196 | +#include "hw/qdev-properties.h" | ||
197 | +#include "hw/qdev-properties-system.h" | ||
198 | +#include "hw/misc/allwinner-sramc.h" | ||
199 | +#include "trace.h" | ||
147 | + | 200 | + |
148 | +/* | 201 | +/* |
149 | + * When doing byte arithmetic on the ZA storage, the element | 202 | + * register offsets |
150 | + * byteoff bytes away in a tile vertical slice is always this | 203 | + * https://linux-sunxi.org/SRAM_Controller_Register_Guide |
151 | + * many bytes away in the ZA storage, regardless of the | 204 | + */ |
152 | + * size of the tile element, assuming that byteoff is a multiple | 205 | +enum { |
153 | + * of the element size. Again this is because of the interleaving | 206 | + REG_SRAM_CTL1_CFG = 0x04, /* SRAM Control register 1 */ |
154 | + * of the tiles. For instance if we have 1 byte per element then | 207 | + REG_SRAM_VER = 0x24, /* SRAM Version register */ |
155 | + * each row of the ZA storage has one byte of the vslice data, | 208 | + REG_SRAM_R40_SOFT_ENTRY_REG0 = 0xbc, |
156 | + * and (counting from 0) byte 8 goes in row 8 of the storage | 209 | +}; |
157 | + * at offset (8 * row-size-in-bytes). | 210 | + |
158 | + * If we have 8 bytes per element then each row of the ZA storage | 211 | +/* REG_SRAMC_VERSION bit defines */ |
159 | + * has 8 bytes of the data, but there are 8 interleaved tiles and | 212 | +#define SRAM_VER_READ_ENABLE (1 << 15) |
160 | + * so byte 8 of the data goes into row 1 of the tile, | 213 | +#define SRAM_VER_VERSION_SHIFT 16 |
161 | + * which is again row 8 of the storage, so the offset is still | 214 | +#define SRAM_VERSION_SUN8I_R40 0x1701 |
162 | + * (8 * row-size-in-bytes). Similarly for other element sizes. | 215 | + |
163 | + */ | 216 | +static uint64_t allwinner_sramc_read(void *opaque, hwaddr offset, |
164 | +#define tile_vslice_offset(byteoff) ((byteoff) * sizeof(ARMVectorReg)) | 217 | + unsigned size) |
165 | + | 218 | +{ |
166 | + | 219 | + AwSRAMCState *s = AW_SRAMC(opaque); |
167 | +/* | 220 | + AwSRAMCClass *sc = AW_SRAMC_GET_CLASS(s); |
168 | + * Move Zreg vector to ZArray column. | 221 | + uint64_t val = 0; |
169 | + */ | 222 | + |
170 | +#define DO_MOVA_C(NAME, TYPE, H) \ | 223 | + switch (offset) { |
171 | +void HELPER(NAME)(void *za, void *vn, void *vg, uint32_t desc) \ | 224 | + case REG_SRAM_CTL1_CFG: |
172 | +{ \ | 225 | + val = s->sram_ctl1; |
173 | + int i, oprsz = simd_oprsz(desc); \ | 226 | + break; |
174 | + for (i = 0; i < oprsz; ) { \ | 227 | + case REG_SRAM_VER: |
175 | + uint16_t pg = *(uint16_t *)(vg + H1_2(i >> 3)); \ | 228 | + /* bit15: lock bit, set this bit before reading this register */ |
176 | + do { \ | 229 | + if (s->sram_ver & SRAM_VER_READ_ENABLE) { |
177 | + if (pg & 1) { \ | 230 | + val = SRAM_VER_READ_ENABLE | |
178 | + *(TYPE *)(za + tile_vslice_offset(i)) = *(TYPE *)(vn + H(i)); \ | 231 | + (sc->sram_version_code << SRAM_VER_VERSION_SHIFT); |
179 | + } \ | ||
180 | + i += sizeof(TYPE); \ | ||
181 | + pg >>= sizeof(TYPE); \ | ||
182 | + } while (i & 15); \ | ||
183 | + } \ | ||
184 | +} | ||
185 | + | ||
186 | +DO_MOVA_C(sme_mova_cz_b, uint8_t, H1) | ||
187 | +DO_MOVA_C(sme_mova_cz_h, uint16_t, H1_2) | ||
188 | +DO_MOVA_C(sme_mova_cz_s, uint32_t, H1_4) | ||
189 | + | ||
190 | +void HELPER(sme_mova_cz_d)(void *za, void *vn, void *vg, uint32_t desc) | ||
191 | +{ | ||
192 | + int i, oprsz = simd_oprsz(desc) / 8; | ||
193 | + uint8_t *pg = vg; | ||
194 | + uint64_t *n = vn; | ||
195 | + uint64_t *a = za; | ||
196 | + | ||
197 | + for (i = 0; i < oprsz; i++) { | ||
198 | + if (pg[H1(i)] & 1) { | ||
199 | + a[tile_vslice_index(i)] = n[i]; | ||
200 | + } | 232 | + } |
233 | + break; | ||
234 | + case REG_SRAM_R40_SOFT_ENTRY_REG0: | ||
235 | + val = s->sram_soft_entry_reg0; | ||
236 | + break; | ||
237 | + default: | ||
238 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
239 | + __func__, (uint32_t)offset); | ||
240 | + return 0; | ||
201 | + } | 241 | + } |
202 | +} | 242 | + |
203 | + | 243 | + trace_allwinner_sramc_read(offset, val); |
204 | +void HELPER(sme_mova_cz_q)(void *za, void *vn, void *vg, uint32_t desc) | 244 | + |
205 | +{ | 245 | + return val; |
206 | + int i, oprsz = simd_oprsz(desc) / 16; | 246 | +} |
207 | + uint16_t *pg = vg; | 247 | + |
208 | + Int128 *n = vn; | 248 | +static void allwinner_sramc_write(void *opaque, hwaddr offset, |
209 | + Int128 *a = za; | 249 | + uint64_t val, unsigned size) |
210 | + | 250 | +{ |
211 | + /* | 251 | + AwSRAMCState *s = AW_SRAMC(opaque); |
212 | + * Int128 is used here simply to copy 16 bytes, and to simplify | 252 | + |
213 | + * the address arithmetic. | 253 | + trace_allwinner_sramc_write(offset, val); |
214 | + */ | 254 | + |
215 | + for (i = 0; i < oprsz; i++) { | 255 | + switch (offset) { |
216 | + if (pg[H2(i)] & 1) { | 256 | + case REG_SRAM_CTL1_CFG: |
217 | + a[tile_vslice_index(i)] = n[i]; | 257 | + s->sram_ctl1 = val; |
218 | + } | 258 | + break; |
259 | + case REG_SRAM_VER: | ||
260 | + /* Only the READ_ENABLE bit is writeable */ | ||
261 | + s->sram_ver = val & SRAM_VER_READ_ENABLE; | ||
262 | + break; | ||
263 | + case REG_SRAM_R40_SOFT_ENTRY_REG0: | ||
264 | + s->sram_soft_entry_reg0 = val; | ||
265 | + break; | ||
266 | + default: | ||
267 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
268 | + __func__, (uint32_t)offset); | ||
269 | + break; | ||
219 | + } | 270 | + } |
220 | +} | 271 | +} |
221 | + | 272 | + |
222 | +#undef DO_MOVA_C | 273 | +static const MemoryRegionOps allwinner_sramc_ops = { |
223 | + | 274 | + .read = allwinner_sramc_read, |
224 | +/* | 275 | + .write = allwinner_sramc_write, |
225 | + * Move ZArray column to Zreg vector. | 276 | + .endianness = DEVICE_NATIVE_ENDIAN, |
226 | + */ | 277 | + .valid = { |
227 | +#define DO_MOVA_Z(NAME, TYPE, H) \ | 278 | + .min_access_size = 4, |
228 | +void HELPER(NAME)(void *vd, void *za, void *vg, uint32_t desc) \ | 279 | + .max_access_size = 4, |
229 | +{ \ | 280 | + }, |
230 | + int i, oprsz = simd_oprsz(desc); \ | 281 | + .impl.min_access_size = 4, |
231 | + for (i = 0; i < oprsz; ) { \ | 282 | +}; |
232 | + uint16_t pg = *(uint16_t *)(vg + H1_2(i >> 3)); \ | 283 | + |
233 | + do { \ | 284 | +static const VMStateDescription allwinner_sramc_vmstate = { |
234 | + if (pg & 1) { \ | 285 | + .name = "allwinner-sramc", |
235 | + *(TYPE *)(vd + H(i)) = *(TYPE *)(za + tile_vslice_offset(i)); \ | 286 | + .version_id = 1, |
236 | + } \ | 287 | + .minimum_version_id = 1, |
237 | + i += sizeof(TYPE); \ | 288 | + .fields = (VMStateField[]) { |
238 | + pg >>= sizeof(TYPE); \ | 289 | + VMSTATE_UINT32(sram_ver, AwSRAMCState), |
239 | + } while (i & 15); \ | 290 | + VMSTATE_UINT32(sram_soft_entry_reg0, AwSRAMCState), |
240 | + } \ | 291 | + VMSTATE_END_OF_LIST() |
241 | +} | ||
242 | + | ||
243 | +DO_MOVA_Z(sme_mova_zc_b, uint8_t, H1) | ||
244 | +DO_MOVA_Z(sme_mova_zc_h, uint16_t, H1_2) | ||
245 | +DO_MOVA_Z(sme_mova_zc_s, uint32_t, H1_4) | ||
246 | + | ||
247 | +void HELPER(sme_mova_zc_d)(void *vd, void *za, void *vg, uint32_t desc) | ||
248 | +{ | ||
249 | + int i, oprsz = simd_oprsz(desc) / 8; | ||
250 | + uint8_t *pg = vg; | ||
251 | + uint64_t *d = vd; | ||
252 | + uint64_t *a = za; | ||
253 | + | ||
254 | + for (i = 0; i < oprsz; i++) { | ||
255 | + if (pg[H1(i)] & 1) { | ||
256 | + d[i] = a[tile_vslice_index(i)]; | ||
257 | + } | ||
258 | + } | 292 | + } |
259 | +} | 293 | +}; |
260 | + | 294 | + |
261 | +void HELPER(sme_mova_zc_q)(void *vd, void *za, void *vg, uint32_t desc) | 295 | +static void allwinner_sramc_reset(DeviceState *dev) |
262 | +{ | 296 | +{ |
263 | + int i, oprsz = simd_oprsz(desc) / 16; | 297 | + AwSRAMCState *s = AW_SRAMC(dev); |
264 | + uint16_t *pg = vg; | 298 | + AwSRAMCClass *sc = AW_SRAMC_GET_CLASS(s); |
265 | + Int128 *d = vd; | 299 | + |
266 | + Int128 *a = za; | 300 | + switch (sc->sram_version_code) { |
267 | + | 301 | + case SRAM_VERSION_SUN8I_R40: |
268 | + /* | 302 | + s->sram_ctl1 = 0x1300; |
269 | + * Int128 is used here simply to copy 16 bytes, and to simplify | 303 | + break; |
270 | + * the address arithmetic. | ||
271 | + */ | ||
272 | + for (i = 0; i < oprsz; i++, za += sizeof(ARMVectorReg)) { | ||
273 | + if (pg[H2(i)] & 1) { | ||
274 | + d[i] = a[tile_vslice_index(i)]; | ||
275 | + } | ||
276 | + } | 304 | + } |
277 | +} | 305 | +} |
278 | + | 306 | + |
279 | +#undef DO_MOVA_Z | 307 | +static void allwinner_sramc_class_init(ObjectClass *klass, void *data) |
280 | diff --git a/target/arm/sve_helper.c b/target/arm/sve_helper.c | 308 | +{ |
281 | index XXXXXXX..XXXXXXX 100644 | 309 | + DeviceClass *dc = DEVICE_CLASS(klass); |
282 | --- a/target/arm/sve_helper.c | 310 | + |
283 | +++ b/target/arm/sve_helper.c | 311 | + dc->reset = allwinner_sramc_reset; |
284 | @@ -XXX,XX +XXX,XX @@ void HELPER(sve_sel_zpzz_d)(void *vd, void *vn, void *vm, | 312 | + dc->vmsd = &allwinner_sramc_vmstate; |
285 | } | 313 | +} |
286 | } | 314 | + |
287 | 315 | +static void allwinner_sramc_init(Object *obj) | |
288 | +void HELPER(sve_sel_zpzz_q)(void *vd, void *vn, void *vm, | 316 | +{ |
289 | + void *vg, uint32_t desc) | 317 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); |
290 | +{ | 318 | + AwSRAMCState *s = AW_SRAMC(obj); |
291 | + intptr_t i, opr_sz = simd_oprsz(desc) / 16; | 319 | + |
292 | + Int128 *d = vd, *n = vn, *m = vm; | 320 | + /* Memory mapping */ |
293 | + uint16_t *pg = vg; | 321 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_sramc_ops, s, |
294 | + | 322 | + TYPE_AW_SRAMC, 1 * KiB); |
295 | + for (i = 0; i < opr_sz; i += 1) { | 323 | + sysbus_init_mmio(sbd, &s->iomem); |
296 | + d[i] = (pg[H2(i)] & 1 ? n : m)[i]; | 324 | +} |
297 | + } | 325 | + |
298 | +} | 326 | +static const TypeInfo allwinner_sramc_info = { |
299 | + | 327 | + .name = TYPE_AW_SRAMC, |
300 | /* Two operand comparison controlled by a predicate. | 328 | + .parent = TYPE_SYS_BUS_DEVICE, |
301 | * ??? It is very tempting to want to be able to expand this inline | 329 | + .instance_init = allwinner_sramc_init, |
302 | * with x86 instructions, e.g. | 330 | + .instance_size = sizeof(AwSRAMCState), |
303 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 331 | + .class_init = allwinner_sramc_class_init, |
304 | index XXXXXXX..XXXXXXX 100644 | 332 | +}; |
305 | --- a/target/arm/translate-sme.c | 333 | + |
306 | +++ b/target/arm/translate-sme.c | 334 | +static void allwinner_r40_sramc_class_init(ObjectClass *klass, void *data) |
307 | @@ -XXX,XX +XXX,XX @@ | 335 | +{ |
308 | #include "decode-sme.c.inc" | 336 | + AwSRAMCClass *sc = AW_SRAMC_CLASS(klass); |
309 | 337 | + | |
310 | 338 | + sc->sram_version_code = SRAM_VERSION_SUN8I_R40; | |
311 | +/* | 339 | +} |
312 | + * Resolve tile.size[index] to a host pointer, where tile and index | 340 | + |
313 | + * are always decoded together, dependent on the element size. | 341 | +static const TypeInfo allwinner_r40_sramc_info = { |
314 | + */ | 342 | + .name = TYPE_AW_SRAMC_SUN8I_R40, |
315 | +static TCGv_ptr get_tile_rowcol(DisasContext *s, int esz, int rs, | 343 | + .parent = TYPE_AW_SRAMC, |
316 | + int tile_index, bool vertical) | 344 | + .class_init = allwinner_r40_sramc_class_init, |
317 | +{ | 345 | +}; |
318 | + int tile = tile_index >> (4 - esz); | 346 | + |
319 | + int index = esz == MO_128 ? 0 : extract32(tile_index, 0, 4 - esz); | 347 | +static void allwinner_sramc_register(void) |
320 | + int pos, len, offset; | 348 | +{ |
321 | + TCGv_i32 tmp; | 349 | + type_register_static(&allwinner_sramc_info); |
322 | + TCGv_ptr addr; | 350 | + type_register_static(&allwinner_r40_sramc_info); |
323 | + | 351 | +} |
324 | + /* Compute the final index, which is Rs+imm. */ | 352 | + |
325 | + tmp = tcg_temp_new_i32(); | 353 | +type_init(allwinner_sramc_register) |
326 | + tcg_gen_trunc_tl_i32(tmp, cpu_reg(s, rs)); | 354 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig |
327 | + tcg_gen_addi_i32(tmp, tmp, index); | 355 | index XXXXXXX..XXXXXXX 100644 |
328 | + | 356 | --- a/hw/arm/Kconfig |
329 | + /* Prepare a power-of-two modulo via extraction of @len bits. */ | 357 | +++ b/hw/arm/Kconfig |
330 | + len = ctz32(streaming_vec_reg_size(s)) - esz; | 358 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_H3 |
331 | + | 359 | config ALLWINNER_R40 |
332 | + if (vertical) { | 360 | bool |
333 | + /* | 361 | default y if TCG && ARM |
334 | + * Compute the byte offset of the index within the tile: | 362 | + select ALLWINNER_SRAMC |
335 | + * (index % (svl / size)) * size | 363 | select ALLWINNER_A10_PIT |
336 | + * = (index % (svl >> esz)) << esz | 364 | select AXP2XX_PMU |
337 | + * Perform the power-of-two modulo via extraction of the low @len bits. | 365 | select SERIAL |
338 | + * Perform the multiply by shifting left by @pos bits. | 366 | diff --git a/hw/misc/Kconfig b/hw/misc/Kconfig |
339 | + * Perform these operations simultaneously via deposit into zero. | 367 | index XXXXXXX..XXXXXXX 100644 |
340 | + */ | 368 | --- a/hw/misc/Kconfig |
341 | + pos = esz; | 369 | +++ b/hw/misc/Kconfig |
342 | + tcg_gen_deposit_z_i32(tmp, tmp, pos, len); | 370 | @@ -XXX,XX +XXX,XX @@ config VIRT_CTRL |
343 | + | 371 | config LASI |
344 | + /* | 372 | bool |
345 | + * For big-endian, adjust the indexed column byte offset within | 373 | |
346 | + * the uint64_t host words that make up env->zarray[]. | 374 | +config ALLWINNER_SRAMC |
347 | + */ | 375 | + bool |
348 | + if (HOST_BIG_ENDIAN && esz < MO_64) { | 376 | + |
349 | + tcg_gen_xori_i32(tmp, tmp, 8 - (1 << esz)); | 377 | config ALLWINNER_A10_CCM |
350 | + } | 378 | bool |
351 | + } else { | 379 | |
352 | + /* | 380 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build |
353 | + * Compute the byte offset of the index within the tile: | 381 | index XXXXXXX..XXXXXXX 100644 |
354 | + * (index % (svl / size)) * (size * sizeof(row)) | 382 | --- a/hw/misc/meson.build |
355 | + * = (index % (svl >> esz)) << (esz + log2(sizeof(row))) | 383 | +++ b/hw/misc/meson.build |
356 | + */ | 384 | @@ -XXX,XX +XXX,XX @@ subdir('macio') |
357 | + pos = esz + ctz32(sizeof(ARMVectorReg)); | 385 | |
358 | + tcg_gen_deposit_z_i32(tmp, tmp, pos, len); | 386 | softmmu_ss.add(when: 'CONFIG_IVSHMEM_DEVICE', if_true: files('ivshmem.c')) |
359 | + | 387 | |
360 | + /* Row slices are always aligned and need no endian adjustment. */ | 388 | +softmmu_ss.add(when: 'CONFIG_ALLWINNER_SRAMC', if_true: files('allwinner-sramc.c')) |
361 | + } | 389 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_A10_CCM', if_true: files('allwinner-a10-ccm.c')) |
362 | + | 390 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_A10_DRAMC', if_true: files('allwinner-a10-dramc.c')) |
363 | + /* The tile byte offset within env->zarray is the row. */ | 391 | softmmu_ss.add(when: 'CONFIG_ALLWINNER_H3', if_true: files('allwinner-h3-ccu.c')) |
364 | + offset = tile * sizeof(ARMVectorReg); | 392 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events |
365 | + | 393 | index XXXXXXX..XXXXXXX 100644 |
366 | + /* Include the byte offset of zarray to make this relative to env. */ | 394 | --- a/hw/misc/trace-events |
367 | + offset += offsetof(CPUARMState, zarray); | 395 | +++ b/hw/misc/trace-events |
368 | + tcg_gen_addi_i32(tmp, tmp, offset); | 396 | @@ -XXX,XX +XXX,XX @@ allwinner_r40_dramphy_write(uint64_t offset, uint64_t data, unsigned size) "writ |
369 | + | 397 | allwinner_sid_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 |
370 | + /* Add the byte offset to env to produce the final pointer. */ | 398 | allwinner_sid_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 |
371 | + addr = tcg_temp_new_ptr(); | 399 | |
372 | + tcg_gen_ext_i32_ptr(addr, tmp); | 400 | +# allwinner-sramc.c |
373 | + tcg_temp_free_i32(tmp); | 401 | +allwinner_sramc_read(uint64_t offset, uint64_t data) "offset 0x%" PRIx64 " data 0x%" PRIx64 |
374 | + tcg_gen_add_ptr(addr, addr, cpu_env); | 402 | +allwinner_sramc_write(uint64_t offset, uint64_t data) "offset 0x%" PRIx64 " data 0x%" PRIx64 |
375 | + | 403 | + |
376 | + return addr; | 404 | # avr_power.c |
377 | +} | 405 | avr_power_read(uint8_t value) "power_reduc read value:%u" |
378 | + | 406 | avr_power_write(uint8_t value) "power_reduc write value:%u" |
379 | static bool trans_ZERO(DisasContext *s, arg_ZERO *a) | ||
380 | { | ||
381 | if (!dc_isar_feature(aa64_sme, s)) { | ||
382 | @@ -XXX,XX +XXX,XX @@ static bool trans_ZERO(DisasContext *s, arg_ZERO *a) | ||
383 | } | ||
384 | return true; | ||
385 | } | ||
386 | + | ||
387 | +static bool trans_MOVA(DisasContext *s, arg_MOVA *a) | ||
388 | +{ | ||
389 | + static gen_helper_gvec_4 * const h_fns[5] = { | ||
390 | + gen_helper_sve_sel_zpzz_b, gen_helper_sve_sel_zpzz_h, | ||
391 | + gen_helper_sve_sel_zpzz_s, gen_helper_sve_sel_zpzz_d, | ||
392 | + gen_helper_sve_sel_zpzz_q | ||
393 | + }; | ||
394 | + static gen_helper_gvec_3 * const cz_fns[5] = { | ||
395 | + gen_helper_sme_mova_cz_b, gen_helper_sme_mova_cz_h, | ||
396 | + gen_helper_sme_mova_cz_s, gen_helper_sme_mova_cz_d, | ||
397 | + gen_helper_sme_mova_cz_q, | ||
398 | + }; | ||
399 | + static gen_helper_gvec_3 * const zc_fns[5] = { | ||
400 | + gen_helper_sme_mova_zc_b, gen_helper_sme_mova_zc_h, | ||
401 | + gen_helper_sme_mova_zc_s, gen_helper_sme_mova_zc_d, | ||
402 | + gen_helper_sme_mova_zc_q, | ||
403 | + }; | ||
404 | + | ||
405 | + TCGv_ptr t_za, t_zr, t_pg; | ||
406 | + TCGv_i32 t_desc; | ||
407 | + int svl; | ||
408 | + | ||
409 | + if (!dc_isar_feature(aa64_sme, s)) { | ||
410 | + return false; | ||
411 | + } | ||
412 | + if (!sme_smza_enabled_check(s)) { | ||
413 | + return true; | ||
414 | + } | ||
415 | + | ||
416 | + t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v); | ||
417 | + t_zr = vec_full_reg_ptr(s, a->zr); | ||
418 | + t_pg = pred_full_reg_ptr(s, a->pg); | ||
419 | + | ||
420 | + svl = streaming_vec_reg_size(s); | ||
421 | + t_desc = tcg_constant_i32(simd_desc(svl, svl, 0)); | ||
422 | + | ||
423 | + if (a->v) { | ||
424 | + /* Vertical slice -- use sme mova helpers. */ | ||
425 | + if (a->to_vec) { | ||
426 | + zc_fns[a->esz](t_zr, t_za, t_pg, t_desc); | ||
427 | + } else { | ||
428 | + cz_fns[a->esz](t_za, t_zr, t_pg, t_desc); | ||
429 | + } | ||
430 | + } else { | ||
431 | + /* Horizontal slice -- reuse sve sel helpers. */ | ||
432 | + if (a->to_vec) { | ||
433 | + h_fns[a->esz](t_zr, t_za, t_zr, t_pg, t_desc); | ||
434 | + } else { | ||
435 | + h_fns[a->esz](t_za, t_zr, t_za, t_pg, t_desc); | ||
436 | + } | ||
437 | + } | ||
438 | + | ||
439 | + tcg_temp_free_ptr(t_za); | ||
440 | + tcg_temp_free_ptr(t_zr); | ||
441 | + tcg_temp_free_ptr(t_pg); | ||
442 | + | ||
443 | + return true; | ||
444 | +} | ||
445 | -- | 407 | -- |
446 | 2.25.1 | 408 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | In parse_user_sigframe, the kernel rejects duplicate sve records, | 3 | Add test case for booting from initrd and sd card. |
4 | or records that are smaller than the header. We were silently | ||
5 | allowing these cases to pass, dropping the record. | ||
6 | 4 | ||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 5 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 6 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> |
9 | Message-id: 20220708151540.18136-38-richard.henderson@linaro.org | 7 | Tested-by: Niek Linnenbank <nieklinnenbank@gmail.com> |
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 9 | --- |
12 | linux-user/aarch64/signal.c | 5 ++++- | 10 | tests/avocado/boot_linux_console.py | 176 ++++++++++++++++++++++++++++ |
13 | 1 file changed, 4 insertions(+), 1 deletion(-) | 11 | 1 file changed, 176 insertions(+) |
14 | 12 | ||
15 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 13 | diff --git a/tests/avocado/boot_linux_console.py b/tests/avocado/boot_linux_console.py |
16 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/linux-user/aarch64/signal.c | 15 | --- a/tests/avocado/boot_linux_console.py |
18 | +++ b/linux-user/aarch64/signal.c | 16 | +++ b/tests/avocado/boot_linux_console.py |
19 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 17 | @@ -XXX,XX +XXX,XX @@ def test_arm_quanta_gsj_initrd(self): |
20 | break; | 18 | self.wait_for_console_pattern( |
21 | 19 | 'Give root password for system maintenance') | |
22 | case TARGET_SVE_MAGIC: | 20 | |
23 | + if (sve || size < sizeof(struct target_sve_context)) { | 21 | + def test_arm_bpim2u(self): |
24 | + goto err; | 22 | + """ |
25 | + } | 23 | + :avocado: tags=arch:arm |
26 | if (cpu_isar_feature(aa64_sve, env_archcpu(env))) { | 24 | + :avocado: tags=machine:bpim2u |
27 | vq = sve_vq(env); | 25 | + :avocado: tags=accel:tcg |
28 | sve_size = QEMU_ALIGN_UP(TARGET_SVE_SIG_CONTEXT_SIZE(vq), 16); | 26 | + """ |
29 | - if (!sve && size == sve_size) { | 27 | + deb_url = ('https://apt.armbian.com/pool/main/l/linux-5.10.16-sunxi/' |
30 | + if (size == sve_size) { | 28 | + 'linux-image-current-sunxi_21.02.2_armhf.deb') |
31 | sve = (struct target_sve_context *)ctx; | 29 | + deb_hash = '9fa84beda245cabf0b4fa84cf6eaa7738ead1da0' |
32 | break; | 30 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) |
33 | } | 31 | + kernel_path = self.extract_from_deb(deb_path, |
32 | + '/boot/vmlinuz-5.10.16-sunxi') | ||
33 | + dtb_path = ('/usr/lib/linux-image-current-sunxi/' | ||
34 | + 'sun8i-r40-bananapi-m2-ultra.dtb') | ||
35 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | ||
36 | + | ||
37 | + self.vm.set_console() | ||
38 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | ||
39 | + 'console=ttyS0,115200n8 ' | ||
40 | + 'earlycon=uart,mmio32,0x1c28000') | ||
41 | + self.vm.add_args('-kernel', kernel_path, | ||
42 | + '-dtb', dtb_path, | ||
43 | + '-append', kernel_command_line) | ||
44 | + self.vm.launch() | ||
45 | + console_pattern = 'Kernel command line: %s' % kernel_command_line | ||
46 | + self.wait_for_console_pattern(console_pattern) | ||
47 | + | ||
48 | + def test_arm_bpim2u_initrd(self): | ||
49 | + """ | ||
50 | + :avocado: tags=arch:arm | ||
51 | + :avocado: tags=accel:tcg | ||
52 | + :avocado: tags=machine:bpim2u | ||
53 | + """ | ||
54 | + deb_url = ('https://apt.armbian.com/pool/main/l/linux-5.10.16-sunxi/' | ||
55 | + 'linux-image-current-sunxi_21.02.2_armhf.deb') | ||
56 | + deb_hash = '9fa84beda245cabf0b4fa84cf6eaa7738ead1da0' | ||
57 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | ||
58 | + kernel_path = self.extract_from_deb(deb_path, | ||
59 | + '/boot/vmlinuz-5.10.16-sunxi') | ||
60 | + dtb_path = ('/usr/lib/linux-image-current-sunxi/' | ||
61 | + 'sun8i-r40-bananapi-m2-ultra.dtb') | ||
62 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | ||
63 | + initrd_url = ('https://github.com/groeck/linux-build-test/raw/' | ||
64 | + '2eb0a73b5d5a28df3170c546ddaaa9757e1e0848/rootfs/' | ||
65 | + 'arm/rootfs-armv7a.cpio.gz') | ||
66 | + initrd_hash = '604b2e45cdf35045846b8bbfbf2129b1891bdc9c' | ||
67 | + initrd_path_gz = self.fetch_asset(initrd_url, asset_hash=initrd_hash) | ||
68 | + initrd_path = os.path.join(self.workdir, 'rootfs.cpio') | ||
69 | + archive.gzip_uncompress(initrd_path_gz, initrd_path) | ||
70 | + | ||
71 | + self.vm.set_console() | ||
72 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | ||
73 | + 'console=ttyS0,115200 ' | ||
74 | + 'panic=-1 noreboot') | ||
75 | + self.vm.add_args('-kernel', kernel_path, | ||
76 | + '-dtb', dtb_path, | ||
77 | + '-initrd', initrd_path, | ||
78 | + '-append', kernel_command_line, | ||
79 | + '-no-reboot') | ||
80 | + self.vm.launch() | ||
81 | + self.wait_for_console_pattern('Boot successful.') | ||
82 | + | ||
83 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | ||
84 | + 'Allwinner sun8i Family') | ||
85 | + exec_command_and_wait_for_pattern(self, 'cat /proc/iomem', | ||
86 | + 'system-control@1c00000') | ||
87 | + exec_command_and_wait_for_pattern(self, 'reboot', | ||
88 | + 'reboot: Restarting system') | ||
89 | + # Wait for VM to shut down gracefully | ||
90 | + self.vm.wait() | ||
91 | + | ||
92 | + def test_arm_bpim2u_gmac(self): | ||
93 | + """ | ||
94 | + :avocado: tags=arch:arm | ||
95 | + :avocado: tags=accel:tcg | ||
96 | + :avocado: tags=machine:bpim2u | ||
97 | + :avocado: tags=device:sd | ||
98 | + """ | ||
99 | + self.require_netdev('user') | ||
100 | + | ||
101 | + deb_url = ('https://apt.armbian.com/pool/main/l/linux-5.10.16-sunxi/' | ||
102 | + 'linux-image-current-sunxi_21.02.2_armhf.deb') | ||
103 | + deb_hash = '9fa84beda245cabf0b4fa84cf6eaa7738ead1da0' | ||
104 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | ||
105 | + kernel_path = self.extract_from_deb(deb_path, | ||
106 | + '/boot/vmlinuz-5.10.16-sunxi') | ||
107 | + dtb_path = ('/usr/lib/linux-image-current-sunxi/' | ||
108 | + 'sun8i-r40-bananapi-m2-ultra.dtb') | ||
109 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | ||
110 | + rootfs_url = ('http://storage.kernelci.org/images/rootfs/buildroot/' | ||
111 | + 'buildroot-baseline/20221116.0/armel/rootfs.ext2.xz') | ||
112 | + rootfs_hash = 'fae32f337c7b87547b10f42599acf109da8b6d9a' | ||
113 | + rootfs_path_xz = self.fetch_asset(rootfs_url, asset_hash=rootfs_hash) | ||
114 | + rootfs_path = os.path.join(self.workdir, 'rootfs.cpio') | ||
115 | + archive.lzma_uncompress(rootfs_path_xz, rootfs_path) | ||
116 | + image_pow2ceil_expand(rootfs_path) | ||
117 | + | ||
118 | + self.vm.set_console() | ||
119 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | ||
120 | + 'console=ttyS0,115200 ' | ||
121 | + 'root=/dev/mmcblk0 rootwait rw ' | ||
122 | + 'panic=-1 noreboot') | ||
123 | + self.vm.add_args('-kernel', kernel_path, | ||
124 | + '-dtb', dtb_path, | ||
125 | + '-drive', 'file=' + rootfs_path + ',if=sd,format=raw', | ||
126 | + '-net', 'nic,model=gmac,netdev=host_gmac', | ||
127 | + '-netdev', 'user,id=host_gmac', | ||
128 | + '-append', kernel_command_line, | ||
129 | + '-no-reboot') | ||
130 | + self.vm.launch() | ||
131 | + shell_ready = "/bin/sh: can't access tty; job control turned off" | ||
132 | + self.wait_for_console_pattern(shell_ready) | ||
133 | + | ||
134 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | ||
135 | + 'Allwinner sun8i Family') | ||
136 | + exec_command_and_wait_for_pattern(self, 'cat /proc/partitions', | ||
137 | + 'mmcblk0') | ||
138 | + exec_command_and_wait_for_pattern(self, 'ifconfig eth0 up', | ||
139 | + 'eth0: Link is Up') | ||
140 | + exec_command_and_wait_for_pattern(self, 'udhcpc eth0', | ||
141 | + 'udhcpc: lease of 10.0.2.15 obtained') | ||
142 | + exec_command_and_wait_for_pattern(self, 'ping -c 3 10.0.2.2', | ||
143 | + '3 packets transmitted, 3 packets received, 0% packet loss') | ||
144 | + exec_command_and_wait_for_pattern(self, 'reboot', | ||
145 | + 'reboot: Restarting system') | ||
146 | + # Wait for VM to shut down gracefully | ||
147 | + self.vm.wait() | ||
148 | + | ||
149 | + @skipUnless(os.getenv('AVOCADO_ALLOW_LARGE_STORAGE'), 'storage limited') | ||
150 | + def test_arm_bpim2u_openwrt_22_03_3(self): | ||
151 | + """ | ||
152 | + :avocado: tags=arch:arm | ||
153 | + :avocado: tags=machine:bpim2u | ||
154 | + :avocado: tags=device:sd | ||
155 | + """ | ||
156 | + | ||
157 | + # This test download a 8.9 MiB compressed image and expand it | ||
158 | + # to 127 MiB. | ||
159 | + image_url = ('https://downloads.openwrt.org/releases/22.03.3/targets/' | ||
160 | + 'sunxi/cortexa7/openwrt-22.03.3-sunxi-cortexa7-' | ||
161 | + 'sinovoip_bananapi-m2-ultra-ext4-sdcard.img.gz') | ||
162 | + image_hash = ('5b41b4e11423e562c6011640f9a7cd3b' | ||
163 | + 'dd0a3d42b83430f7caa70a432e6cd82c') | ||
164 | + image_path_gz = self.fetch_asset(image_url, asset_hash=image_hash, | ||
165 | + algorithm='sha256') | ||
166 | + image_path = archive.extract(image_path_gz, self.workdir) | ||
167 | + image_pow2ceil_expand(image_path) | ||
168 | + | ||
169 | + self.vm.set_console() | ||
170 | + self.vm.add_args('-drive', 'file=' + image_path + ',if=sd,format=raw', | ||
171 | + '-nic', 'user', | ||
172 | + '-no-reboot') | ||
173 | + self.vm.launch() | ||
174 | + | ||
175 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | ||
176 | + 'usbcore.nousb ' | ||
177 | + 'noreboot') | ||
178 | + | ||
179 | + self.wait_for_console_pattern('U-Boot SPL') | ||
180 | + | ||
181 | + interrupt_interactive_console_until_pattern( | ||
182 | + self, 'Hit any key to stop autoboot:', '=>') | ||
183 | + exec_command_and_wait_for_pattern(self, "setenv extraargs '" + | ||
184 | + kernel_command_line + "'", '=>') | ||
185 | + exec_command_and_wait_for_pattern(self, 'boot', 'Starting kernel ...'); | ||
186 | + | ||
187 | + self.wait_for_console_pattern( | ||
188 | + 'Please press Enter to activate this console.') | ||
189 | + | ||
190 | + exec_command_and_wait_for_pattern(self, ' ', 'root@') | ||
191 | + | ||
192 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | ||
193 | + 'Allwinner sun8i Family') | ||
194 | + exec_command_and_wait_for_pattern(self, 'cat /proc/iomem', | ||
195 | + 'system-control@1c00000') | ||
196 | + | ||
197 | def test_arm_orangepi(self): | ||
198 | """ | ||
199 | :avocado: tags=arch:arm | ||
34 | -- | 200 | -- |
35 | 2.25.1 | 201 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: qianfan Zhao <qianfanguijin@163.com> |
---|---|---|---|
2 | 2 | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 3 | Add documents for Banana Pi M2U |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 4 | |
5 | Message-id: 20220708151540.18136-35-richard.henderson@linaro.org | 5 | Signed-off-by: qianfan Zhao <qianfanguijin@163.com> |
6 | Reviewed-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
7 | [PMM: Minor format fixes to correct sphinx errors] | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 9 | --- |
8 | linux-user/aarch64/cpu_loop.c | 9 +++++++++ | 10 | docs/system/arm/bananapi_m2u.rst | 139 +++++++++++++++++++++++++++++++ |
9 | 1 file changed, 9 insertions(+) | 11 | docs/system/target-arm.rst | 1 + |
12 | 2 files changed, 140 insertions(+) | ||
13 | create mode 100644 docs/system/arm/bananapi_m2u.rst | ||
10 | 14 | ||
11 | diff --git a/linux-user/aarch64/cpu_loop.c b/linux-user/aarch64/cpu_loop.c | 15 | diff --git a/docs/system/arm/bananapi_m2u.rst b/docs/system/arm/bananapi_m2u.rst |
16 | new file mode 100644 | ||
17 | index XXXXXXX..XXXXXXX | ||
18 | --- /dev/null | ||
19 | +++ b/docs/system/arm/bananapi_m2u.rst | ||
20 | @@ -XXX,XX +XXX,XX @@ | ||
21 | +Banana Pi BPI-M2U (``bpim2u``) | ||
22 | +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ | ||
23 | + | ||
24 | +Banana Pi BPI-M2 Ultra is a quad-core mini single board computer built with | ||
25 | +Allwinner A40i/R40/V40 SoC. It features 2GB of RAM and 8GB eMMC. It also | ||
26 | +has onboard WiFi and BT. On the ports side, the BPI-M2 Ultra has 2 USB A | ||
27 | +2.0 ports, 1 USB OTG port, 1 HDMI port, 1 audio jack, a DC power port, | ||
28 | +and last but not least, a SATA port. | ||
29 | + | ||
30 | +Supported devices | ||
31 | +""""""""""""""""" | ||
32 | + | ||
33 | +The Banana Pi M2U machine supports the following devices: | ||
34 | + | ||
35 | + * SMP (Quad Core Cortex-A7) | ||
36 | + * Generic Interrupt Controller configuration | ||
37 | + * SRAM mappings | ||
38 | + * SDRAM controller | ||
39 | + * Timer device (re-used from Allwinner A10) | ||
40 | + * UART | ||
41 | + * SD/MMC storage controller | ||
42 | + * EMAC ethernet | ||
43 | + * GMAC ethernet | ||
44 | + * Clock Control Unit | ||
45 | + * TWI (I2C) | ||
46 | + | ||
47 | +Limitations | ||
48 | +""""""""""" | ||
49 | + | ||
50 | +Currently, Banana Pi M2U does *not* support the following features: | ||
51 | + | ||
52 | +- Graphical output via HDMI, GPU and/or the Display Engine | ||
53 | +- Audio output | ||
54 | +- Hardware Watchdog | ||
55 | +- Real Time Clock | ||
56 | +- USB 2.0 interfaces | ||
57 | + | ||
58 | +Also see the 'unimplemented' array in the Allwinner R40 SoC module | ||
59 | +for a complete list of unimplemented I/O devices: ``./hw/arm/allwinner-r40.c`` | ||
60 | + | ||
61 | +Boot options | ||
62 | +"""""""""""" | ||
63 | + | ||
64 | +The Banana Pi M2U machine can start using the standard -kernel functionality | ||
65 | +for loading a Linux kernel or ELF executable. Additionally, the Banana Pi M2U | ||
66 | +machine can also emulate the BootROM which is present on an actual Allwinner R40 | ||
67 | +based SoC, which loads the bootloader from a SD card, specified via the -sd | ||
68 | +argument to qemu-system-arm. | ||
69 | + | ||
70 | +Running mainline Linux | ||
71 | +"""""""""""""""""""""" | ||
72 | + | ||
73 | +To build a Linux mainline kernel that can be booted by the Banana Pi M2U machine, | ||
74 | +simply configure the kernel using the sunxi_defconfig configuration: | ||
75 | + | ||
76 | +.. code-block:: bash | ||
77 | + | ||
78 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make mrproper | ||
79 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make sunxi_defconfig | ||
80 | + | ||
81 | +To boot the newly build linux kernel in QEMU with the Banana Pi M2U machine, use: | ||
82 | + | ||
83 | +.. code-block:: bash | ||
84 | + | ||
85 | + $ qemu-system-arm -M bpim2u -nographic \ | ||
86 | + -kernel /path/to/linux/arch/arm/boot/zImage \ | ||
87 | + -append 'console=ttyS0,115200' \ | ||
88 | + -dtb /path/to/linux/arch/arm/boot/dts/sun8i-r40-bananapi-m2-ultra.dtb | ||
89 | + | ||
90 | +Banana Pi M2U images | ||
91 | +"""""""""""""""""""" | ||
92 | + | ||
93 | +Note that the mainline kernel does not have a root filesystem. You can choose | ||
94 | +to build you own image with buildroot using the bananapi_m2_ultra_defconfig. | ||
95 | +Also see https://buildroot.org for more information. | ||
96 | + | ||
97 | +Another possibility is to run an OpenWrt image for Banana Pi M2U which | ||
98 | +can be downloaded from: | ||
99 | + | ||
100 | + https://downloads.openwrt.org/releases/22.03.3/targets/sunxi/cortexa7/ | ||
101 | + | ||
102 | +When using an image as an SD card, it must be resized to a power of two. This can be | ||
103 | +done with the ``qemu-img`` command. It is recommended to only increase the image size | ||
104 | +instead of shrinking it to a power of two, to avoid loss of data. For example, | ||
105 | +to prepare a downloaded Armbian image, first extract it and then increase | ||
106 | +its size to one gigabyte as follows: | ||
107 | + | ||
108 | +.. code-block:: bash | ||
109 | + | ||
110 | + $ qemu-img resize \ | ||
111 | + openwrt-22.03.3-sunxi-cortexa7-sinovoip_bananapi-m2-ultra-ext4-sdcard.img \ | ||
112 | + 1G | ||
113 | + | ||
114 | +Instead of providing a custom Linux kernel via the -kernel command you may also | ||
115 | +choose to let the Banana Pi M2U machine load the bootloader from SD card, just like | ||
116 | +a real board would do using the BootROM. Simply pass the selected image via the -sd | ||
117 | +argument and remove the -kernel, -append, -dbt and -initrd arguments: | ||
118 | + | ||
119 | +.. code-block:: bash | ||
120 | + | ||
121 | + $ qemu-system-arm -M bpim2u -nic user -nographic \ | ||
122 | + -sd openwrt-22.03.3-sunxi-cortexa7-sinovoip_bananapi-m2-ultra-ext4-sdcard.img | ||
123 | + | ||
124 | +Running U-Boot | ||
125 | +"""""""""""""" | ||
126 | + | ||
127 | +U-Boot mainline can be build and configured using the Bananapi_M2_Ultra_defconfig | ||
128 | +using similar commands as describe above for Linux. Note that it is recommended | ||
129 | +for development/testing to select the following configuration setting in U-Boot: | ||
130 | + | ||
131 | + Device Tree Control > Provider for DTB for DT Control > Embedded DTB | ||
132 | + | ||
133 | +The BootROM of allwinner R40 loading u-boot from the 8KiB offset of sdcard. | ||
134 | +Let's create an bootable disk image: | ||
135 | + | ||
136 | +.. code-block:: bash | ||
137 | + | ||
138 | + $ dd if=/dev/zero of=sd.img bs=32M count=1 | ||
139 | + $ dd if=u-boot-sunxi-with-spl.bin of=sd.img bs=1k seek=8 conv=notrunc | ||
140 | + | ||
141 | +And then boot it. | ||
142 | + | ||
143 | +.. code-block:: bash | ||
144 | + | ||
145 | + $ qemu-system-arm -M bpim2u -nographic -sd sd.img | ||
146 | + | ||
147 | +Banana Pi M2U integration tests | ||
148 | +""""""""""""""""""""""""""""""" | ||
149 | + | ||
150 | +The Banana Pi M2U machine has several integration tests included. | ||
151 | +To run the whole set of tests, build QEMU from source and simply | ||
152 | +provide the following command: | ||
153 | + | ||
154 | +.. code-block:: bash | ||
155 | + | ||
156 | + $ cd qemu-build-dir | ||
157 | + $ AVOCADO_ALLOW_LARGE_STORAGE=yes tests/venv/bin/avocado \ | ||
158 | + --verbose --show=app,console run -t machine:bpim2u \ | ||
159 | + ../tests/avocado/boot_linux_console.py | ||
160 | diff --git a/docs/system/target-arm.rst b/docs/system/target-arm.rst | ||
12 | index XXXXXXX..XXXXXXX 100644 | 161 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/linux-user/aarch64/cpu_loop.c | 162 | --- a/docs/system/target-arm.rst |
14 | +++ b/linux-user/aarch64/cpu_loop.c | 163 | +++ b/docs/system/target-arm.rst |
15 | @@ -XXX,XX +XXX,XX @@ void cpu_loop(CPUARMState *env) | 164 | @@ -XXX,XX +XXX,XX @@ undocumented; you can get a complete list by running |
16 | 165 | arm/versatile | |
17 | switch (trapnr) { | 166 | arm/vexpress |
18 | case EXCP_SWI: | 167 | arm/aspeed |
19 | + /* | 168 | + arm/bananapi_m2u.rst |
20 | + * On syscall, PSTATE.ZA is preserved, along with the ZA matrix. | 169 | arm/sabrelite |
21 | + * PSTATE.SM is cleared, per SMSTOP, which does ResetSVEState. | 170 | arm/digic |
22 | + */ | 171 | arm/cubieboard |
23 | + if (FIELD_EX64(env->svcr, SVCR, SM)) { | ||
24 | + env->svcr = FIELD_DP64(env->svcr, SVCR, SM, 0); | ||
25 | + arm_rebuild_hflags(env); | ||
26 | + arm_reset_sve_state(env); | ||
27 | + } | ||
28 | ret = do_syscall(env, | ||
29 | env->xregs[8], | ||
30 | env->xregs[0], | ||
31 | -- | 172 | -- |
32 | 2.25.1 | 173 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | Document the meaning of exclusive_high in a big-endian context, |
4 | if full a64 support is not enabled in streaming mode. | 4 | and why we can't change it now. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-15-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-2-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme-fa64.decode | 3 --- | 11 | target/arm/cpu.h | 8 ++++++++ |
12 | target/arm/translate-sve.c | 2 ++ | 12 | 1 file changed, 8 insertions(+) |
13 | 2 files changed, 2 insertions(+), 3 deletions(-) | ||
14 | 13 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 14 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 16 | --- a/target/arm/cpu.h |
18 | +++ b/target/arm/sme-fa64.decode | 17 | +++ b/target/arm/cpu.h |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 18 | @@ -XXX,XX +XXX,XX @@ typedef struct CPUArchState { |
20 | # --11 1100 --0- ---- ---- ---- ---- ---- # Load/store FP register (unscaled imm) | 19 | uint64_t zcr_el[4]; /* ZCR_EL[1-3] */ |
21 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 20 | uint64_t smcr_el[4]; /* SMCR_EL[1-3] */ |
22 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 21 | } vfp; |
23 | - | 22 | + |
24 | -FAIL 1010 010- -01- ---- 000- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+scalar) | 23 | uint64_t exclusive_addr; |
25 | -FAIL 1010 010- -010 ---- 001- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+imm) | 24 | uint64_t exclusive_val; |
26 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 25 | + /* |
27 | index XXXXXXX..XXXXXXX 100644 | 26 | + * Contains the 'val' for the second 64-bit register of LDXP, which comes |
28 | --- a/target/arm/translate-sve.c | 27 | + * from the higher address, not the high part of a complete 128-bit value. |
29 | +++ b/target/arm/translate-sve.c | 28 | + * In some ways it might be more convenient to record the exclusive value |
30 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1RO_zprr(DisasContext *s, arg_rprr_load *a) | 29 | + * as the low and high halves of a 128 bit data value, but the current |
31 | if (a->rm == 31) { | 30 | + * semantics of these fields are baked into the migration format. |
32 | return false; | 31 | + */ |
33 | } | 32 | uint64_t exclusive_high; |
34 | + s->is_nonstreaming = true; | 33 | |
35 | if (sve_access_check(s)) { | 34 | /* iwMMXt coprocessor state. */ |
36 | TCGv_i64 addr = new_tmp_a64(s); | ||
37 | tcg_gen_shli_i64(addr, cpu_reg(s, a->rm), dtype_msz(a->dtype)); | ||
38 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1RO_zpri(DisasContext *s, arg_rpri_load *a) | ||
39 | if (!dc_isar_feature(aa64_sve_f64mm, s)) { | ||
40 | return false; | ||
41 | } | ||
42 | + s->is_nonstreaming = true; | ||
43 | if (sve_access_check(s)) { | ||
44 | TCGv_i64 addr = new_tmp_a64(s); | ||
45 | tcg_gen_addi_i64(addr, cpu_reg_sp(s, a->rn), a->imm * 32); | ||
46 | -- | 35 | -- |
47 | 2.25.1 | 36 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap if full | 3 | Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org> |
4 | a64 support is not enabled in streaming mode. In this case, introduce | ||
5 | PRF_ns (prefetch non-streaming) to handle the checks. | ||
6 | |||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 5 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
9 | Message-id: 20220708151540.18136-13-richard.henderson@linaro.org | 6 | Message-id: 20230530191438.411344-3-richard.henderson@linaro.org |
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 8 | --- |
12 | target/arm/sme-fa64.decode | 3 --- | 9 | target/arm/cpu.h | 5 +++++ |
13 | target/arm/sve.decode | 10 +++++----- | 10 | 1 file changed, 5 insertions(+) |
14 | target/arm/translate-sve.c | 11 +++++++++++ | ||
15 | 3 files changed, 16 insertions(+), 8 deletions(-) | ||
16 | 11 | ||
17 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 12 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
18 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/sme-fa64.decode | 14 | --- a/target/arm/cpu.h |
20 | +++ b/target/arm/sme-fa64.decode | 15 | +++ b/target/arm/cpu.h |
21 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 16 | @@ -XXX,XX +XXX,XX @@ static inline bool isar_feature_aa64_st(const ARMISARegisters *id) |
22 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 17 | return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, ST) != 0; |
23 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | ||
24 | |||
25 | -FAIL 1000 010- -00- ---- 111- ---- ---- ---- # SVE 32-bit gather prefetch (vector+imm) | ||
26 | -FAIL 1000 0100 0-1- ---- 0--- ---- ---- ---- # SVE 32-bit gather prefetch (scalar+vector) | ||
27 | FAIL 1010 010- ---- ---- 011- ---- ---- ---- # SVE contiguous FF load (scalar+scalar) | ||
28 | FAIL 1010 010- ---1 ---- 101- ---- ---- ---- # SVE contiguous NF load (scalar+imm) | ||
29 | FAIL 1010 010- -01- ---- 000- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+scalar) | ||
30 | FAIL 1010 010- -010 ---- 001- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+imm) | ||
31 | -FAIL 1100 010- ---- ---- ---- ---- ---- ---- # SVE 64-bit gather load/prefetch | ||
32 | diff --git a/target/arm/sve.decode b/target/arm/sve.decode | ||
33 | index XXXXXXX..XXXXXXX 100644 | ||
34 | --- a/target/arm/sve.decode | ||
35 | +++ b/target/arm/sve.decode | ||
36 | @@ -XXX,XX +XXX,XX @@ LD1RO_zpri 1010010 .. 01 0.... 001 ... ..... ..... \ | ||
37 | @rpri_load_msz nreg=0 | ||
38 | |||
39 | # SVE 32-bit gather prefetch (scalar plus 32-bit scaled offsets) | ||
40 | -PRF 1000010 00 -1 ----- 0-- --- ----- 0 ---- | ||
41 | +PRF_ns 1000010 00 -1 ----- 0-- --- ----- 0 ---- | ||
42 | |||
43 | # SVE 32-bit gather prefetch (vector plus immediate) | ||
44 | -PRF 1000010 -- 00 ----- 111 --- ----- 0 ---- | ||
45 | +PRF_ns 1000010 -- 00 ----- 111 --- ----- 0 ---- | ||
46 | |||
47 | # SVE contiguous prefetch (scalar plus immediate) | ||
48 | PRF 1000010 11 1- ----- 0-- --- ----- 0 ---- | ||
49 | @@ -XXX,XX +XXX,XX @@ LD1_zpiz 1100010 .. 01 ..... 1.. ... ..... ..... \ | ||
50 | @rpri_g_load esz=3 | ||
51 | |||
52 | # SVE 64-bit gather prefetch (scalar plus 64-bit scaled offsets) | ||
53 | -PRF 1100010 00 11 ----- 1-- --- ----- 0 ---- | ||
54 | +PRF_ns 1100010 00 11 ----- 1-- --- ----- 0 ---- | ||
55 | |||
56 | # SVE 64-bit gather prefetch (scalar plus unpacked 32-bit scaled offsets) | ||
57 | -PRF 1100010 00 -1 ----- 0-- --- ----- 0 ---- | ||
58 | +PRF_ns 1100010 00 -1 ----- 0-- --- ----- 0 ---- | ||
59 | |||
60 | # SVE 64-bit gather prefetch (vector plus immediate) | ||
61 | -PRF 1100010 -- 00 ----- 111 --- ----- 0 ---- | ||
62 | +PRF_ns 1100010 -- 00 ----- 111 --- ----- 0 ---- | ||
63 | |||
64 | ### SVE Memory Store Group | ||
65 | |||
66 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | ||
67 | index XXXXXXX..XXXXXXX 100644 | ||
68 | --- a/target/arm/translate-sve.c | ||
69 | +++ b/target/arm/translate-sve.c | ||
70 | @@ -XXX,XX +XXX,XX @@ static bool trans_PRF_rr(DisasContext *s, arg_PRF_rr *a) | ||
71 | return true; | ||
72 | } | 18 | } |
73 | 19 | ||
74 | +static bool trans_PRF_ns(DisasContext *s, arg_PRF_ns *a) | 20 | +static inline bool isar_feature_aa64_lse2(const ARMISARegisters *id) |
75 | +{ | 21 | +{ |
76 | + if (!dc_isar_feature(aa64_sve, s)) { | 22 | + return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, AT) != 0; |
77 | + return false; | ||
78 | + } | ||
79 | + /* Prefetch is a nop within QEMU. */ | ||
80 | + s->is_nonstreaming = true; | ||
81 | + (void)sve_access_check(s); | ||
82 | + return true; | ||
83 | +} | 23 | +} |
84 | + | 24 | + |
85 | /* | 25 | static inline bool isar_feature_aa64_fwb(const ARMISARegisters *id) |
86 | * Move Prefix | 26 | { |
87 | * | 27 | return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, FWB) != 0; |
88 | -- | 28 | -- |
89 | 2.25.1 | 29 | 2.34.1 |
30 | |||
31 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Let finalize_memop_atom be the new basic function, with | ||
4 | finalize_memop and finalize_memop_pair testing FEAT_LSE2 | ||
5 | to apply the appropriate atomicity. | ||
6 | |||
7 | Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org> | ||
8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 9 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
4 | Message-id: 20220708151540.18136-27-richard.henderson@linaro.org | 10 | Message-id: 20230530191438.411344-4-richard.henderson@linaro.org |
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | --- | 12 | --- |
8 | target/arm/helper-sme.h | 2 ++ | 13 | target/arm/tcg/translate.h | 39 +++++++++++++++++++++++++++++----- |
9 | target/arm/sme.decode | 1 + | 14 | target/arm/tcg/translate-a64.c | 2 ++ |
10 | target/arm/sme_helper.c | 74 ++++++++++++++++++++++++++++++++++++++ | 15 | target/arm/tcg/translate.c | 1 + |
11 | target/arm/translate-sme.c | 1 + | 16 | 3 files changed, 37 insertions(+), 5 deletions(-) |
12 | 4 files changed, 78 insertions(+) | ||
13 | 17 | ||
14 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 18 | diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h |
15 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/helper-sme.h | 20 | --- a/target/arm/tcg/translate.h |
17 | +++ b/target/arm/helper-sme.h | 21 | +++ b/target/arm/tcg/translate.h |
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(sme_addva_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 22 | @@ -XXX,XX +XXX,XX @@ typedef struct DisasContext { |
19 | DEF_HELPER_FLAGS_5(sme_addha_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 23 | uint64_t features; /* CPU features bits */ |
20 | DEF_HELPER_FLAGS_5(sme_addva_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 24 | bool aarch64; |
21 | 25 | bool thumb; | |
22 | +DEF_HELPER_FLAGS_7(sme_fmopa_h, TCG_CALL_NO_RWG, | 26 | + bool lse2; |
23 | + void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | 27 | /* Because unallocated encodings generate different exception syndrome |
24 | DEF_HELPER_FLAGS_7(sme_fmopa_s, TCG_CALL_NO_RWG, | 28 | * information from traps due to FP being disabled, we can't do a single |
25 | void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | 29 | * "is fp access disabled" check at a high level in the decode tree. |
26 | DEF_HELPER_FLAGS_7(sme_fmopa_d, TCG_CALL_NO_RWG, | 30 | @@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour) |
27 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/sme.decode | ||
30 | +++ b/target/arm/sme.decode | ||
31 | @@ -XXX,XX +XXX,XX @@ FMOPA_s 10000000 100 ..... ... ... ..... . 00 .. @op_32 | ||
32 | FMOPA_d 10000000 110 ..... ... ... ..... . 0 ... @op_64 | ||
33 | |||
34 | BFMOPA 10000001 100 ..... ... ... ..... . 00 .. @op_32 | ||
35 | +FMOPA_h 10000001 101 ..... ... ... ..... . 00 .. @op_32 | ||
36 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | ||
37 | index XXXXXXX..XXXXXXX 100644 | ||
38 | --- a/target/arm/sme_helper.c | ||
39 | +++ b/target/arm/sme_helper.c | ||
40 | @@ -XXX,XX +XXX,XX @@ static inline uint32_t f16mop_adj_pair(uint32_t pair, uint32_t pg, uint32_t neg) | ||
41 | return pair; | ||
42 | } | 31 | } |
43 | 32 | ||
44 | +static float32 f16_dotadd(float32 sum, uint32_t e1, uint32_t e2, | 33 | /** |
45 | + float_status *s_std, float_status *s_odd) | 34 | - * finalize_memop: |
46 | +{ | 35 | + * finalize_memop_atom: |
47 | + float64 e1r = float16_to_float64(e1 & 0xffff, true, s_std); | 36 | * @s: DisasContext |
48 | + float64 e1c = float16_to_float64(e1 >> 16, true, s_std); | 37 | * @opc: size+sign+align of the memory operation |
49 | + float64 e2r = float16_to_float64(e2 & 0xffff, true, s_std); | 38 | + * @atom: atomicity of the memory operation |
50 | + float64 e2c = float16_to_float64(e2 >> 16, true, s_std); | 39 | * |
51 | + float64 t64; | 40 | - * Build the complete MemOp for a memory operation, including alignment |
52 | + float32 t32; | 41 | - * and endianness. |
53 | + | 42 | + * Build the complete MemOp for a memory operation, including alignment, |
54 | + /* | 43 | + * endianness, and atomicity. |
55 | + * The ARM pseudocode function FPDot performs both multiplies | 44 | * |
56 | + * and the add with a single rounding operation. Emulate this | 45 | * If (op & MO_AMASK) then the operation already contains the required |
57 | + * by performing the first multiply in round-to-odd, then doing | 46 | * alignment, e.g. for AccType_ATOMIC. Otherwise, this an optionally |
58 | + * the second multiply as fused multiply-add, and rounding to | 47 | @@ -XXX,XX +XXX,XX @@ static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour) |
59 | + * float32 all in one step. | 48 | * and this is applied here. Note that there is no way to indicate that |
60 | + */ | 49 | * no alignment should ever be enforced; this must be handled manually. |
61 | + t64 = float64_mul(e1r, e2r, s_odd); | 50 | */ |
62 | + t64 = float64r32_muladd(e1c, e2c, t64, 0, s_std); | 51 | -static inline MemOp finalize_memop(DisasContext *s, MemOp opc) |
63 | + | 52 | +static inline MemOp finalize_memop_atom(DisasContext *s, MemOp opc, MemOp atom) |
64 | + /* This conversion is exact, because we've already rounded. */ | 53 | { |
65 | + t32 = float64_to_float32(t64, s_std); | 54 | if (s->align_mem && !(opc & MO_AMASK)) { |
66 | + | 55 | opc |= MO_ALIGN; |
67 | + /* The final accumulation step is not fused. */ | 56 | } |
68 | + return float32_add(sum, t32, s_std); | 57 | - return opc | s->be_data; |
58 | + return opc | atom | s->be_data; | ||
69 | +} | 59 | +} |
70 | + | 60 | + |
71 | +void HELPER(sme_fmopa_h)(void *vza, void *vzn, void *vzm, void *vpn, | 61 | +/** |
72 | + void *vpm, void *vst, uint32_t desc) | 62 | + * finalize_memop: |
63 | + * @s: DisasContext | ||
64 | + * @opc: size+sign+align of the memory operation | ||
65 | + * | ||
66 | + * Like finalize_memop_atom, but with default atomicity. | ||
67 | + */ | ||
68 | +static inline MemOp finalize_memop(DisasContext *s, MemOp opc) | ||
73 | +{ | 69 | +{ |
74 | + intptr_t row, col, oprsz = simd_maxsz(desc); | 70 | + MemOp atom = s->lse2 ? MO_ATOM_WITHIN16 : MO_ATOM_IFALIGN; |
75 | + uint32_t neg = simd_data(desc) * 0x80008000u; | 71 | + return finalize_memop_atom(s, opc, atom); |
76 | + uint16_t *pn = vpn, *pm = vpm; | ||
77 | + float_status fpst_odd, fpst_std; | ||
78 | + | ||
79 | + /* | ||
80 | + * Make a copy of float_status because this operation does not | ||
81 | + * update the cumulative fp exception status. It also produces | ||
82 | + * default nans. Make a second copy with round-to-odd -- see above. | ||
83 | + */ | ||
84 | + fpst_std = *(float_status *)vst; | ||
85 | + set_default_nan_mode(true, &fpst_std); | ||
86 | + fpst_odd = fpst_std; | ||
87 | + set_float_rounding_mode(float_round_to_odd, &fpst_odd); | ||
88 | + | ||
89 | + for (row = 0; row < oprsz; ) { | ||
90 | + uint16_t prow = pn[H2(row >> 4)]; | ||
91 | + do { | ||
92 | + void *vza_row = vza + tile_vslice_offset(row); | ||
93 | + uint32_t n = *(uint32_t *)(vzn + H1_4(row)); | ||
94 | + | ||
95 | + n = f16mop_adj_pair(n, prow, neg); | ||
96 | + | ||
97 | + for (col = 0; col < oprsz; ) { | ||
98 | + uint16_t pcol = pm[H2(col >> 4)]; | ||
99 | + do { | ||
100 | + if (prow & pcol & 0b0101) { | ||
101 | + uint32_t *a = vza_row + H1_4(col); | ||
102 | + uint32_t m = *(uint32_t *)(vzm + H1_4(col)); | ||
103 | + | ||
104 | + m = f16mop_adj_pair(m, pcol, 0); | ||
105 | + *a = f16_dotadd(*a, n, m, &fpst_std, &fpst_odd); | ||
106 | + | ||
107 | + col += 4; | ||
108 | + pcol >>= 4; | ||
109 | + } | ||
110 | + } while (col & 15); | ||
111 | + } | ||
112 | + row += 4; | ||
113 | + prow >>= 4; | ||
114 | + } while (row & 15); | ||
115 | + } | ||
116 | +} | 72 | +} |
117 | + | 73 | + |
118 | void HELPER(sme_bfmopa)(void *vza, void *vzn, void *vzm, void *vpn, | 74 | +/** |
119 | void *vpm, uint32_t desc) | 75 | + * finalize_memop_pair: |
120 | { | 76 | + * @s: DisasContext |
121 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 77 | + * @opc: size+sign+align of the memory operation |
78 | + * | ||
79 | + * Like finalize_memop_atom, but with atomicity for a pair. | ||
80 | + * C.f. Pseudocode for Mem[], operand ispair. | ||
81 | + */ | ||
82 | +static inline MemOp finalize_memop_pair(DisasContext *s, MemOp opc) | ||
83 | +{ | ||
84 | + MemOp atom = s->lse2 ? MO_ATOM_WITHIN16_PAIR : MO_ATOM_IFALIGN_PAIR; | ||
85 | + return finalize_memop_atom(s, opc, atom); | ||
86 | } | ||
87 | |||
88 | /** | ||
89 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c | ||
122 | index XXXXXXX..XXXXXXX 100644 | 90 | index XXXXXXX..XXXXXXX 100644 |
123 | --- a/target/arm/translate-sme.c | 91 | --- a/target/arm/tcg/translate-a64.c |
124 | +++ b/target/arm/translate-sme.c | 92 | +++ b/target/arm/tcg/translate-a64.c |
125 | @@ -XXX,XX +XXX,XX @@ static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz, | 93 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_init_disas_context(DisasContextBase *dcbase, |
126 | return true; | 94 | tcg_debug_assert(dc->tbid & 1); |
127 | } | 95 | #endif |
128 | 96 | ||
129 | +TRANS_FEAT(FMOPA_h, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_h) | 97 | + dc->lse2 = dc_isar_feature(aa64_lse2, dc); |
130 | TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_s) | 98 | + |
131 | TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_fmopa_d) | 99 | /* Single step state. The code-generation logic here is: |
100 | * SS_ACTIVE == 0: | ||
101 | * generate code with no special handling for single-stepping (except | ||
102 | diff --git a/target/arm/tcg/translate.c b/target/arm/tcg/translate.c | ||
103 | index XXXXXXX..XXXXXXX 100644 | ||
104 | --- a/target/arm/tcg/translate.c | ||
105 | +++ b/target/arm/tcg/translate.c | ||
106 | @@ -XXX,XX +XXX,XX @@ static void arm_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs) | ||
107 | dc->sme_trap_nonstreaming = | ||
108 | EX_TBFLAG_A32(tb_flags, SME_TRAP_NONSTREAMING); | ||
109 | } | ||
110 | + dc->lse2 = false; /* applies only to aarch64 */ | ||
111 | dc->cp_regs = cpu->cp_regs; | ||
112 | dc->features = env->features; | ||
132 | 113 | ||
133 | -- | 114 | -- |
134 | 2.25.1 | 115 | 2.34.1 |
116 | |||
117 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | While we don't require 16-byte atomicity here, using a single larger |
4 | if full a64 support is not enabled in streaming mode. | 4 | load simplifies the code, and makes it a closer match to STXP. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-12-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-5-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme-fa64.decode | 9 --------- | 11 | target/arm/tcg/translate-a64.c | 31 ++++++++++++++++++++----------- |
12 | target/arm/translate-sve.c | 6 ++++++ | 12 | 1 file changed, 20 insertions(+), 11 deletions(-) |
13 | 2 files changed, 6 insertions(+), 9 deletions(-) | ||
14 | 13 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 14 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 16 | --- a/target/arm/tcg/translate-a64.c |
18 | +++ b/target/arm/sme-fa64.decode | 17 | +++ b/target/arm/tcg/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 18 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, |
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 19 | TCGv_i64 addr, int size, bool is_pair) |
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 20 | { |
22 | 21 | int idx = get_mem_index(s); | |
23 | -FAIL 1000 010- -00- ---- 10-- ---- ---- ---- # SVE2 32-bit gather NT load (vector+scalar) | 22 | - MemOp memop = s->be_data; |
24 | FAIL 1000 010- -00- ---- 111- ---- ---- ---- # SVE 32-bit gather prefetch (vector+imm) | 23 | + MemOp memop; |
25 | FAIL 1000 0100 0-1- ---- 0--- ---- ---- ---- # SVE 32-bit gather prefetch (scalar+vector) | 24 | |
26 | -FAIL 1000 010- -01- ---- 1--- ---- ---- ---- # SVE 32-bit gather load (vector+imm) | 25 | g_assert(size <= 3); |
27 | -FAIL 1000 0100 0-0- ---- 0--- ---- ---- ---- # SVE 32-bit gather load byte (scalar+vector) | 26 | if (is_pair) { |
28 | -FAIL 1000 0100 1--- ---- 0--- ---- ---- ---- # SVE 32-bit gather load half (scalar+vector) | 27 | g_assert(size >= 2); |
29 | -FAIL 1000 0101 0--- ---- 0--- ---- ---- ---- # SVE 32-bit gather load word (scalar+vector) | 28 | if (size == 2) { |
30 | FAIL 1010 010- ---- ---- 011- ---- ---- ---- # SVE contiguous FF load (scalar+scalar) | 29 | /* The pair must be single-copy atomic for the doubleword. */ |
31 | FAIL 1010 010- ---1 ---- 101- ---- ---- ---- # SVE contiguous NF load (scalar+imm) | 30 | - memop |= MO_64 | MO_ALIGN; |
32 | FAIL 1010 010- -01- ---- 000- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+scalar) | 31 | + memop = finalize_memop(s, MO_64 | MO_ALIGN); |
33 | FAIL 1010 010- -010 ---- 001- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+imm) | 32 | tcg_gen_qemu_ld_i64(cpu_exclusive_val, addr, idx, memop); |
34 | FAIL 1100 010- ---- ---- ---- ---- ---- ---- # SVE 64-bit gather load/prefetch | 33 | if (s->be_data == MO_LE) { |
35 | -FAIL 1110 010- -00- ---- 001- ---- ---- ---- # SVE2 64-bit scatter NT store (vector+scalar) | 34 | tcg_gen_extract_i64(cpu_reg(s, rt), cpu_exclusive_val, 0, 32); |
36 | -FAIL 1110 010- -10- ---- 001- ---- ---- ---- # SVE2 32-bit scatter NT store (vector+scalar) | 35 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, |
37 | -FAIL 1110 010- ---- ---- 1-0- ---- ---- ---- # SVE scatter store (scalar+32-bit vector) | 36 | tcg_gen_extract_i64(cpu_reg(s, rt2), cpu_exclusive_val, 0, 32); |
38 | -FAIL 1110 010- ---- ---- 101- ---- ---- ---- # SVE scatter store (misc) | 37 | } |
39 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 38 | } else { |
40 | index XXXXXXX..XXXXXXX 100644 | 39 | - /* The pair must be single-copy atomic for *each* doubleword, not |
41 | --- a/target/arm/translate-sve.c | 40 | - the entire quadword, however it must be quadword aligned. */ |
42 | +++ b/target/arm/translate-sve.c | 41 | - memop |= MO_64; |
43 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1_zprz(DisasContext *s, arg_LD1_zprz *a) | 42 | - tcg_gen_qemu_ld_i64(cpu_exclusive_val, addr, idx, |
44 | if (!dc_isar_feature(aa64_sve, s)) { | 43 | - memop | MO_ALIGN_16); |
45 | return false; | 44 | + /* |
46 | } | 45 | + * The pair must be single-copy atomic for *each* doubleword, not |
47 | + s->is_nonstreaming = true; | 46 | + * the entire quadword, however it must be quadword aligned. |
48 | if (!sve_access_check(s)) { | 47 | + * Expose the complete load to tcg, for ease of tlb lookup, |
49 | return true; | 48 | + * but indicate that only 8-byte atomicity is required. |
50 | } | 49 | + */ |
51 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1_zpiz(DisasContext *s, arg_LD1_zpiz *a) | 50 | + TCGv_i128 t16 = tcg_temp_new_i128(); |
52 | if (!dc_isar_feature(aa64_sve, s)) { | 51 | |
53 | return false; | 52 | - TCGv_i64 addr2 = tcg_temp_new_i64(); |
54 | } | 53 | - tcg_gen_addi_i64(addr2, addr, 8); |
55 | + s->is_nonstreaming = true; | 54 | - tcg_gen_qemu_ld_i64(cpu_exclusive_high, addr2, idx, memop); |
56 | if (!sve_access_check(s)) { | 55 | + memop = finalize_memop_atom(s, MO_128 | MO_ALIGN_16, |
57 | return true; | 56 | + MO_ATOM_IFALIGN_PAIR); |
58 | } | 57 | + tcg_gen_qemu_ld_i128(t16, addr, idx, memop); |
59 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDNT1_zprz(DisasContext *s, arg_LD1_zprz *a) | 58 | |
60 | if (!dc_isar_feature(aa64_sve2, s)) { | 59 | + if (s->be_data == MO_LE) { |
61 | return false; | 60 | + tcg_gen_extr_i128_i64(cpu_exclusive_val, |
62 | } | 61 | + cpu_exclusive_high, t16); |
63 | + s->is_nonstreaming = true; | 62 | + } else { |
64 | if (!sve_access_check(s)) { | 63 | + tcg_gen_extr_i128_i64(cpu_exclusive_high, |
65 | return true; | 64 | + cpu_exclusive_val, t16); |
66 | } | 65 | + } |
67 | @@ -XXX,XX +XXX,XX @@ static bool trans_ST1_zprz(DisasContext *s, arg_ST1_zprz *a) | 66 | tcg_gen_mov_i64(cpu_reg(s, rt), cpu_exclusive_val); |
68 | if (!dc_isar_feature(aa64_sve, s)) { | 67 | tcg_gen_mov_i64(cpu_reg(s, rt2), cpu_exclusive_high); |
69 | return false; | 68 | } |
70 | } | 69 | } else { |
71 | + s->is_nonstreaming = true; | 70 | - memop |= size | MO_ALIGN; |
72 | if (!sve_access_check(s)) { | 71 | + memop = finalize_memop(s, size | MO_ALIGN); |
73 | return true; | 72 | tcg_gen_qemu_ld_i64(cpu_exclusive_val, addr, idx, memop); |
74 | } | 73 | tcg_gen_mov_i64(cpu_reg(s, rt), cpu_exclusive_val); |
75 | @@ -XXX,XX +XXX,XX @@ static bool trans_ST1_zpiz(DisasContext *s, arg_ST1_zpiz *a) | ||
76 | if (!dc_isar_feature(aa64_sve, s)) { | ||
77 | return false; | ||
78 | } | ||
79 | + s->is_nonstreaming = true; | ||
80 | if (!sve_access_check(s)) { | ||
81 | return true; | ||
82 | } | ||
83 | @@ -XXX,XX +XXX,XX @@ static bool trans_STNT1_zprz(DisasContext *s, arg_ST1_zprz *a) | ||
84 | if (!dc_isar_feature(aa64_sve2, s)) { | ||
85 | return false; | ||
86 | } | ||
87 | + s->is_nonstreaming = true; | ||
88 | if (!sve_access_check(s)) { | ||
89 | return true; | ||
90 | } | 74 | } |
91 | -- | 75 | -- |
92 | 2.25.1 | 76 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Add a TCGv_ptr base argument, which will be cpu_env for SVE. | 3 | While we don't require 16-byte atomicity here, using a single larger |
4 | We will reuse this for SME save and restore array insns. | 4 | operation simplifies the code. Introduce finalize_memop_asimd for this. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-22-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-6-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/translate-a64.h | 3 +++ | 11 | target/arm/tcg/translate.h | 24 +++++++++++++++++++++++ |
12 | target/arm/translate-sve.c | 48 ++++++++++++++++++++++++++++---------- | 12 | target/arm/tcg/translate-a64.c | 35 +++++++++++----------------------- |
13 | 2 files changed, 39 insertions(+), 12 deletions(-) | 13 | 2 files changed, 35 insertions(+), 24 deletions(-) |
14 | 14 | ||
15 | diff --git a/target/arm/translate-a64.h b/target/arm/translate-a64.h | 15 | diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h |
16 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate-a64.h | 17 | --- a/target/arm/tcg/translate.h |
18 | +++ b/target/arm/translate-a64.h | 18 | +++ b/target/arm/tcg/translate.h |
19 | @@ -XXX,XX +XXX,XX @@ void gen_gvec_xar(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs, | 19 | @@ -XXX,XX +XXX,XX @@ static inline MemOp finalize_memop_pair(DisasContext *s, MemOp opc) |
20 | uint32_t rm_ofs, int64_t shift, | 20 | return finalize_memop_atom(s, opc, atom); |
21 | uint32_t opr_sz, uint32_t max_sz); | 21 | } |
22 | 22 | ||
23 | +void gen_sve_ldr(DisasContext *s, TCGv_ptr, int vofs, int len, int rn, int imm); | 23 | +/** |
24 | +void gen_sve_str(DisasContext *s, TCGv_ptr, int vofs, int len, int rn, int imm); | 24 | + * finalize_memop_asimd: |
25 | + * @s: DisasContext | ||
26 | + * @opc: size+sign+align of the memory operation | ||
27 | + * | ||
28 | + * Like finalize_memop_atom, but with atomicity of AccessType_ASIMD. | ||
29 | + */ | ||
30 | +static inline MemOp finalize_memop_asimd(DisasContext *s, MemOp opc) | ||
31 | +{ | ||
32 | + /* | ||
33 | + * In the pseudocode for Mem[], with AccessType_ASIMD, size == 16, | ||
34 | + * if IsAligned(8), the first case provides separate atomicity for | ||
35 | + * the pair of 64-bit accesses. If !IsAligned(8), the middle cases | ||
36 | + * do not apply, and we're left with the final case of no atomicity. | ||
37 | + * Thus MO_ATOM_IFALIGN_PAIR. | ||
38 | + * | ||
39 | + * For other sizes, normal LSE2 rules apply. | ||
40 | + */ | ||
41 | + if ((opc & MO_SIZE) == MO_128) { | ||
42 | + return finalize_memop_atom(s, opc, MO_ATOM_IFALIGN_PAIR); | ||
43 | + } | ||
44 | + return finalize_memop(s, opc); | ||
45 | +} | ||
25 | + | 46 | + |
26 | #endif /* TARGET_ARM_TRANSLATE_A64_H */ | 47 | /** |
27 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 48 | * asimd_imm_const: Expand an encoded SIMD constant value |
49 | * | ||
50 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c | ||
28 | index XXXXXXX..XXXXXXX 100644 | 51 | index XXXXXXX..XXXXXXX 100644 |
29 | --- a/target/arm/translate-sve.c | 52 | --- a/target/arm/tcg/translate-a64.c |
30 | +++ b/target/arm/translate-sve.c | 53 | +++ b/target/arm/tcg/translate-a64.c |
31 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(UCVTF_dd, aa64_sve, gen_gvec_fpst_arg_zpz, | 54 | @@ -XXX,XX +XXX,XX @@ static void do_fp_st(DisasContext *s, int srcidx, TCGv_i64 tcg_addr, int size) |
32 | * The load should begin at the address Rn + IMM. | ||
33 | */ | ||
34 | |||
35 | -static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | ||
36 | +void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
37 | + int len, int rn, int imm) | ||
38 | { | 55 | { |
39 | int len_align = QEMU_ALIGN_DOWN(len, 8); | 56 | /* This writes the bottom N bits of a 128 bit wide vector to memory */ |
40 | int len_remain = len % 8; | 57 | TCGv_i64 tmplo = tcg_temp_new_i64(); |
41 | @@ -XXX,XX +XXX,XX @@ static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 58 | - MemOp mop; |
42 | t0 = tcg_temp_new_i64(); | 59 | + MemOp mop = finalize_memop_asimd(s, size); |
43 | for (i = 0; i < len_align; i += 8) { | 60 | |
44 | tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUQ); | 61 | tcg_gen_ld_i64(tmplo, cpu_env, fp_reg_offset(s, srcidx, MO_64)); |
45 | - tcg_gen_st_i64(t0, cpu_env, vofs + i); | 62 | |
46 | + tcg_gen_st_i64(t0, base, vofs + i); | 63 | - if (size < 4) { |
47 | tcg_gen_addi_i64(clean_addr, clean_addr, 8); | 64 | - mop = finalize_memop(s, size); |
48 | } | 65 | + if (size < MO_128) { |
49 | tcg_temp_free_i64(t0); | 66 | tcg_gen_qemu_st_i64(tmplo, tcg_addr, get_mem_index(s), mop); |
50 | @@ -XXX,XX +XXX,XX @@ static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 67 | } else { |
51 | clean_addr = new_tmp_a64_local(s); | 68 | - bool be = s->be_data == MO_BE; |
52 | tcg_gen_mov_i64(clean_addr, t0); | 69 | - TCGv_i64 tcg_hiaddr = tcg_temp_new_i64(); |
53 | 70 | TCGv_i64 tmphi = tcg_temp_new_i64(); | |
54 | + if (base != cpu_env) { | 71 | + TCGv_i128 t16 = tcg_temp_new_i128(); |
55 | + TCGv_ptr b = tcg_temp_local_new_ptr(); | 72 | |
56 | + tcg_gen_mov_ptr(b, base); | 73 | tcg_gen_ld_i64(tmphi, cpu_env, fp_reg_hi_offset(s, srcidx)); |
57 | + base = b; | 74 | + tcg_gen_concat_i64_i128(t16, tmplo, tmphi); |
58 | + } | 75 | |
59 | + | 76 | - mop = s->be_data | MO_UQ; |
60 | gen_set_label(loop); | 77 | - tcg_gen_qemu_st_i64(be ? tmphi : tmplo, tcg_addr, get_mem_index(s), |
61 | 78 | - mop | (s->align_mem ? MO_ALIGN_16 : 0)); | |
62 | t0 = tcg_temp_new_i64(); | 79 | - tcg_gen_addi_i64(tcg_hiaddr, tcg_addr, 8); |
63 | @@ -XXX,XX +XXX,XX @@ static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 80 | - tcg_gen_qemu_st_i64(be ? tmplo : tmphi, tcg_hiaddr, |
64 | tcg_gen_addi_i64(clean_addr, clean_addr, 8); | 81 | - get_mem_index(s), mop); |
65 | 82 | + tcg_gen_qemu_st_i128(t16, tcg_addr, get_mem_index(s), mop); | |
66 | tp = tcg_temp_new_ptr(); | ||
67 | - tcg_gen_add_ptr(tp, cpu_env, i); | ||
68 | + tcg_gen_add_ptr(tp, base, i); | ||
69 | tcg_gen_addi_ptr(i, i, 8); | ||
70 | tcg_gen_st_i64(t0, tp, vofs); | ||
71 | tcg_temp_free_ptr(tp); | ||
72 | @@ -XXX,XX +XXX,XX @@ static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | ||
73 | |||
74 | tcg_gen_brcondi_ptr(TCG_COND_LTU, i, len_align, loop); | ||
75 | tcg_temp_free_ptr(i); | ||
76 | + | ||
77 | + if (base != cpu_env) { | ||
78 | + tcg_temp_free_ptr(base); | ||
79 | + assert(len_remain == 0); | ||
80 | + } | ||
81 | } | ||
82 | |||
83 | /* | ||
84 | @@ -XXX,XX +XXX,XX @@ static void do_ldr(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | ||
85 | default: | ||
86 | g_assert_not_reached(); | ||
87 | } | ||
88 | - tcg_gen_st_i64(t0, cpu_env, vofs + len_align); | ||
89 | + tcg_gen_st_i64(t0, base, vofs + len_align); | ||
90 | tcg_temp_free_i64(t0); | ||
91 | } | 83 | } |
92 | } | 84 | } |
93 | 85 | ||
94 | /* Similarly for stores. */ | 86 | @@ -XXX,XX +XXX,XX @@ static void do_fp_ld(DisasContext *s, int destidx, TCGv_i64 tcg_addr, int size) |
95 | -static void do_str(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 87 | /* This always zero-extends and writes to a full 128 bit wide vector */ |
96 | +void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | 88 | TCGv_i64 tmplo = tcg_temp_new_i64(); |
97 | + int len, int rn, int imm) | 89 | TCGv_i64 tmphi = NULL; |
98 | { | 90 | - MemOp mop; |
99 | int len_align = QEMU_ALIGN_DOWN(len, 8); | 91 | + MemOp mop = finalize_memop_asimd(s, size); |
100 | int len_remain = len % 8; | 92 | |
101 | @@ -XXX,XX +XXX,XX @@ static void do_str(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 93 | - if (size < 4) { |
102 | 94 | - mop = finalize_memop(s, size); | |
103 | t0 = tcg_temp_new_i64(); | 95 | + if (size < MO_128) { |
104 | for (i = 0; i < len_align; i += 8) { | 96 | tcg_gen_qemu_ld_i64(tmplo, tcg_addr, get_mem_index(s), mop); |
105 | - tcg_gen_ld_i64(t0, cpu_env, vofs + i); | 97 | } else { |
106 | + tcg_gen_ld_i64(t0, base, vofs + i); | 98 | - bool be = s->be_data == MO_BE; |
107 | tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUQ); | 99 | - TCGv_i64 tcg_hiaddr; |
108 | tcg_gen_addi_i64(clean_addr, clean_addr, 8); | 100 | + TCGv_i128 t16 = tcg_temp_new_i128(); |
109 | } | ||
110 | @@ -XXX,XX +XXX,XX @@ static void do_str(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | ||
111 | clean_addr = new_tmp_a64_local(s); | ||
112 | tcg_gen_mov_i64(clean_addr, t0); | ||
113 | |||
114 | + if (base != cpu_env) { | ||
115 | + TCGv_ptr b = tcg_temp_local_new_ptr(); | ||
116 | + tcg_gen_mov_ptr(b, base); | ||
117 | + base = b; | ||
118 | + } | ||
119 | + | 101 | + |
120 | gen_set_label(loop); | 102 | + tcg_gen_qemu_ld_i128(t16, tcg_addr, get_mem_index(s), mop); |
121 | 103 | ||
122 | t0 = tcg_temp_new_i64(); | 104 | tmphi = tcg_temp_new_i64(); |
123 | tp = tcg_temp_new_ptr(); | 105 | - tcg_hiaddr = tcg_temp_new_i64(); |
124 | - tcg_gen_add_ptr(tp, cpu_env, i); | 106 | - |
125 | + tcg_gen_add_ptr(tp, base, i); | 107 | - mop = s->be_data | MO_UQ; |
126 | tcg_gen_ld_i64(t0, tp, vofs); | 108 | - tcg_gen_qemu_ld_i64(be ? tmphi : tmplo, tcg_addr, get_mem_index(s), |
127 | tcg_gen_addi_ptr(i, i, 8); | 109 | - mop | (s->align_mem ? MO_ALIGN_16 : 0)); |
128 | tcg_temp_free_ptr(tp); | 110 | - tcg_gen_addi_i64(tcg_hiaddr, tcg_addr, 8); |
129 | @@ -XXX,XX +XXX,XX @@ static void do_str(DisasContext *s, uint32_t vofs, int len, int rn, int imm) | 111 | - tcg_gen_qemu_ld_i64(be ? tmplo : tmphi, tcg_hiaddr, |
130 | 112 | - get_mem_index(s), mop); | |
131 | tcg_gen_brcondi_ptr(TCG_COND_LTU, i, len_align, loop); | 113 | + tcg_gen_extr_i128_i64(tmplo, tmphi, t16); |
132 | tcg_temp_free_ptr(i); | ||
133 | + | ||
134 | + if (base != cpu_env) { | ||
135 | + tcg_temp_free_ptr(base); | ||
136 | + assert(len_remain == 0); | ||
137 | + } | ||
138 | } | 114 | } |
139 | 115 | ||
140 | /* Predicate register stores can be any multiple of 2. */ | 116 | tcg_gen_st_i64(tmplo, cpu_env, fp_reg_offset(s, destidx, MO_64)); |
141 | if (len_remain) { | ||
142 | t0 = tcg_temp_new_i64(); | ||
143 | - tcg_gen_ld_i64(t0, cpu_env, vofs + len_align); | ||
144 | + tcg_gen_ld_i64(t0, base, vofs + len_align); | ||
145 | |||
146 | switch (len_remain) { | ||
147 | case 2: | ||
148 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDR_zri(DisasContext *s, arg_rri *a) | ||
149 | if (sve_access_check(s)) { | ||
150 | int size = vec_full_reg_size(s); | ||
151 | int off = vec_full_reg_offset(s, a->rd); | ||
152 | - do_ldr(s, off, size, a->rn, a->imm * size); | ||
153 | + gen_sve_ldr(s, cpu_env, off, size, a->rn, a->imm * size); | ||
154 | } | ||
155 | return true; | ||
156 | } | ||
157 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDR_pri(DisasContext *s, arg_rri *a) | ||
158 | if (sve_access_check(s)) { | ||
159 | int size = pred_full_reg_size(s); | ||
160 | int off = pred_full_reg_offset(s, a->rd); | ||
161 | - do_ldr(s, off, size, a->rn, a->imm * size); | ||
162 | + gen_sve_ldr(s, cpu_env, off, size, a->rn, a->imm * size); | ||
163 | } | ||
164 | return true; | ||
165 | } | ||
166 | @@ -XXX,XX +XXX,XX @@ static bool trans_STR_zri(DisasContext *s, arg_rri *a) | ||
167 | if (sve_access_check(s)) { | ||
168 | int size = vec_full_reg_size(s); | ||
169 | int off = vec_full_reg_offset(s, a->rd); | ||
170 | - do_str(s, off, size, a->rn, a->imm * size); | ||
171 | + gen_sve_str(s, cpu_env, off, size, a->rn, a->imm * size); | ||
172 | } | ||
173 | return true; | ||
174 | } | ||
175 | @@ -XXX,XX +XXX,XX @@ static bool trans_STR_pri(DisasContext *s, arg_rri *a) | ||
176 | if (sve_access_check(s)) { | ||
177 | int size = pred_full_reg_size(s); | ||
178 | int off = pred_full_reg_offset(s, a->rd); | ||
179 | - do_str(s, off, size, a->rn, a->imm * size); | ||
180 | + gen_sve_str(s, cpu_env, off, size, a->rn, a->imm * size); | ||
181 | } | ||
182 | return true; | ||
183 | } | ||
184 | -- | 117 | -- |
185 | 2.25.1 | 118 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | This fixes a bug in that these two insns should have been using atomic |
4 | if full a64 support is not enabled in streaming mode. | 4 | 16-byte stores, since MTE is ARMv8.5 and LSE2 is mandatory from ARMv8.4. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-14-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-7-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme-fa64.decode | 2 -- | 11 | target/arm/tcg/translate-a64.c | 17 ++++++++++------- |
12 | target/arm/translate-sve.c | 2 ++ | 12 | 1 file changed, 10 insertions(+), 7 deletions(-) |
13 | 2 files changed, 2 insertions(+), 2 deletions(-) | ||
14 | 13 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 14 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 16 | --- a/target/arm/tcg/translate-a64.c |
18 | +++ b/target/arm/sme-fa64.decode | 17 | +++ b/target/arm/tcg/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 18 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_tag(DisasContext *s, uint32_t insn) |
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 19 | |
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 20 | if (is_zero) { |
22 | 21 | TCGv_i64 clean_addr = clean_data_tbi(s, addr); | |
23 | -FAIL 1010 010- ---- ---- 011- ---- ---- ---- # SVE contiguous FF load (scalar+scalar) | 22 | - TCGv_i64 tcg_zero = tcg_constant_i64(0); |
24 | -FAIL 1010 010- ---1 ---- 101- ---- ---- ---- # SVE contiguous NF load (scalar+imm) | 23 | + TCGv_i64 zero64 = tcg_constant_i64(0); |
25 | FAIL 1010 010- -01- ---- 000- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+scalar) | 24 | + TCGv_i128 zero128 = tcg_temp_new_i128(); |
26 | FAIL 1010 010- -010 ---- 001- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+imm) | 25 | int mem_index = get_mem_index(s); |
27 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 26 | - int i, n = (1 + is_pair) << LOG2_TAG_GRANULE; |
28 | index XXXXXXX..XXXXXXX 100644 | 27 | + MemOp mop = finalize_memop(s, MO_128 | MO_ALIGN); |
29 | --- a/target/arm/translate-sve.c | 28 | |
30 | +++ b/target/arm/translate-sve.c | 29 | - tcg_gen_qemu_st_i64(tcg_zero, clean_addr, mem_index, |
31 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDFF1_zprr(DisasContext *s, arg_rprr_load *a) | 30 | - MO_UQ | MO_ALIGN_16); |
32 | if (!dc_isar_feature(aa64_sve, s)) { | 31 | - for (i = 8; i < n; i += 8) { |
33 | return false; | 32 | - tcg_gen_addi_i64(clean_addr, clean_addr, 8); |
33 | - tcg_gen_qemu_st_i64(tcg_zero, clean_addr, mem_index, MO_UQ); | ||
34 | + tcg_gen_concat_i64_i128(zero128, zero64, zero64); | ||
35 | + | ||
36 | + /* This is 1 or 2 atomic 16-byte operations. */ | ||
37 | + tcg_gen_qemu_st_i128(zero128, clean_addr, mem_index, mop); | ||
38 | + if (is_pair) { | ||
39 | + tcg_gen_addi_i64(clean_addr, clean_addr, 16); | ||
40 | + tcg_gen_qemu_st_i128(zero128, clean_addr, mem_index, mop); | ||
41 | } | ||
34 | } | 42 | } |
35 | + s->is_nonstreaming = true; | 43 | |
36 | if (sve_access_check(s)) { | ||
37 | TCGv_i64 addr = new_tmp_a64(s); | ||
38 | tcg_gen_shli_i64(addr, cpu_reg(s, a->rm), dtype_msz(a->dtype)); | ||
39 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDNF1_zpri(DisasContext *s, arg_rpri_load *a) | ||
40 | if (!dc_isar_feature(aa64_sve, s)) { | ||
41 | return false; | ||
42 | } | ||
43 | + s->is_nonstreaming = true; | ||
44 | if (sve_access_check(s)) { | ||
45 | int vsz = vec_full_reg_size(s); | ||
46 | int elements = vsz >> dtype_esz[a->dtype]; | ||
47 | -- | 44 | -- |
48 | 2.25.1 | 45 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | |||
3 | Round len_align to 16 instead of 8, handling an odd 8-byte as part | ||
4 | of the tail. Use MO_ATOM_NONE to indicate that all of these memory | ||
5 | ops have only byte atomicity. | ||
2 | 6 | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20220708151540.18136-39-richard.henderson@linaro.org | 9 | Message-id: 20230530191438.411344-8-richard.henderson@linaro.org |
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 11 | --- |
8 | linux-user/aarch64/signal.c | 3 +++ | 12 | target/arm/tcg/translate-sve.c | 95 +++++++++++++++++++++++++--------- |
9 | 1 file changed, 3 insertions(+) | 13 | 1 file changed, 70 insertions(+), 25 deletions(-) |
10 | 14 | ||
11 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 15 | diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c |
12 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/linux-user/aarch64/signal.c | 17 | --- a/target/arm/tcg/translate-sve.c |
14 | +++ b/linux-user/aarch64/signal.c | 18 | +++ b/target/arm/tcg/translate-sve.c |
15 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 19 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(UCVTF_dd, aa64_sve, gen_gvec_fpst_arg_zpz, |
16 | __get_user(extra_size, | 20 | void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, |
17 | &((struct target_extra_context *)ctx)->size); | 21 | int len, int rn, int imm) |
18 | extra = lock_user(VERIFY_READ, extra_datap, extra_size, 0); | 22 | { |
19 | + if (!extra) { | 23 | - int len_align = QEMU_ALIGN_DOWN(len, 8); |
20 | + return 1; | 24 | - int len_remain = len % 8; |
21 | + } | 25 | - int nparts = len / 8 + ctpop8(len_remain); |
22 | break; | 26 | + int len_align = QEMU_ALIGN_DOWN(len, 16); |
27 | + int len_remain = len % 16; | ||
28 | + int nparts = len / 16 + ctpop8(len_remain); | ||
29 | int midx = get_mem_index(s); | ||
30 | TCGv_i64 dirty_addr, clean_addr, t0, t1; | ||
31 | + TCGv_i128 t16; | ||
32 | |||
33 | dirty_addr = tcg_temp_new_i64(); | ||
34 | tcg_gen_addi_i64(dirty_addr, cpu_reg_sp(s, rn), imm); | ||
35 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
36 | int i; | ||
37 | |||
38 | t0 = tcg_temp_new_i64(); | ||
39 | - for (i = 0; i < len_align; i += 8) { | ||
40 | - tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUQ); | ||
41 | + t1 = tcg_temp_new_i64(); | ||
42 | + t16 = tcg_temp_new_i128(); | ||
43 | + | ||
44 | + for (i = 0; i < len_align; i += 16) { | ||
45 | + tcg_gen_qemu_ld_i128(t16, clean_addr, midx, | ||
46 | + MO_LE | MO_128 | MO_ATOM_NONE); | ||
47 | + tcg_gen_extr_i128_i64(t0, t1, t16); | ||
48 | tcg_gen_st_i64(t0, base, vofs + i); | ||
49 | - tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
50 | + tcg_gen_st_i64(t1, base, vofs + i + 8); | ||
51 | + tcg_gen_addi_i64(clean_addr, clean_addr, 16); | ||
52 | } | ||
53 | } else { | ||
54 | TCGLabel *loop = gen_new_label(); | ||
55 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
56 | tcg_gen_movi_ptr(i, 0); | ||
57 | gen_set_label(loop); | ||
58 | |||
59 | - t0 = tcg_temp_new_i64(); | ||
60 | - tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUQ); | ||
61 | - tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
62 | + t16 = tcg_temp_new_i128(); | ||
63 | + tcg_gen_qemu_ld_i128(t16, clean_addr, midx, | ||
64 | + MO_LE | MO_128 | MO_ATOM_NONE); | ||
65 | + tcg_gen_addi_i64(clean_addr, clean_addr, 16); | ||
66 | |||
67 | tp = tcg_temp_new_ptr(); | ||
68 | tcg_gen_add_ptr(tp, base, i); | ||
69 | - tcg_gen_addi_ptr(i, i, 8); | ||
70 | + tcg_gen_addi_ptr(i, i, 16); | ||
71 | + | ||
72 | + t0 = tcg_temp_new_i64(); | ||
73 | + t1 = tcg_temp_new_i64(); | ||
74 | + tcg_gen_extr_i128_i64(t0, t1, t16); | ||
75 | + | ||
76 | tcg_gen_st_i64(t0, tp, vofs); | ||
77 | + tcg_gen_st_i64(t1, tp, vofs + 8); | ||
78 | |||
79 | tcg_gen_brcondi_ptr(TCG_COND_LTU, i, len_align, loop); | ||
80 | } | ||
81 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
82 | * Predicate register loads can be any multiple of 2. | ||
83 | * Note that we still store the entire 64-bit unit into cpu_env. | ||
84 | */ | ||
85 | + if (len_remain >= 8) { | ||
86 | + t0 = tcg_temp_new_i64(); | ||
87 | + tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUQ | MO_ATOM_NONE); | ||
88 | + tcg_gen_st_i64(t0, base, vofs + len_align); | ||
89 | + len_remain -= 8; | ||
90 | + len_align += 8; | ||
91 | + if (len_remain) { | ||
92 | + tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
93 | + } | ||
94 | + } | ||
95 | if (len_remain) { | ||
96 | t0 = tcg_temp_new_i64(); | ||
97 | switch (len_remain) { | ||
98 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
99 | case 4: | ||
100 | case 8: | ||
101 | tcg_gen_qemu_ld_i64(t0, clean_addr, midx, | ||
102 | - MO_LE | ctz32(len_remain)); | ||
103 | + MO_LE | ctz32(len_remain) | MO_ATOM_NONE); | ||
104 | break; | ||
105 | |||
106 | case 6: | ||
107 | t1 = tcg_temp_new_i64(); | ||
108 | - tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUL); | ||
109 | + tcg_gen_qemu_ld_i64(t0, clean_addr, midx, MO_LEUL | MO_ATOM_NONE); | ||
110 | tcg_gen_addi_i64(clean_addr, clean_addr, 4); | ||
111 | - tcg_gen_qemu_ld_i64(t1, clean_addr, midx, MO_LEUW); | ||
112 | + tcg_gen_qemu_ld_i64(t1, clean_addr, midx, MO_LEUW | MO_ATOM_NONE); | ||
113 | tcg_gen_deposit_i64(t0, t0, t1, 32, 32); | ||
114 | break; | ||
115 | |||
116 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
117 | void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | ||
118 | int len, int rn, int imm) | ||
119 | { | ||
120 | - int len_align = QEMU_ALIGN_DOWN(len, 8); | ||
121 | - int len_remain = len % 8; | ||
122 | - int nparts = len / 8 + ctpop8(len_remain); | ||
123 | + int len_align = QEMU_ALIGN_DOWN(len, 16); | ||
124 | + int len_remain = len % 16; | ||
125 | + int nparts = len / 16 + ctpop8(len_remain); | ||
126 | int midx = get_mem_index(s); | ||
127 | - TCGv_i64 dirty_addr, clean_addr, t0; | ||
128 | + TCGv_i64 dirty_addr, clean_addr, t0, t1; | ||
129 | + TCGv_i128 t16; | ||
130 | |||
131 | dirty_addr = tcg_temp_new_i64(); | ||
132 | tcg_gen_addi_i64(dirty_addr, cpu_reg_sp(s, rn), imm); | ||
133 | @@ -XXX,XX +XXX,XX @@ void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | ||
134 | int i; | ||
135 | |||
136 | t0 = tcg_temp_new_i64(); | ||
137 | + t1 = tcg_temp_new_i64(); | ||
138 | + t16 = tcg_temp_new_i128(); | ||
139 | for (i = 0; i < len_align; i += 8) { | ||
140 | tcg_gen_ld_i64(t0, base, vofs + i); | ||
141 | - tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUQ); | ||
142 | - tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
143 | + tcg_gen_ld_i64(t1, base, vofs + i + 8); | ||
144 | + tcg_gen_concat_i64_i128(t16, t0, t1); | ||
145 | + tcg_gen_qemu_st_i128(t16, clean_addr, midx, | ||
146 | + MO_LE | MO_128 | MO_ATOM_NONE); | ||
147 | + tcg_gen_addi_i64(clean_addr, clean_addr, 16); | ||
148 | } | ||
149 | } else { | ||
150 | TCGLabel *loop = gen_new_label(); | ||
151 | @@ -XXX,XX +XXX,XX @@ void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | ||
152 | gen_set_label(loop); | ||
153 | |||
154 | t0 = tcg_temp_new_i64(); | ||
155 | + t1 = tcg_temp_new_i64(); | ||
156 | tp = tcg_temp_new_ptr(); | ||
157 | tcg_gen_add_ptr(tp, base, i); | ||
158 | tcg_gen_ld_i64(t0, tp, vofs); | ||
159 | - tcg_gen_addi_ptr(i, i, 8); | ||
160 | + tcg_gen_ld_i64(t1, tp, vofs + 8); | ||
161 | + tcg_gen_addi_ptr(i, i, 16); | ||
162 | |||
163 | - tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUQ); | ||
164 | - tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
165 | + t16 = tcg_temp_new_i128(); | ||
166 | + tcg_gen_concat_i64_i128(t16, t0, t1); | ||
167 | + | ||
168 | + tcg_gen_qemu_st_i128(t16, clean_addr, midx, MO_LEUQ); | ||
169 | + tcg_gen_addi_i64(clean_addr, clean_addr, 16); | ||
170 | |||
171 | tcg_gen_brcondi_ptr(TCG_COND_LTU, i, len_align, loop); | ||
172 | } | ||
173 | |||
174 | /* Predicate register stores can be any multiple of 2. */ | ||
175 | + if (len_remain >= 8) { | ||
176 | + t0 = tcg_temp_new_i64(); | ||
177 | + tcg_gen_st_i64(t0, base, vofs + len_align); | ||
178 | + tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUQ | MO_ATOM_NONE); | ||
179 | + len_remain -= 8; | ||
180 | + len_align += 8; | ||
181 | + if (len_remain) { | ||
182 | + tcg_gen_addi_i64(clean_addr, clean_addr, 8); | ||
183 | + } | ||
184 | + } | ||
185 | if (len_remain) { | ||
186 | t0 = tcg_temp_new_i64(); | ||
187 | tcg_gen_ld_i64(t0, base, vofs + len_align); | ||
188 | @@ -XXX,XX +XXX,XX @@ void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | ||
189 | case 4: | ||
190 | case 8: | ||
191 | tcg_gen_qemu_st_i64(t0, clean_addr, midx, | ||
192 | - MO_LE | ctz32(len_remain)); | ||
193 | + MO_LE | ctz32(len_remain) | MO_ATOM_NONE); | ||
194 | break; | ||
195 | |||
196 | case 6: | ||
197 | - tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUL); | ||
198 | + tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUL | MO_ATOM_NONE); | ||
199 | tcg_gen_addi_i64(clean_addr, clean_addr, 4); | ||
200 | tcg_gen_shri_i64(t0, t0, 32); | ||
201 | - tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUW); | ||
202 | + tcg_gen_qemu_st_i64(t0, clean_addr, midx, MO_LEUW | MO_ATOM_NONE); | ||
203 | break; | ||
23 | 204 | ||
24 | default: | 205 | default: |
25 | -- | 206 | -- |
26 | 2.25.1 | 207 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | No need to duplicate this check across multiple call sites. |
4 | if full a64 support is not enabled in streaming mode. | ||
5 | 4 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-6-richard.henderson@linaro.org | 7 | Message-id: 20230530191438.411344-9-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 9 | --- |
11 | target/arm/sme-fa64.decode | 2 -- | 10 | target/arm/tcg/translate-a64.c | 44 ++++++++++++++++------------------ |
12 | target/arm/translate-sve.c | 9 ++++++--- | 11 | 1 file changed, 21 insertions(+), 23 deletions(-) |
13 | 2 files changed, 6 insertions(+), 5 deletions(-) | ||
14 | 12 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 13 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 15 | --- a/target/arm/tcg/translate-a64.c |
18 | +++ b/target/arm/sme-fa64.decode | 16 | +++ b/target/arm/tcg/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 17 | @@ -XXX,XX +XXX,XX @@ static void disas_b_exc_sys(DisasContext *s, uint32_t insn) |
20 | 18 | * races in multi-threaded linux-user and when MTTCG softmmu is | |
21 | FAIL 0000 0100 --1- ---- 1011 -0-- ---- ---- # FTSSEL, FEXPA | 19 | * enabled. |
22 | FAIL 0000 0101 --10 0001 100- ---- ---- ---- # COMPACT | 20 | */ |
23 | -FAIL 0010 0101 --01 100- 1111 000- ---0 ---- # RDFFR, RDFFRS | 21 | -static void gen_load_exclusive(DisasContext *s, int rt, int rt2, |
24 | -FAIL 0010 0101 --10 1--- 1001 ---- ---- ---- # WRFFR, SETFFR | 22 | - TCGv_i64 addr, int size, bool is_pair) |
25 | FAIL 0100 0101 --0- ---- 1011 ---- ---- ---- # BDEP, BEXT, BGRP | 23 | +static void gen_load_exclusive(DisasContext *s, int rt, int rt2, int rn, |
26 | FAIL 0100 0101 000- ---- 0110 1--- ---- ---- # PMULLB, PMULLT (128b result) | 24 | + int size, bool is_pair) |
27 | FAIL 0110 0100 --1- ---- 1110 01-- ---- ---- # FMMLA, BFMMLA | 25 | { |
28 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 26 | int idx = get_mem_index(s); |
29 | index XXXXXXX..XXXXXXX 100644 | 27 | MemOp memop; |
30 | --- a/target/arm/translate-sve.c | 28 | + TCGv_i64 dirty_addr, clean_addr; |
31 | +++ b/target/arm/translate-sve.c | ||
32 | @@ -XXX,XX +XXX,XX @@ static bool do_predset(DisasContext *s, int esz, int rd, int pat, bool setflag) | ||
33 | TRANS_FEAT(PTRUE, aa64_sve, do_predset, a->esz, a->rd, a->pat, a->s) | ||
34 | |||
35 | /* Note pat == 31 is #all, to set all elements. */ | ||
36 | -TRANS_FEAT(SETFFR, aa64_sve, do_predset, 0, FFR_PRED_NUM, 31, false) | ||
37 | +TRANS_FEAT_NONSTREAMING(SETFFR, aa64_sve, | ||
38 | + do_predset, 0, FFR_PRED_NUM, 31, false) | ||
39 | |||
40 | /* Note pat == 32 is #unimp, to set no elements. */ | ||
41 | TRANS_FEAT(PFALSE, aa64_sve, do_predset, 0, a->rd, 32, false) | ||
42 | @@ -XXX,XX +XXX,XX @@ static bool trans_RDFFR_p(DisasContext *s, arg_RDFFR_p *a) | ||
43 | .rd = a->rd, .pg = a->pg, .s = a->s, | ||
44 | .rn = FFR_PRED_NUM, .rm = FFR_PRED_NUM, | ||
45 | }; | ||
46 | + | 29 | + |
47 | + s->is_nonstreaming = true; | 30 | + s->is_ldex = true; |
48 | return trans_AND_pppp(s, &alt_a); | 31 | + dirty_addr = cpu_reg_sp(s, rn); |
32 | + clean_addr = gen_mte_check1(s, dirty_addr, false, rn != 31, size); | ||
33 | |||
34 | g_assert(size <= 3); | ||
35 | if (is_pair) { | ||
36 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, | ||
37 | if (size == 2) { | ||
38 | /* The pair must be single-copy atomic for the doubleword. */ | ||
39 | memop = finalize_memop(s, MO_64 | MO_ALIGN); | ||
40 | - tcg_gen_qemu_ld_i64(cpu_exclusive_val, addr, idx, memop); | ||
41 | + tcg_gen_qemu_ld_i64(cpu_exclusive_val, clean_addr, idx, memop); | ||
42 | if (s->be_data == MO_LE) { | ||
43 | tcg_gen_extract_i64(cpu_reg(s, rt), cpu_exclusive_val, 0, 32); | ||
44 | tcg_gen_extract_i64(cpu_reg(s, rt2), cpu_exclusive_val, 32, 32); | ||
45 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, | ||
46 | |||
47 | memop = finalize_memop_atom(s, MO_128 | MO_ALIGN_16, | ||
48 | MO_ATOM_IFALIGN_PAIR); | ||
49 | - tcg_gen_qemu_ld_i128(t16, addr, idx, memop); | ||
50 | + tcg_gen_qemu_ld_i128(t16, clean_addr, idx, memop); | ||
51 | |||
52 | if (s->be_data == MO_LE) { | ||
53 | tcg_gen_extr_i128_i64(cpu_exclusive_val, | ||
54 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, | ||
55 | } | ||
56 | } else { | ||
57 | memop = finalize_memop(s, size | MO_ALIGN); | ||
58 | - tcg_gen_qemu_ld_i64(cpu_exclusive_val, addr, idx, memop); | ||
59 | + tcg_gen_qemu_ld_i64(cpu_exclusive_val, clean_addr, idx, memop); | ||
60 | tcg_gen_mov_i64(cpu_reg(s, rt), cpu_exclusive_val); | ||
61 | } | ||
62 | - tcg_gen_mov_i64(cpu_exclusive_addr, addr); | ||
63 | + tcg_gen_mov_i64(cpu_exclusive_addr, clean_addr); | ||
49 | } | 64 | } |
50 | 65 | ||
51 | -TRANS_FEAT(RDFFR, aa64_sve, do_mov_p, a->rd, FFR_PRED_NUM) | 66 | static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, |
52 | -TRANS_FEAT(WRFFR, aa64_sve, do_mov_p, FFR_PRED_NUM, a->rn) | 67 | - TCGv_i64 addr, int size, int is_pair) |
53 | +TRANS_FEAT_NONSTREAMING(RDFFR, aa64_sve, do_mov_p, a->rd, FFR_PRED_NUM) | 68 | + int rn, int size, int is_pair) |
54 | +TRANS_FEAT_NONSTREAMING(WRFFR, aa64_sve, do_mov_p, FFR_PRED_NUM, a->rn) | 69 | { |
55 | 70 | /* if (env->exclusive_addr == addr && env->exclusive_val == [addr] | |
56 | static bool do_pfirst_pnext(DisasContext *s, arg_rr_esz *a, | 71 | * && (!is_pair || env->exclusive_high == [addr + datasize])) { |
57 | void (*gen_fn)(TCGv_i32, TCGv_ptr, | 72 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, |
73 | */ | ||
74 | TCGLabel *fail_label = gen_new_label(); | ||
75 | TCGLabel *done_label = gen_new_label(); | ||
76 | - TCGv_i64 tmp; | ||
77 | + TCGv_i64 tmp, dirty_addr, clean_addr; | ||
78 | |||
79 | - tcg_gen_brcond_i64(TCG_COND_NE, addr, cpu_exclusive_addr, fail_label); | ||
80 | + dirty_addr = cpu_reg_sp(s, rn); | ||
81 | + clean_addr = gen_mte_check1(s, dirty_addr, true, rn != 31, size); | ||
82 | + | ||
83 | + tcg_gen_brcond_i64(TCG_COND_NE, clean_addr, cpu_exclusive_addr, fail_label); | ||
84 | |||
85 | tmp = tcg_temp_new_i64(); | ||
86 | if (is_pair) { | ||
87 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
88 | if (is_lasr) { | ||
89 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_STRL); | ||
90 | } | ||
91 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
92 | - true, rn != 31, size); | ||
93 | - gen_store_exclusive(s, rs, rt, rt2, clean_addr, size, false); | ||
94 | + gen_store_exclusive(s, rs, rt, rt2, rn, size, false); | ||
95 | return; | ||
96 | |||
97 | case 0x4: /* LDXR */ | ||
98 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
99 | if (rn == 31) { | ||
100 | gen_check_sp_alignment(s); | ||
101 | } | ||
102 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
103 | - false, rn != 31, size); | ||
104 | - s->is_ldex = true; | ||
105 | - gen_load_exclusive(s, rt, rt2, clean_addr, size, false); | ||
106 | + gen_load_exclusive(s, rt, rt2, rn, size, false); | ||
107 | if (is_lasr) { | ||
108 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_LDAQ); | ||
109 | } | ||
110 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
111 | if (is_lasr) { | ||
112 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_STRL); | ||
113 | } | ||
114 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
115 | - true, rn != 31, size); | ||
116 | - gen_store_exclusive(s, rs, rt, rt2, clean_addr, size, true); | ||
117 | + gen_store_exclusive(s, rs, rt, rt2, rn, size, true); | ||
118 | return; | ||
119 | } | ||
120 | if (rt2 == 31 | ||
121 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
122 | if (rn == 31) { | ||
123 | gen_check_sp_alignment(s); | ||
124 | } | ||
125 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
126 | - false, rn != 31, size); | ||
127 | - s->is_ldex = true; | ||
128 | - gen_load_exclusive(s, rt, rt2, clean_addr, size, true); | ||
129 | + gen_load_exclusive(s, rt, rt2, rn, size, true); | ||
130 | if (is_lasr) { | ||
131 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_LDAQ); | ||
132 | } | ||
58 | -- | 133 | -- |
59 | 2.25.1 | 134 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | These prctl set the Streaming SVE vector length, which may | 3 | This is required for LSE2, where the pair must be treated atomically if |
4 | be completely different from the Normal SVE vector length. | 4 | it does not cross a 16-byte boundary. But it simplifies the code to do |
5 | this always. | ||
5 | 6 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-43-richard.henderson@linaro.org | 9 | Message-id: 20230530191438.411344-10-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | linux-user/aarch64/target_prctl.h | 54 +++++++++++++++++++++++++++++++ | 12 | target/arm/tcg/translate-a64.c | 70 ++++++++++++++++++++++++++-------- |
12 | linux-user/syscall.c | 16 +++++++++ | 13 | 1 file changed, 55 insertions(+), 15 deletions(-) |
13 | 2 files changed, 70 insertions(+) | ||
14 | 14 | ||
15 | diff --git a/linux-user/aarch64/target_prctl.h b/linux-user/aarch64/target_prctl.h | 15 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/linux-user/aarch64/target_prctl.h | 17 | --- a/target/arm/tcg/translate-a64.c |
18 | +++ b/linux-user/aarch64/target_prctl.h | 18 | +++ b/target/arm/tcg/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_sve_get_vl(CPUArchState *env) | 19 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) |
20 | { | 20 | } else { |
21 | ARMCPU *cpu = env_archcpu(env); | 21 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
22 | if (cpu_isar_feature(aa64_sve, cpu)) { | 22 | TCGv_i64 tcg_rt2 = cpu_reg(s, rt2); |
23 | + /* PSTATE.SM is always unset on syscall entry. */ | 23 | + MemOp mop = size + 1; |
24 | return sve_vq(env) * 16; | ||
25 | } | ||
26 | return -TARGET_EINVAL; | ||
27 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_sve_set_vl(CPUArchState *env, abi_long arg2) | ||
28 | && arg2 >= 0 && arg2 <= 512 * 16 && !(arg2 & 15)) { | ||
29 | uint32_t vq, old_vq; | ||
30 | |||
31 | + /* PSTATE.SM is always unset on syscall entry. */ | ||
32 | old_vq = sve_vq(env); | ||
33 | |||
34 | /* | ||
35 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_sve_set_vl(CPUArchState *env, abi_long arg2) | ||
36 | } | ||
37 | #define do_prctl_sve_set_vl do_prctl_sve_set_vl | ||
38 | |||
39 | +static abi_long do_prctl_sme_get_vl(CPUArchState *env) | ||
40 | +{ | ||
41 | + ARMCPU *cpu = env_archcpu(env); | ||
42 | + if (cpu_isar_feature(aa64_sme, cpu)) { | ||
43 | + return sme_vq(env) * 16; | ||
44 | + } | ||
45 | + return -TARGET_EINVAL; | ||
46 | +} | ||
47 | +#define do_prctl_sme_get_vl do_prctl_sme_get_vl | ||
48 | + | ||
49 | +static abi_long do_prctl_sme_set_vl(CPUArchState *env, abi_long arg2) | ||
50 | +{ | ||
51 | + /* | ||
52 | + * We cannot support either PR_SME_SET_VL_ONEXEC or PR_SME_VL_INHERIT. | ||
53 | + * Note the kernel definition of sve_vl_valid allows for VQ=512, | ||
54 | + * i.e. VL=8192, even though the architectural maximum is VQ=16. | ||
55 | + */ | ||
56 | + if (cpu_isar_feature(aa64_sme, env_archcpu(env)) | ||
57 | + && arg2 >= 0 && arg2 <= 512 * 16 && !(arg2 & 15)) { | ||
58 | + int vq, old_vq; | ||
59 | + | ||
60 | + old_vq = sme_vq(env); | ||
61 | + | 24 | + |
62 | + /* | 25 | + /* |
63 | + * Bound the value of vq, so that we know that it fits into | 26 | + * With LSE2, non-sign-extending pairs are treated atomically if |
64 | + * the 4-bit field in SMCR_EL1. Because PSTATE.SM is cleared | 27 | + * aligned, and if unaligned one of the pair will be completely |
65 | + * on syscall entry, we are not modifying the current SVE | 28 | + * within a 16-byte block and that element will be atomic. |
66 | + * vector length. | 29 | + * Otherwise each element is separately atomic. |
30 | + * In all cases, issue one operation with the correct atomicity. | ||
31 | + * | ||
32 | + * This treats sign-extending loads like zero-extending loads, | ||
33 | + * since that reuses the most code below. | ||
67 | + */ | 34 | + */ |
68 | + vq = MAX(arg2 / 16, 1); | 35 | + if (s->align_mem) { |
69 | + vq = MIN(vq, 16); | 36 | + mop |= (size == 2 ? MO_ALIGN_4 : MO_ALIGN_8); |
70 | + env->vfp.smcr_el[1] = | 37 | + } |
71 | + FIELD_DP64(env->vfp.smcr_el[1], SMCR, LEN, vq - 1); | 38 | + mop = finalize_memop_pair(s, mop); |
39 | |||
40 | if (is_load) { | ||
41 | - TCGv_i64 tmp = tcg_temp_new_i64(); | ||
42 | + if (size == 2) { | ||
43 | + int o2 = s->be_data == MO_LE ? 32 : 0; | ||
44 | + int o1 = o2 ^ 32; | ||
45 | |||
46 | - /* Do not modify tcg_rt before recognizing any exception | ||
47 | - * from the second load. | ||
48 | - */ | ||
49 | - do_gpr_ld(s, tmp, clean_addr, size + is_signed * MO_SIGN, | ||
50 | - false, false, 0, false, false); | ||
51 | - tcg_gen_addi_i64(clean_addr, clean_addr, 1 << size); | ||
52 | - do_gpr_ld(s, tcg_rt2, clean_addr, size + is_signed * MO_SIGN, | ||
53 | - false, false, 0, false, false); | ||
54 | + tcg_gen_qemu_ld_i64(tcg_rt, clean_addr, get_mem_index(s), mop); | ||
55 | + if (is_signed) { | ||
56 | + tcg_gen_sextract_i64(tcg_rt2, tcg_rt, o2, 32); | ||
57 | + tcg_gen_sextract_i64(tcg_rt, tcg_rt, o1, 32); | ||
58 | + } else { | ||
59 | + tcg_gen_extract_i64(tcg_rt2, tcg_rt, o2, 32); | ||
60 | + tcg_gen_extract_i64(tcg_rt, tcg_rt, o1, 32); | ||
61 | + } | ||
62 | + } else { | ||
63 | + TCGv_i128 tmp = tcg_temp_new_i128(); | ||
64 | |||
65 | - tcg_gen_mov_i64(tcg_rt, tmp); | ||
66 | + tcg_gen_qemu_ld_i128(tmp, clean_addr, get_mem_index(s), mop); | ||
67 | + if (s->be_data == MO_LE) { | ||
68 | + tcg_gen_extr_i128_i64(tcg_rt, tcg_rt2, tmp); | ||
69 | + } else { | ||
70 | + tcg_gen_extr_i128_i64(tcg_rt2, tcg_rt, tmp); | ||
71 | + } | ||
72 | + } | ||
73 | } else { | ||
74 | - do_gpr_st(s, tcg_rt, clean_addr, size, | ||
75 | - false, 0, false, false); | ||
76 | - tcg_gen_addi_i64(clean_addr, clean_addr, 1 << size); | ||
77 | - do_gpr_st(s, tcg_rt2, clean_addr, size, | ||
78 | - false, 0, false, false); | ||
79 | + if (size == 2) { | ||
80 | + TCGv_i64 tmp = tcg_temp_new_i64(); | ||
72 | + | 81 | + |
73 | + /* Delay rebuilding hflags until we know if ZA must change. */ | 82 | + if (s->be_data == MO_LE) { |
74 | + vq = sve_vqm1_for_el_sm(env, 0, true) + 1; | 83 | + tcg_gen_concat32_i64(tmp, tcg_rt, tcg_rt2); |
84 | + } else { | ||
85 | + tcg_gen_concat32_i64(tmp, tcg_rt2, tcg_rt); | ||
86 | + } | ||
87 | + tcg_gen_qemu_st_i64(tmp, clean_addr, get_mem_index(s), mop); | ||
88 | + } else { | ||
89 | + TCGv_i128 tmp = tcg_temp_new_i128(); | ||
75 | + | 90 | + |
76 | + if (vq != old_vq) { | 91 | + if (s->be_data == MO_LE) { |
77 | + /* | 92 | + tcg_gen_concat_i64_i128(tmp, tcg_rt, tcg_rt2); |
78 | + * PSTATE.ZA state is cleared on any change to SVL. | 93 | + } else { |
79 | + * We need not call arm_rebuild_hflags because PSTATE.SM was | 94 | + tcg_gen_concat_i64_i128(tmp, tcg_rt2, tcg_rt); |
80 | + * cleared on syscall entry, so this hasn't changed VL. | 95 | + } |
81 | + */ | 96 | + tcg_gen_qemu_st_i128(tmp, clean_addr, get_mem_index(s), mop); |
82 | + env->svcr = FIELD_DP64(env->svcr, SVCR, ZA, 0); | 97 | + } |
83 | + arm_rebuild_hflags(env); | 98 | } |
84 | + } | 99 | } |
85 | + return vq * 16; | 100 | |
86 | + } | ||
87 | + return -TARGET_EINVAL; | ||
88 | +} | ||
89 | +#define do_prctl_sme_set_vl do_prctl_sme_set_vl | ||
90 | + | ||
91 | static abi_long do_prctl_reset_keys(CPUArchState *env, abi_long arg2) | ||
92 | { | ||
93 | ARMCPU *cpu = env_archcpu(env); | ||
94 | diff --git a/linux-user/syscall.c b/linux-user/syscall.c | ||
95 | index XXXXXXX..XXXXXXX 100644 | ||
96 | --- a/linux-user/syscall.c | ||
97 | +++ b/linux-user/syscall.c | ||
98 | @@ -XXX,XX +XXX,XX @@ abi_long do_arch_prctl(CPUX86State *env, int code, abi_ulong addr) | ||
99 | #ifndef PR_SET_SYSCALL_USER_DISPATCH | ||
100 | # define PR_SET_SYSCALL_USER_DISPATCH 59 | ||
101 | #endif | ||
102 | +#ifndef PR_SME_SET_VL | ||
103 | +# define PR_SME_SET_VL 63 | ||
104 | +# define PR_SME_GET_VL 64 | ||
105 | +# define PR_SME_VL_LEN_MASK 0xffff | ||
106 | +# define PR_SME_VL_INHERIT (1 << 17) | ||
107 | +#endif | ||
108 | |||
109 | #include "target_prctl.h" | ||
110 | |||
111 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl_inval1(CPUArchState *env, abi_long arg2) | ||
112 | #ifndef do_prctl_set_unalign | ||
113 | #define do_prctl_set_unalign do_prctl_inval1 | ||
114 | #endif | ||
115 | +#ifndef do_prctl_sme_get_vl | ||
116 | +#define do_prctl_sme_get_vl do_prctl_inval0 | ||
117 | +#endif | ||
118 | +#ifndef do_prctl_sme_set_vl | ||
119 | +#define do_prctl_sme_set_vl do_prctl_inval1 | ||
120 | +#endif | ||
121 | |||
122 | static abi_long do_prctl(CPUArchState *env, abi_long option, abi_long arg2, | ||
123 | abi_long arg3, abi_long arg4, abi_long arg5) | ||
124 | @@ -XXX,XX +XXX,XX @@ static abi_long do_prctl(CPUArchState *env, abi_long option, abi_long arg2, | ||
125 | return do_prctl_sve_get_vl(env); | ||
126 | case PR_SVE_SET_VL: | ||
127 | return do_prctl_sve_set_vl(env, arg2); | ||
128 | + case PR_SME_GET_VL: | ||
129 | + return do_prctl_sme_get_vl(env); | ||
130 | + case PR_SME_SET_VL: | ||
131 | + return do_prctl_sme_set_vl(env, arg2); | ||
132 | case PR_PAC_RESET_KEYS: | ||
133 | if (arg3 || arg4 || arg5) { | ||
134 | return -TARGET_EINVAL; | ||
135 | -- | 101 | -- |
136 | 2.25.1 | 102 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Fold the return value setting into the goto, so each | 3 | We are going to need the complete memop beforehand, |
4 | point of failure need not do both. | 4 | so let's not compute it twice. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-37-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-11-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | linux-user/aarch64/signal.c | 26 +++++++++++--------------- | 11 | target/arm/tcg/translate-a64.c | 61 +++++++++++++++++++--------------- |
12 | 1 file changed, 11 insertions(+), 15 deletions(-) | 12 | 1 file changed, 35 insertions(+), 26 deletions(-) |
13 | 13 | ||
14 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 14 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
15 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/linux-user/aarch64/signal.c | 16 | --- a/target/arm/tcg/translate-a64.c |
17 | +++ b/linux-user/aarch64/signal.c | 17 | +++ b/target/arm/tcg/translate-a64.c |
18 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 18 | @@ -XXX,XX +XXX,XX @@ static void do_gpr_st_memidx(DisasContext *s, TCGv_i64 source, |
19 | struct target_sve_context *sve = NULL; | 19 | unsigned int iss_srt, |
20 | uint64_t extra_datap = 0; | 20 | bool iss_sf, bool iss_ar) |
21 | bool used_extra = false; | 21 | { |
22 | - bool err = false; | 22 | - memop = finalize_memop(s, memop); |
23 | int vq = 0, sve_size = 0; | 23 | tcg_gen_qemu_st_i64(source, tcg_addr, memidx, memop); |
24 | 24 | ||
25 | target_restore_general_frame(env, sf); | 25 | if (iss_valid) { |
26 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 26 | @@ -XXX,XX +XXX,XX @@ static void do_gpr_ld_memidx(DisasContext *s, TCGv_i64 dest, TCGv_i64 tcg_addr, |
27 | switch (magic) { | 27 | bool iss_valid, unsigned int iss_srt, |
28 | case 0: | 28 | bool iss_sf, bool iss_ar) |
29 | if (size != 0) { | 29 | { |
30 | - err = true; | 30 | - memop = finalize_memop(s, memop); |
31 | - goto exit; | 31 | tcg_gen_qemu_ld_i64(dest, tcg_addr, memidx, memop); |
32 | + goto err; | 32 | |
33 | } | 33 | if (extend && (memop & MO_SIGN)) { |
34 | if (used_extra) { | 34 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) |
35 | ctx = NULL; | 35 | int o2_L_o1_o0 = extract32(insn, 21, 3) * 2 | is_lasr; |
36 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 36 | int size = extract32(insn, 30, 2); |
37 | 37 | TCGv_i64 clean_addr; | |
38 | case TARGET_FPSIMD_MAGIC: | 38 | + MemOp memop; |
39 | if (fpsimd || size != sizeof(struct target_fpsimd_context)) { | 39 | |
40 | - err = true; | 40 | switch (o2_L_o1_o0) { |
41 | - goto exit; | 41 | case 0x0: /* STXR */ |
42 | + goto err; | 42 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) |
43 | } | 43 | gen_check_sp_alignment(s); |
44 | fpsimd = (struct target_fpsimd_context *)ctx; | 44 | } |
45 | break; | 45 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_STRL); |
46 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 46 | + /* TODO: ARMv8.4-LSE SCTLR.nAA */ |
47 | break; | 47 | + memop = finalize_memop(s, size | MO_ALIGN); |
48 | } | 48 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), |
49 | } | 49 | true, rn != 31, size); |
50 | - err = true; | 50 | - /* TODO: ARMv8.4-LSE SCTLR.nAA */ |
51 | - goto exit; | 51 | - do_gpr_st(s, cpu_reg(s, rt), clean_addr, size | MO_ALIGN, true, rt, |
52 | + goto err; | 52 | + do_gpr_st(s, cpu_reg(s, rt), clean_addr, memop, true, rt, |
53 | 53 | disas_ldst_compute_iss_sf(size, false, 0), is_lasr); | |
54 | case TARGET_EXTRA_MAGIC: | 54 | return; |
55 | if (extra || size != sizeof(struct target_extra_context)) { | 55 | |
56 | - err = true; | 56 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) |
57 | - goto exit; | 57 | if (rn == 31) { |
58 | + goto err; | 58 | gen_check_sp_alignment(s); |
59 | } | 59 | } |
60 | __get_user(extra_datap, | 60 | + /* TODO: ARMv8.4-LSE SCTLR.nAA */ |
61 | &((struct target_extra_context *)ctx)->datap); | 61 | + memop = finalize_memop(s, size | MO_ALIGN); |
62 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 62 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), |
63 | /* Unknown record -- we certainly didn't generate it. | 63 | false, rn != 31, size); |
64 | * Did we in fact get out of sync? | 64 | - /* TODO: ARMv8.4-LSE SCTLR.nAA */ |
65 | */ | 65 | - do_gpr_ld(s, cpu_reg(s, rt), clean_addr, size | MO_ALIGN, false, true, |
66 | - err = true; | 66 | + do_gpr_ld(s, cpu_reg(s, rt), clean_addr, memop, false, true, |
67 | - goto exit; | 67 | rt, disas_ldst_compute_iss_sf(size, false, 0), is_lasr); |
68 | + goto err; | 68 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_LDAQ); |
69 | } | 69 | return; |
70 | ctx = (void *)ctx + size; | 70 | @@ -XXX,XX +XXX,XX @@ static void disas_ld_lit(DisasContext *s, uint32_t insn) |
71 | } | ||
72 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | ||
73 | if (fpsimd) { | ||
74 | target_restore_fpsimd_record(env, fpsimd); | ||
75 | } else { | 71 | } else { |
76 | - err = true; | 72 | /* Only unsigned 32bit loads target 32bit registers. */ |
77 | + goto err; | 73 | bool iss_sf = opc != 0; |
78 | } | 74 | + MemOp memop = finalize_memop(s, size + is_signed * MO_SIGN); |
79 | 75 | ||
80 | /* SVE data, if present, overwrites FPSIMD data. */ | 76 | - do_gpr_ld(s, tcg_rt, clean_addr, size + is_signed * MO_SIGN, |
81 | if (sve) { | 77 | - false, true, rt, iss_sf, false); |
82 | target_restore_sve_record(env, sve, vq); | 78 | + do_gpr_ld(s, tcg_rt, clean_addr, memop, false, true, rt, iss_sf, false); |
83 | } | 79 | } |
84 | - | ||
85 | - exit: | ||
86 | unlock_user(extra, extra_datap, 0); | ||
87 | - return err; | ||
88 | + return 0; | ||
89 | + | ||
90 | + err: | ||
91 | + unlock_user(extra, extra_datap, 0); | ||
92 | + return 1; | ||
93 | } | 80 | } |
94 | 81 | ||
95 | static abi_ulong get_sigframe(struct target_sigaction *ka, | 82 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, |
83 | bool post_index; | ||
84 | bool writeback; | ||
85 | int memidx; | ||
86 | - | ||
87 | + MemOp memop; | ||
88 | TCGv_i64 clean_addr, dirty_addr; | ||
89 | |||
90 | if (is_vector) { | ||
91 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, | ||
92 | return; | ||
93 | } | ||
94 | is_store = (opc == 0); | ||
95 | - is_signed = extract32(opc, 1, 1); | ||
96 | + is_signed = !is_store && extract32(opc, 1, 1); | ||
97 | is_extended = (size < 3) && extract32(opc, 0, 1); | ||
98 | } | ||
99 | |||
100 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, | ||
101 | } | ||
102 | |||
103 | memidx = is_unpriv ? get_a64_user_mem_index(s) : get_mem_index(s); | ||
104 | + memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
105 | + | ||
106 | clean_addr = gen_mte_check1_mmuidx(s, dirty_addr, is_store, | ||
107 | writeback || rn != 31, | ||
108 | size, is_unpriv, memidx); | ||
109 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, | ||
110 | bool iss_sf = disas_ldst_compute_iss_sf(size, is_signed, opc); | ||
111 | |||
112 | if (is_store) { | ||
113 | - do_gpr_st_memidx(s, tcg_rt, clean_addr, size, memidx, | ||
114 | + do_gpr_st_memidx(s, tcg_rt, clean_addr, memop, memidx, | ||
115 | iss_valid, rt, iss_sf, false); | ||
116 | } else { | ||
117 | - do_gpr_ld_memidx(s, tcg_rt, clean_addr, size + is_signed * MO_SIGN, | ||
118 | + do_gpr_ld_memidx(s, tcg_rt, clean_addr, memop, | ||
119 | is_extended, memidx, | ||
120 | iss_valid, rt, iss_sf, false); | ||
121 | } | ||
122 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, | ||
123 | bool is_signed = false; | ||
124 | bool is_store = false; | ||
125 | bool is_extended = false; | ||
126 | - | ||
127 | TCGv_i64 tcg_rm, clean_addr, dirty_addr; | ||
128 | + MemOp memop; | ||
129 | |||
130 | if (extract32(opt, 1, 1) == 0) { | ||
131 | unallocated_encoding(s); | ||
132 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, | ||
133 | return; | ||
134 | } | ||
135 | is_store = (opc == 0); | ||
136 | - is_signed = extract32(opc, 1, 1); | ||
137 | + is_signed = !is_store && extract32(opc, 1, 1); | ||
138 | is_extended = (size < 3) && extract32(opc, 0, 1); | ||
139 | } | ||
140 | |||
141 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, | ||
142 | ext_and_shift_reg(tcg_rm, tcg_rm, opt, shift ? size : 0); | ||
143 | |||
144 | tcg_gen_add_i64(dirty_addr, dirty_addr, tcg_rm); | ||
145 | + | ||
146 | + memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
147 | clean_addr = gen_mte_check1(s, dirty_addr, is_store, true, size); | ||
148 | |||
149 | if (is_vector) { | ||
150 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, | ||
151 | } else { | ||
152 | TCGv_i64 tcg_rt = cpu_reg(s, rt); | ||
153 | bool iss_sf = disas_ldst_compute_iss_sf(size, is_signed, opc); | ||
154 | + | ||
155 | if (is_store) { | ||
156 | - do_gpr_st(s, tcg_rt, clean_addr, size, | ||
157 | + do_gpr_st(s, tcg_rt, clean_addr, memop, | ||
158 | true, rt, iss_sf, false); | ||
159 | } else { | ||
160 | - do_gpr_ld(s, tcg_rt, clean_addr, size + is_signed * MO_SIGN, | ||
161 | + do_gpr_ld(s, tcg_rt, clean_addr, memop, | ||
162 | is_extended, true, rt, iss_sf, false); | ||
163 | } | ||
164 | } | ||
165 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, | ||
166 | int rn = extract32(insn, 5, 5); | ||
167 | unsigned int imm12 = extract32(insn, 10, 12); | ||
168 | unsigned int offset; | ||
169 | - | ||
170 | TCGv_i64 clean_addr, dirty_addr; | ||
171 | - | ||
172 | bool is_store; | ||
173 | bool is_signed = false; | ||
174 | bool is_extended = false; | ||
175 | + MemOp memop; | ||
176 | |||
177 | if (is_vector) { | ||
178 | size |= (opc & 2) << 1; | ||
179 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, | ||
180 | return; | ||
181 | } | ||
182 | is_store = (opc == 0); | ||
183 | - is_signed = extract32(opc, 1, 1); | ||
184 | + is_signed = !is_store && extract32(opc, 1, 1); | ||
185 | is_extended = (size < 3) && extract32(opc, 0, 1); | ||
186 | } | ||
187 | |||
188 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, | ||
189 | dirty_addr = read_cpu_reg_sp(s, rn, 1); | ||
190 | offset = imm12 << size; | ||
191 | tcg_gen_addi_i64(dirty_addr, dirty_addr, offset); | ||
192 | + | ||
193 | + memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
194 | clean_addr = gen_mte_check1(s, dirty_addr, is_store, rn != 31, size); | ||
195 | |||
196 | if (is_vector) { | ||
197 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, | ||
198 | TCGv_i64 tcg_rt = cpu_reg(s, rt); | ||
199 | bool iss_sf = disas_ldst_compute_iss_sf(size, is_signed, opc); | ||
200 | if (is_store) { | ||
201 | - do_gpr_st(s, tcg_rt, clean_addr, size, | ||
202 | - true, rt, iss_sf, false); | ||
203 | + do_gpr_st(s, tcg_rt, clean_addr, memop, true, rt, iss_sf, false); | ||
204 | } else { | ||
205 | - do_gpr_ld(s, tcg_rt, clean_addr, size + is_signed * MO_SIGN, | ||
206 | + do_gpr_ld(s, tcg_rt, clean_addr, memop, | ||
207 | is_extended, true, rt, iss_sf, false); | ||
208 | } | ||
209 | } | ||
210 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_atomic(DisasContext *s, uint32_t insn, | ||
211 | bool a = extract32(insn, 23, 1); | ||
212 | TCGv_i64 tcg_rs, tcg_rt, clean_addr; | ||
213 | AtomicThreeOpFn *fn = NULL; | ||
214 | - MemOp mop = s->be_data | size | MO_ALIGN; | ||
215 | + MemOp mop = finalize_memop(s, size | MO_ALIGN); | ||
216 | |||
217 | if (is_vector || !dc_isar_feature(aa64_atomics, s)) { | ||
218 | unallocated_encoding(s); | ||
219 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_atomic(DisasContext *s, uint32_t insn, | ||
220 | * full load-acquire (we only need "load-acquire processor consistent"), | ||
221 | * but we choose to implement them as full LDAQ. | ||
222 | */ | ||
223 | - do_gpr_ld(s, cpu_reg(s, rt), clean_addr, size, false, | ||
224 | + do_gpr_ld(s, cpu_reg(s, rt), clean_addr, mop, false, | ||
225 | true, rt, disas_ldst_compute_iss_sf(size, false, 0), true); | ||
226 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_LDAQ); | ||
227 | return; | ||
228 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pac(DisasContext *s, uint32_t insn, | ||
229 | bool use_key_a = !extract32(insn, 23, 1); | ||
230 | int offset; | ||
231 | TCGv_i64 clean_addr, dirty_addr, tcg_rt; | ||
232 | + MemOp memop; | ||
233 | |||
234 | if (size != 3 || is_vector || !dc_isar_feature(aa64_pauth, s)) { | ||
235 | unallocated_encoding(s); | ||
236 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pac(DisasContext *s, uint32_t insn, | ||
237 | offset = sextract32(offset << size, 0, 10 + size); | ||
238 | tcg_gen_addi_i64(dirty_addr, dirty_addr, offset); | ||
239 | |||
240 | + memop = finalize_memop(s, size); | ||
241 | + | ||
242 | /* Note that "clean" and "dirty" here refer to TBI not PAC. */ | ||
243 | clean_addr = gen_mte_check1(s, dirty_addr, false, | ||
244 | is_wback || rn != 31, size); | ||
245 | |||
246 | tcg_rt = cpu_reg(s, rt); | ||
247 | - do_gpr_ld(s, tcg_rt, clean_addr, size, | ||
248 | + do_gpr_ld(s, tcg_rt, clean_addr, memop, | ||
249 | /* extend */ false, /* iss_valid */ !is_wback, | ||
250 | /* iss_srt */ rt, /* iss_sf */ true, /* iss_ar */ false); | ||
251 | |||
252 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_ldapr_stlr(DisasContext *s, uint32_t insn) | ||
253 | } | ||
254 | |||
255 | /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
256 | - mop = size | MO_ALIGN; | ||
257 | + mop = finalize_memop(s, size | MO_ALIGN); | ||
258 | |||
259 | switch (opc) { | ||
260 | case 0: /* STLURB */ | ||
96 | -- | 261 | -- |
97 | 2.25.1 | 262 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Set the SM bit in the SVE record on signal delivery, create the ZA record. | 3 | We are going to need the complete memop beforehand, |
4 | Restore SM and ZA state according to the records present on return. | 4 | so let's not compute it twice. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org> | ||
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-41-richard.henderson@linaro.org | 9 | Message-id: 20230530191438.411344-12-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | linux-user/aarch64/signal.c | 167 +++++++++++++++++++++++++++++++++--- | 12 | target/arm/tcg/translate-a64.c | 43 ++++++++++++++++++---------------- |
12 | 1 file changed, 154 insertions(+), 13 deletions(-) | 13 | 1 file changed, 23 insertions(+), 20 deletions(-) |
13 | 14 | ||
14 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 15 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
15 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/linux-user/aarch64/signal.c | 17 | --- a/target/arm/tcg/translate-a64.c |
17 | +++ b/linux-user/aarch64/signal.c | 18 | +++ b/target/arm/tcg/translate-a64.c |
18 | @@ -XXX,XX +XXX,XX @@ struct target_sve_context { | 19 | @@ -XXX,XX +XXX,XX @@ static void do_gpr_ld(DisasContext *s, TCGv_i64 dest, TCGv_i64 tcg_addr, |
19 | 20 | /* | |
20 | #define TARGET_SVE_SIG_FLAG_SM 1 | 21 | * Store from FP register to memory |
21 | 22 | */ | |
22 | +#define TARGET_ZA_MAGIC 0x54366345 | 23 | -static void do_fp_st(DisasContext *s, int srcidx, TCGv_i64 tcg_addr, int size) |
24 | +static void do_fp_st(DisasContext *s, int srcidx, TCGv_i64 tcg_addr, MemOp mop) | ||
25 | { | ||
26 | /* This writes the bottom N bits of a 128 bit wide vector to memory */ | ||
27 | TCGv_i64 tmplo = tcg_temp_new_i64(); | ||
28 | - MemOp mop = finalize_memop_asimd(s, size); | ||
29 | |||
30 | tcg_gen_ld_i64(tmplo, cpu_env, fp_reg_offset(s, srcidx, MO_64)); | ||
31 | |||
32 | - if (size < MO_128) { | ||
33 | + if ((mop & MO_SIZE) < MO_128) { | ||
34 | tcg_gen_qemu_st_i64(tmplo, tcg_addr, get_mem_index(s), mop); | ||
35 | } else { | ||
36 | TCGv_i64 tmphi = tcg_temp_new_i64(); | ||
37 | @@ -XXX,XX +XXX,XX @@ static void do_fp_st(DisasContext *s, int srcidx, TCGv_i64 tcg_addr, int size) | ||
38 | /* | ||
39 | * Load from memory to FP register | ||
40 | */ | ||
41 | -static void do_fp_ld(DisasContext *s, int destidx, TCGv_i64 tcg_addr, int size) | ||
42 | +static void do_fp_ld(DisasContext *s, int destidx, TCGv_i64 tcg_addr, MemOp mop) | ||
43 | { | ||
44 | /* This always zero-extends and writes to a full 128 bit wide vector */ | ||
45 | TCGv_i64 tmplo = tcg_temp_new_i64(); | ||
46 | TCGv_i64 tmphi = NULL; | ||
47 | - MemOp mop = finalize_memop_asimd(s, size); | ||
48 | |||
49 | - if (size < MO_128) { | ||
50 | + if ((mop & MO_SIZE) < MO_128) { | ||
51 | tcg_gen_qemu_ld_i64(tmplo, tcg_addr, get_mem_index(s), mop); | ||
52 | } else { | ||
53 | TCGv_i128 t16 = tcg_temp_new_i128(); | ||
54 | @@ -XXX,XX +XXX,XX @@ static void disas_ld_lit(DisasContext *s, uint32_t insn) | ||
55 | bool is_signed = false; | ||
56 | int size = 2; | ||
57 | TCGv_i64 tcg_rt, clean_addr; | ||
58 | + MemOp memop; | ||
59 | |||
60 | if (is_vector) { | ||
61 | if (opc == 3) { | ||
62 | @@ -XXX,XX +XXX,XX @@ static void disas_ld_lit(DisasContext *s, uint32_t insn) | ||
63 | if (!fp_access_check(s)) { | ||
64 | return; | ||
65 | } | ||
66 | + memop = finalize_memop_asimd(s, size); | ||
67 | } else { | ||
68 | if (opc == 3) { | ||
69 | /* PRFM (literal) : prefetch */ | ||
70 | @@ -XXX,XX +XXX,XX @@ static void disas_ld_lit(DisasContext *s, uint32_t insn) | ||
71 | } | ||
72 | size = 2 + extract32(opc, 0, 1); | ||
73 | is_signed = extract32(opc, 1, 1); | ||
74 | + memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
75 | } | ||
76 | |||
77 | tcg_rt = cpu_reg(s, rt); | ||
78 | |||
79 | clean_addr = tcg_temp_new_i64(); | ||
80 | gen_pc_plus_diff(s, clean_addr, imm); | ||
23 | + | 81 | + |
24 | +struct target_za_context { | 82 | if (is_vector) { |
25 | + struct target_aarch64_ctx head; | 83 | - do_fp_ld(s, rt, clean_addr, size); |
26 | + uint16_t vl; | 84 | + do_fp_ld(s, rt, clean_addr, memop); |
27 | + uint16_t reserved[3]; | 85 | } else { |
28 | + /* The actual ZA data immediately follows. */ | 86 | /* Only unsigned 32bit loads target 32bit registers. */ |
29 | +}; | 87 | bool iss_sf = opc != 0; |
30 | + | 88 | - MemOp memop = finalize_memop(s, size + is_signed * MO_SIGN); |
31 | +#define TARGET_ZA_SIG_REGS_OFFSET \ | 89 | - |
32 | + QEMU_ALIGN_UP(sizeof(struct target_za_context), TARGET_SVE_VQ_BYTES) | 90 | do_gpr_ld(s, tcg_rt, clean_addr, memop, false, true, rt, iss_sf, false); |
33 | +#define TARGET_ZA_SIG_ZAV_OFFSET(VQ, N) \ | ||
34 | + (TARGET_ZA_SIG_REGS_OFFSET + (VQ) * TARGET_SVE_VQ_BYTES * (N)) | ||
35 | +#define TARGET_ZA_SIG_CONTEXT_SIZE(VQ) \ | ||
36 | + TARGET_ZA_SIG_ZAV_OFFSET(VQ, VQ * TARGET_SVE_VQ_BYTES) | ||
37 | + | ||
38 | struct target_rt_sigframe { | ||
39 | struct target_siginfo info; | ||
40 | struct target_ucontext uc; | ||
41 | @@ -XXX,XX +XXX,XX @@ static void target_setup_end_record(struct target_aarch64_ctx *end) | ||
42 | } | ||
43 | |||
44 | static void target_setup_sve_record(struct target_sve_context *sve, | ||
45 | - CPUARMState *env, int vq, int size) | ||
46 | + CPUARMState *env, int size) | ||
47 | { | ||
48 | - int i, j; | ||
49 | + int i, j, vq = sve_vq(env); | ||
50 | |||
51 | memset(sve, 0, sizeof(*sve)); | ||
52 | __put_user(TARGET_SVE_MAGIC, &sve->head.magic); | ||
53 | @@ -XXX,XX +XXX,XX @@ static void target_setup_sve_record(struct target_sve_context *sve, | ||
54 | } | 91 | } |
55 | } | 92 | } |
56 | 93 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) | |
57 | +static void target_setup_za_record(struct target_za_context *za, | 94 | (wback || rn != 31) && !set_tag, 2 << size); |
58 | + CPUARMState *env, int size) | 95 | |
59 | +{ | 96 | if (is_vector) { |
60 | + int vq = sme_vq(env); | 97 | + MemOp mop = finalize_memop_asimd(s, size); |
61 | + int vl = vq * TARGET_SVE_VQ_BYTES; | ||
62 | + int i, j; | ||
63 | + | 98 | + |
64 | + memset(za, 0, sizeof(*za)); | 99 | if (is_load) { |
65 | + __put_user(TARGET_ZA_MAGIC, &za->head.magic); | 100 | - do_fp_ld(s, rt, clean_addr, size); |
66 | + __put_user(size, &za->head.size); | 101 | + do_fp_ld(s, rt, clean_addr, mop); |
67 | + __put_user(vl, &za->vl); | 102 | } else { |
68 | + | 103 | - do_fp_st(s, rt, clean_addr, size); |
69 | + if (size == TARGET_ZA_SIG_CONTEXT_SIZE(0)) { | 104 | + do_fp_st(s, rt, clean_addr, mop); |
70 | + return; | 105 | } |
71 | + } | 106 | tcg_gen_addi_i64(clean_addr, clean_addr, 1 << size); |
72 | + assert(size == TARGET_ZA_SIG_CONTEXT_SIZE(vq)); | 107 | if (is_load) { |
73 | + | 108 | - do_fp_ld(s, rt2, clean_addr, size); |
74 | + /* | 109 | + do_fp_ld(s, rt2, clean_addr, mop); |
75 | + * Note that ZA vectors are stored as a byte stream, | 110 | } else { |
76 | + * with each byte element at a subsequent address. | 111 | - do_fp_st(s, rt2, clean_addr, size); |
77 | + */ | 112 | + do_fp_st(s, rt2, clean_addr, mop); |
78 | + for (i = 0; i < vl; ++i) { | 113 | } |
79 | + uint64_t *z = (void *)za + TARGET_ZA_SIG_ZAV_OFFSET(vq, i); | 114 | } else { |
80 | + for (j = 0; j < vq * 2; ++j) { | 115 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
81 | + __put_user_e(env->zarray[i].d[j], z + j, le); | 116 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, |
82 | + } | 117 | if (!fp_access_check(s)) { |
83 | + } | 118 | return; |
84 | +} | 119 | } |
85 | + | 120 | + memop = finalize_memop_asimd(s, size); |
86 | static void target_restore_general_frame(CPUARMState *env, | 121 | } else { |
87 | struct target_rt_sigframe *sf) | 122 | if (size == 3 && opc == 2) { |
88 | { | 123 | /* PRFM - prefetch */ |
89 | @@ -XXX,XX +XXX,XX @@ static void target_restore_fpsimd_record(CPUARMState *env, | 124 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, |
90 | 125 | is_store = (opc == 0); | |
91 | static bool target_restore_sve_record(CPUARMState *env, | 126 | is_signed = !is_store && extract32(opc, 1, 1); |
92 | struct target_sve_context *sve, | 127 | is_extended = (size < 3) && extract32(opc, 0, 1); |
93 | - int size) | 128 | + memop = finalize_memop(s, size + is_signed * MO_SIGN); |
94 | + int size, int *svcr) | ||
95 | { | ||
96 | - int i, j, vl, vq; | ||
97 | + int i, j, vl, vq, flags; | ||
98 | + bool sm; | ||
99 | |||
100 | - if (!cpu_isar_feature(aa64_sve, env_archcpu(env))) { | ||
101 | + __get_user(vl, &sve->vl); | ||
102 | + __get_user(flags, &sve->flags); | ||
103 | + | ||
104 | + sm = flags & TARGET_SVE_SIG_FLAG_SM; | ||
105 | + | ||
106 | + /* The cpu must support Streaming or Non-streaming SVE. */ | ||
107 | + if (sm | ||
108 | + ? !cpu_isar_feature(aa64_sme, env_archcpu(env)) | ||
109 | + : !cpu_isar_feature(aa64_sve, env_archcpu(env))) { | ||
110 | return false; | ||
111 | } | 129 | } |
112 | 130 | ||
113 | - __get_user(vl, &sve->vl); | 131 | switch (idx) { |
114 | - vq = sve_vq(env); | 132 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, |
115 | + /* | ||
116 | + * Note that we cannot use sve_vq() because that depends on the | ||
117 | + * current setting of PSTATE.SM, not the state to be restored. | ||
118 | + */ | ||
119 | + vq = sve_vqm1_for_el_sm(env, 0, sm) + 1; | ||
120 | |||
121 | /* Reject mismatched VL. */ | ||
122 | if (vl != vq * TARGET_SVE_VQ_BYTES) { | ||
123 | @@ -XXX,XX +XXX,XX @@ static bool target_restore_sve_record(CPUARMState *env, | ||
124 | return false; | ||
125 | } | 133 | } |
126 | 134 | ||
127 | + *svcr = FIELD_DP64(*svcr, SVCR, SM, sm); | 135 | memidx = is_unpriv ? get_a64_user_mem_index(s) : get_mem_index(s); |
128 | + | 136 | - memop = finalize_memop(s, size + is_signed * MO_SIGN); |
129 | /* | 137 | |
130 | * Note that SVE regs are stored as a byte stream, with each byte element | 138 | clean_addr = gen_mte_check1_mmuidx(s, dirty_addr, is_store, |
131 | * at a subsequent address. This corresponds to a little-endian load | 139 | writeback || rn != 31, |
132 | @@ -XXX,XX +XXX,XX @@ static bool target_restore_sve_record(CPUARMState *env, | 140 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_imm9(DisasContext *s, uint32_t insn, |
133 | return true; | 141 | |
134 | } | 142 | if (is_vector) { |
135 | 143 | if (is_store) { | |
136 | +static bool target_restore_za_record(CPUARMState *env, | 144 | - do_fp_st(s, rt, clean_addr, size); |
137 | + struct target_za_context *za, | 145 | + do_fp_st(s, rt, clean_addr, memop); |
138 | + int size, int *svcr) | 146 | } else { |
139 | +{ | 147 | - do_fp_ld(s, rt, clean_addr, size); |
140 | + int i, j, vl, vq; | 148 | + do_fp_ld(s, rt, clean_addr, memop); |
141 | + | 149 | } |
142 | + if (!cpu_isar_feature(aa64_sme, env_archcpu(env))) { | 150 | } else { |
143 | + return false; | 151 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
144 | + } | 152 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, |
145 | + | 153 | |
146 | + __get_user(vl, &za->vl); | 154 | if (is_vector) { |
147 | + vq = sme_vq(env); | 155 | if (is_store) { |
148 | + | 156 | - do_fp_st(s, rt, clean_addr, size); |
149 | + /* Reject mismatched VL. */ | 157 | + do_fp_st(s, rt, clean_addr, memop); |
150 | + if (vl != vq * TARGET_SVE_VQ_BYTES) { | 158 | } else { |
151 | + return false; | 159 | - do_fp_ld(s, rt, clean_addr, size); |
152 | + } | 160 | + do_fp_ld(s, rt, clean_addr, memop); |
153 | + | 161 | } |
154 | + /* Accept empty record -- used to clear PSTATE.ZA. */ | 162 | } else { |
155 | + if (size <= TARGET_ZA_SIG_CONTEXT_SIZE(0)) { | 163 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
156 | + return true; | 164 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, |
157 | + } | 165 | |
158 | + | 166 | if (is_vector) { |
159 | + /* Reject non-empty but incomplete record. */ | 167 | if (is_store) { |
160 | + if (size < TARGET_ZA_SIG_CONTEXT_SIZE(vq)) { | 168 | - do_fp_st(s, rt, clean_addr, size); |
161 | + return false; | 169 | + do_fp_st(s, rt, clean_addr, memop); |
162 | + } | 170 | } else { |
163 | + | 171 | - do_fp_ld(s, rt, clean_addr, size); |
164 | + *svcr = FIELD_DP64(*svcr, SVCR, ZA, 1); | 172 | + do_fp_ld(s, rt, clean_addr, memop); |
165 | + | 173 | } |
166 | + for (i = 0; i < vl; ++i) { | 174 | } else { |
167 | + uint64_t *z = (void *)za + TARGET_ZA_SIG_ZAV_OFFSET(vq, i); | 175 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
168 | + for (j = 0; j < vq * 2; ++j) { | ||
169 | + __get_user_e(env->zarray[i].d[j], z + j, le); | ||
170 | + } | ||
171 | + } | ||
172 | + return true; | ||
173 | +} | ||
174 | + | ||
175 | static int target_restore_sigframe(CPUARMState *env, | ||
176 | struct target_rt_sigframe *sf) | ||
177 | { | ||
178 | struct target_aarch64_ctx *ctx, *extra = NULL; | ||
179 | struct target_fpsimd_context *fpsimd = NULL; | ||
180 | struct target_sve_context *sve = NULL; | ||
181 | + struct target_za_context *za = NULL; | ||
182 | uint64_t extra_datap = 0; | ||
183 | bool used_extra = false; | ||
184 | int sve_size = 0; | ||
185 | + int za_size = 0; | ||
186 | + int svcr = 0; | ||
187 | |||
188 | target_restore_general_frame(env, sf); | ||
189 | |||
190 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | ||
191 | sve_size = size; | ||
192 | break; | ||
193 | |||
194 | + case TARGET_ZA_MAGIC: | ||
195 | + if (za || size < sizeof(struct target_za_context)) { | ||
196 | + goto err; | ||
197 | + } | ||
198 | + za = (struct target_za_context *)ctx; | ||
199 | + za_size = size; | ||
200 | + break; | ||
201 | + | ||
202 | case TARGET_EXTRA_MAGIC: | ||
203 | if (extra || size != sizeof(struct target_extra_context)) { | ||
204 | goto err; | ||
205 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | ||
206 | } | ||
207 | |||
208 | /* SVE data, if present, overwrites FPSIMD data. */ | ||
209 | - if (sve && !target_restore_sve_record(env, sve, sve_size)) { | ||
210 | + if (sve && !target_restore_sve_record(env, sve, sve_size, &svcr)) { | ||
211 | goto err; | ||
212 | } | ||
213 | + if (za && !target_restore_za_record(env, za, za_size, &svcr)) { | ||
214 | + goto err; | ||
215 | + } | ||
216 | + if (env->svcr != svcr) { | ||
217 | + env->svcr = svcr; | ||
218 | + arm_rebuild_hflags(env); | ||
219 | + } | ||
220 | unlock_user(extra, extra_datap, 0); | ||
221 | return 0; | ||
222 | |||
223 | @@ -XXX,XX +XXX,XX @@ static void target_setup_frame(int usig, struct target_sigaction *ka, | ||
224 | .total_size = offsetof(struct target_rt_sigframe, | ||
225 | uc.tuc_mcontext.__reserved), | ||
226 | }; | ||
227 | - int fpsimd_ofs, fr_ofs, sve_ofs = 0, vq = 0, sve_size = 0; | ||
228 | + int fpsimd_ofs, fr_ofs, sve_ofs = 0, za_ofs = 0; | ||
229 | + int sve_size = 0, za_size = 0; | ||
230 | struct target_rt_sigframe *frame; | ||
231 | struct target_rt_frame_record *fr; | ||
232 | abi_ulong frame_addr, return_addr; | ||
233 | @@ -XXX,XX +XXX,XX @@ static void target_setup_frame(int usig, struct target_sigaction *ka, | ||
234 | &layout); | ||
235 | |||
236 | /* SVE state needs saving only if it exists. */ | ||
237 | - if (cpu_isar_feature(aa64_sve, env_archcpu(env))) { | ||
238 | - vq = sve_vq(env); | ||
239 | - sve_size = QEMU_ALIGN_UP(TARGET_SVE_SIG_CONTEXT_SIZE(vq), 16); | ||
240 | + if (cpu_isar_feature(aa64_sve, env_archcpu(env)) || | ||
241 | + cpu_isar_feature(aa64_sme, env_archcpu(env))) { | ||
242 | + sve_size = QEMU_ALIGN_UP(TARGET_SVE_SIG_CONTEXT_SIZE(sve_vq(env)), 16); | ||
243 | sve_ofs = alloc_sigframe_space(sve_size, &layout); | ||
244 | } | ||
245 | + if (cpu_isar_feature(aa64_sme, env_archcpu(env))) { | ||
246 | + /* ZA state needs saving only if it is enabled. */ | ||
247 | + if (FIELD_EX64(env->svcr, SVCR, ZA)) { | ||
248 | + za_size = TARGET_ZA_SIG_CONTEXT_SIZE(sme_vq(env)); | ||
249 | + } else { | ||
250 | + za_size = TARGET_ZA_SIG_CONTEXT_SIZE(0); | ||
251 | + } | ||
252 | + za_ofs = alloc_sigframe_space(za_size, &layout); | ||
253 | + } | ||
254 | |||
255 | if (layout.extra_ofs) { | ||
256 | /* Reserve space for the extra end marker. The standard end marker | ||
257 | @@ -XXX,XX +XXX,XX @@ static void target_setup_frame(int usig, struct target_sigaction *ka, | ||
258 | target_setup_end_record((void *)frame + layout.extra_end_ofs); | ||
259 | } | ||
260 | if (sve_ofs) { | ||
261 | - target_setup_sve_record((void *)frame + sve_ofs, env, vq, sve_size); | ||
262 | + target_setup_sve_record((void *)frame + sve_ofs, env, sve_size); | ||
263 | + } | ||
264 | + if (za_ofs) { | ||
265 | + target_setup_za_record((void *)frame + za_ofs, env, za_size); | ||
266 | } | ||
267 | |||
268 | /* Set up the stack frame for unwinding. */ | ||
269 | @@ -XXX,XX +XXX,XX @@ static void target_setup_frame(int usig, struct target_sigaction *ka, | ||
270 | env->btype = 2; | ||
271 | } | ||
272 | |||
273 | + /* | ||
274 | + * Invoke the signal handler with both SM and ZA disabled. | ||
275 | + * When clearing SM, ResetSVEState, per SMSTOP. | ||
276 | + */ | ||
277 | + if (FIELD_EX64(env->svcr, SVCR, SM)) { | ||
278 | + arm_reset_sve_state(env); | ||
279 | + } | ||
280 | + if (env->svcr) { | ||
281 | + env->svcr = 0; | ||
282 | + arm_rebuild_hflags(env); | ||
283 | + } | ||
284 | + | ||
285 | if (info) { | ||
286 | tswap_siginfo(&frame->info, info); | ||
287 | env->xregs[1] = frame_addr + offsetof(struct target_rt_sigframe, info); | ||
288 | -- | 176 | -- |
289 | 2.25.1 | 177 | 2.34.1 |
178 | |||
179 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | The pseudocode for CheckSVEEnabled gains a check for Streaming | 3 | Pass the completed memop to gen_mte_check1_mmuidx. |
4 | SVE mode, and for SME present but SVE absent. | 4 | For the moment, do nothing more than extract the size. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-17-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-13-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/translate-a64.c | 22 ++++++++++++++++------ | 11 | target/arm/tcg/translate-a64.h | 2 +- |
12 | 1 file changed, 16 insertions(+), 6 deletions(-) | 12 | target/arm/tcg/translate-a64.c | 82 ++++++++++++++++++---------------- |
13 | target/arm/tcg/translate-sve.c | 7 +-- | ||
14 | 3 files changed, 49 insertions(+), 42 deletions(-) | ||
13 | 15 | ||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 16 | diff --git a/target/arm/tcg/translate-a64.h b/target/arm/tcg/translate-a64.h |
15 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 18 | --- a/target/arm/tcg/translate-a64.h |
17 | +++ b/target/arm/translate-a64.c | 19 | +++ b/target/arm/tcg/translate-a64.h |
18 | @@ -XXX,XX +XXX,XX @@ static bool fp_access_check(DisasContext *s) | 20 | @@ -XXX,XX +XXX,XX @@ static inline bool sme_smza_enabled_check(DisasContext *s) |
19 | return true; | 21 | |
22 | TCGv_i64 clean_data_tbi(DisasContext *s, TCGv_i64 addr); | ||
23 | TCGv_i64 gen_mte_check1(DisasContext *s, TCGv_i64 addr, bool is_write, | ||
24 | - bool tag_checked, int log2_size); | ||
25 | + bool tag_checked, MemOp memop); | ||
26 | TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, | ||
27 | bool tag_checked, int size); | ||
28 | |||
29 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/tcg/translate-a64.c | ||
32 | +++ b/target/arm/tcg/translate-a64.c | ||
33 | @@ -XXX,XX +XXX,XX @@ static void gen_probe_access(DisasContext *s, TCGv_i64 ptr, | ||
34 | */ | ||
35 | static TCGv_i64 gen_mte_check1_mmuidx(DisasContext *s, TCGv_i64 addr, | ||
36 | bool is_write, bool tag_checked, | ||
37 | - int log2_size, bool is_unpriv, | ||
38 | + MemOp memop, bool is_unpriv, | ||
39 | int core_idx) | ||
40 | { | ||
41 | if (tag_checked && s->mte_active[is_unpriv]) { | ||
42 | @@ -XXX,XX +XXX,XX @@ static TCGv_i64 gen_mte_check1_mmuidx(DisasContext *s, TCGv_i64 addr, | ||
43 | desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); | ||
44 | desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); | ||
45 | desc = FIELD_DP32(desc, MTEDESC, WRITE, is_write); | ||
46 | - desc = FIELD_DP32(desc, MTEDESC, SIZEM1, (1 << log2_size) - 1); | ||
47 | + desc = FIELD_DP32(desc, MTEDESC, SIZEM1, memop_size(memop) - 1); | ||
48 | |||
49 | ret = tcg_temp_new_i64(); | ||
50 | gen_helper_mte_check(ret, cpu_env, tcg_constant_i32(desc), addr); | ||
51 | @@ -XXX,XX +XXX,XX @@ static TCGv_i64 gen_mte_check1_mmuidx(DisasContext *s, TCGv_i64 addr, | ||
20 | } | 52 | } |
21 | 53 | ||
22 | -/* Check that SVE access is enabled. If it is, return true. | 54 | TCGv_i64 gen_mte_check1(DisasContext *s, TCGv_i64 addr, bool is_write, |
23 | +/* | 55 | - bool tag_checked, int log2_size) |
24 | + * Check that SVE access is enabled. If it is, return true. | 56 | + bool tag_checked, MemOp memop) |
25 | * If not, emit code to generate an appropriate exception and return false. | ||
26 | + * This function corresponds to CheckSVEEnabled(). | ||
27 | */ | ||
28 | bool sve_access_check(DisasContext *s) | ||
29 | { | 57 | { |
30 | - if (s->sve_excp_el) { | 58 | - return gen_mte_check1_mmuidx(s, addr, is_write, tag_checked, log2_size, |
31 | - assert(!s->sve_access_checked); | 59 | + return gen_mte_check1_mmuidx(s, addr, is_write, tag_checked, memop, |
32 | - s->sve_access_checked = true; | 60 | false, get_mem_index(s)); |
33 | - | 61 | } |
34 | + if (s->pstate_sm || !dc_isar_feature(aa64_sve, s)) { | 62 | |
35 | + assert(dc_isar_feature(aa64_sme, s)); | 63 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, int rn, |
36 | + if (!sme_sm_enabled_check(s)) { | 64 | int size, bool is_pair) |
37 | + goto fail_exit; | 65 | { |
38 | + } | 66 | int idx = get_mem_index(s); |
39 | + } else if (s->sve_excp_el) { | 67 | - MemOp memop; |
40 | gen_exception_insn_el(s, s->pc_curr, EXCP_UDEF, | 68 | TCGv_i64 dirty_addr, clean_addr; |
41 | syn_sve_access_trap(), s->sve_excp_el); | 69 | + MemOp memop; |
42 | - return false; | ||
43 | + goto fail_exit; | ||
44 | } | ||
45 | s->sve_access_checked = true; | ||
46 | return fp_access_check(s); | ||
47 | + | 70 | + |
48 | + fail_exit: | 71 | + /* |
49 | + /* Assert that we only raise one exception per instruction. */ | 72 | + * For pairs: |
50 | + assert(!s->sve_access_checked); | 73 | + * if size == 2, the operation is single-copy atomic for the doubleword. |
51 | + s->sve_access_checked = true; | 74 | + * if size == 3, the operation is single-copy atomic for *each* doubleword, |
52 | + return false; | 75 | + * not the entire quadword, however it must be quadword aligned. |
76 | + */ | ||
77 | + memop = size + is_pair; | ||
78 | + if (memop == MO_128) { | ||
79 | + memop = finalize_memop_atom(s, MO_128 | MO_ALIGN, | ||
80 | + MO_ATOM_IFALIGN_PAIR); | ||
81 | + } else { | ||
82 | + memop = finalize_memop(s, memop | MO_ALIGN); | ||
83 | + } | ||
84 | |||
85 | s->is_ldex = true; | ||
86 | dirty_addr = cpu_reg_sp(s, rn); | ||
87 | - clean_addr = gen_mte_check1(s, dirty_addr, false, rn != 31, size); | ||
88 | + clean_addr = gen_mte_check1(s, dirty_addr, false, rn != 31, memop); | ||
89 | |||
90 | g_assert(size <= 3); | ||
91 | if (is_pair) { | ||
92 | g_assert(size >= 2); | ||
93 | if (size == 2) { | ||
94 | - /* The pair must be single-copy atomic for the doubleword. */ | ||
95 | - memop = finalize_memop(s, MO_64 | MO_ALIGN); | ||
96 | tcg_gen_qemu_ld_i64(cpu_exclusive_val, clean_addr, idx, memop); | ||
97 | if (s->be_data == MO_LE) { | ||
98 | tcg_gen_extract_i64(cpu_reg(s, rt), cpu_exclusive_val, 0, 32); | ||
99 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, int rn, | ||
100 | tcg_gen_extract_i64(cpu_reg(s, rt2), cpu_exclusive_val, 0, 32); | ||
101 | } | ||
102 | } else { | ||
103 | - /* | ||
104 | - * The pair must be single-copy atomic for *each* doubleword, not | ||
105 | - * the entire quadword, however it must be quadword aligned. | ||
106 | - * Expose the complete load to tcg, for ease of tlb lookup, | ||
107 | - * but indicate that only 8-byte atomicity is required. | ||
108 | - */ | ||
109 | TCGv_i128 t16 = tcg_temp_new_i128(); | ||
110 | |||
111 | - memop = finalize_memop_atom(s, MO_128 | MO_ALIGN_16, | ||
112 | - MO_ATOM_IFALIGN_PAIR); | ||
113 | tcg_gen_qemu_ld_i128(t16, clean_addr, idx, memop); | ||
114 | |||
115 | if (s->be_data == MO_LE) { | ||
116 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, int rn, | ||
117 | tcg_gen_mov_i64(cpu_reg(s, rt2), cpu_exclusive_high); | ||
118 | } | ||
119 | } else { | ||
120 | - memop = finalize_memop(s, size | MO_ALIGN); | ||
121 | tcg_gen_qemu_ld_i64(cpu_exclusive_val, clean_addr, idx, memop); | ||
122 | tcg_gen_mov_i64(cpu_reg(s, rt), cpu_exclusive_val); | ||
123 | } | ||
124 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, | ||
125 | TCGLabel *fail_label = gen_new_label(); | ||
126 | TCGLabel *done_label = gen_new_label(); | ||
127 | TCGv_i64 tmp, dirty_addr, clean_addr; | ||
128 | + MemOp memop; | ||
129 | + | ||
130 | + memop = (size + is_pair) | MO_ALIGN; | ||
131 | + memop = finalize_memop(s, memop); | ||
132 | |||
133 | dirty_addr = cpu_reg_sp(s, rn); | ||
134 | - clean_addr = gen_mte_check1(s, dirty_addr, true, rn != 31, size); | ||
135 | + clean_addr = gen_mte_check1(s, dirty_addr, true, rn != 31, memop); | ||
136 | |||
137 | tcg_gen_brcond_i64(TCG_COND_NE, clean_addr, cpu_exclusive_addr, fail_label); | ||
138 | |||
139 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, | ||
140 | } | ||
141 | tcg_gen_atomic_cmpxchg_i64(tmp, cpu_exclusive_addr, | ||
142 | cpu_exclusive_val, tmp, | ||
143 | - get_mem_index(s), | ||
144 | - MO_64 | MO_ALIGN | s->be_data); | ||
145 | + get_mem_index(s), memop); | ||
146 | tcg_gen_setcond_i64(TCG_COND_NE, tmp, tmp, cpu_exclusive_val); | ||
147 | } else { | ||
148 | TCGv_i128 t16 = tcg_temp_new_i128(); | ||
149 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, | ||
150 | } | ||
151 | |||
152 | tcg_gen_atomic_cmpxchg_i128(t16, cpu_exclusive_addr, c16, t16, | ||
153 | - get_mem_index(s), | ||
154 | - MO_128 | MO_ALIGN | s->be_data); | ||
155 | + get_mem_index(s), memop); | ||
156 | |||
157 | a = tcg_temp_new_i64(); | ||
158 | b = tcg_temp_new_i64(); | ||
159 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, | ||
160 | } | ||
161 | } else { | ||
162 | tcg_gen_atomic_cmpxchg_i64(tmp, cpu_exclusive_addr, cpu_exclusive_val, | ||
163 | - cpu_reg(s, rt), get_mem_index(s), | ||
164 | - size | MO_ALIGN | s->be_data); | ||
165 | + cpu_reg(s, rt), get_mem_index(s), memop); | ||
166 | tcg_gen_setcond_i64(TCG_COND_NE, tmp, tmp, cpu_exclusive_val); | ||
167 | } | ||
168 | tcg_gen_mov_i64(cpu_reg(s, rd), tmp); | ||
169 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap(DisasContext *s, int rs, int rt, | ||
170 | TCGv_i64 tcg_rt = cpu_reg(s, rt); | ||
171 | int memidx = get_mem_index(s); | ||
172 | TCGv_i64 clean_addr; | ||
173 | + MemOp memop; | ||
174 | |||
175 | if (rn == 31) { | ||
176 | gen_check_sp_alignment(s); | ||
177 | } | ||
178 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, size); | ||
179 | - tcg_gen_atomic_cmpxchg_i64(tcg_rs, clean_addr, tcg_rs, tcg_rt, memidx, | ||
180 | - size | MO_ALIGN | s->be_data); | ||
181 | + memop = finalize_memop(s, size | MO_ALIGN); | ||
182 | + clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, memop); | ||
183 | + tcg_gen_atomic_cmpxchg_i64(tcg_rs, clean_addr, tcg_rs, tcg_rt, | ||
184 | + memidx, memop); | ||
53 | } | 185 | } |
54 | 186 | ||
55 | /* | 187 | static void gen_compare_and_swap_pair(DisasContext *s, int rs, int rt, |
188 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap_pair(DisasContext *s, int rs, int rt, | ||
189 | TCGv_i64 t2 = cpu_reg(s, rt + 1); | ||
190 | TCGv_i64 clean_addr; | ||
191 | int memidx = get_mem_index(s); | ||
192 | + MemOp memop; | ||
193 | |||
194 | if (rn == 31) { | ||
195 | gen_check_sp_alignment(s); | ||
196 | } | ||
197 | |||
198 | /* This is a single atomic access, despite the "pair". */ | ||
199 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, size + 1); | ||
200 | + memop = finalize_memop(s, (size + 1) | MO_ALIGN); | ||
201 | + clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, memop); | ||
202 | |||
203 | if (size == 2) { | ||
204 | TCGv_i64 cmp = tcg_temp_new_i64(); | ||
205 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap_pair(DisasContext *s, int rs, int rt, | ||
206 | tcg_gen_concat32_i64(cmp, s2, s1); | ||
207 | } | ||
208 | |||
209 | - tcg_gen_atomic_cmpxchg_i64(cmp, clean_addr, cmp, val, memidx, | ||
210 | - MO_64 | MO_ALIGN | s->be_data); | ||
211 | + tcg_gen_atomic_cmpxchg_i64(cmp, clean_addr, cmp, val, memidx, memop); | ||
212 | |||
213 | if (s->be_data == MO_LE) { | ||
214 | tcg_gen_extr32_i64(s1, s2, cmp); | ||
215 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap_pair(DisasContext *s, int rs, int rt, | ||
216 | tcg_gen_concat_i64_i128(cmp, s2, s1); | ||
217 | } | ||
218 | |||
219 | - tcg_gen_atomic_cmpxchg_i128(cmp, clean_addr, cmp, val, memidx, | ||
220 | - MO_128 | MO_ALIGN | s->be_data); | ||
221 | + tcg_gen_atomic_cmpxchg_i128(cmp, clean_addr, cmp, val, memidx, memop); | ||
222 | |||
223 | if (s->be_data == MO_LE) { | ||
224 | tcg_gen_extr_i128_i64(s1, s2, cmp); | ||
225 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
226 | /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
227 | memop = finalize_memop(s, size | MO_ALIGN); | ||
228 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
229 | - true, rn != 31, size); | ||
230 | + true, rn != 31, memop); | ||
231 | do_gpr_st(s, cpu_reg(s, rt), clean_addr, memop, true, rt, | ||
232 | disas_ldst_compute_iss_sf(size, false, 0), is_lasr); | ||
233 | return; | ||
234 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
235 | /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
236 | memop = finalize_memop(s, size | MO_ALIGN); | ||
237 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
238 | - false, rn != 31, size); | ||
239 | + false, rn != 31, memop); | ||
240 | do_gpr_ld(s, cpu_reg(s, rt), clean_addr, memop, false, true, | ||
241 | rt, disas_ldst_compute_iss_sf(size, false, 0), is_lasr); | ||
242 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_LDAQ); | ||
243 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_roffset(DisasContext *s, uint32_t insn, | ||
244 | tcg_gen_add_i64(dirty_addr, dirty_addr, tcg_rm); | ||
245 | |||
246 | memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
247 | - clean_addr = gen_mte_check1(s, dirty_addr, is_store, true, size); | ||
248 | + clean_addr = gen_mte_check1(s, dirty_addr, is_store, true, memop); | ||
249 | |||
250 | if (is_vector) { | ||
251 | if (is_store) { | ||
252 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_reg_unsigned_imm(DisasContext *s, uint32_t insn, | ||
253 | tcg_gen_addi_i64(dirty_addr, dirty_addr, offset); | ||
254 | |||
255 | memop = finalize_memop(s, size + is_signed * MO_SIGN); | ||
256 | - clean_addr = gen_mte_check1(s, dirty_addr, is_store, rn != 31, size); | ||
257 | + clean_addr = gen_mte_check1(s, dirty_addr, is_store, rn != 31, memop); | ||
258 | |||
259 | if (is_vector) { | ||
260 | if (is_store) { | ||
261 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_atomic(DisasContext *s, uint32_t insn, | ||
262 | if (rn == 31) { | ||
263 | gen_check_sp_alignment(s); | ||
264 | } | ||
265 | - clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), false, rn != 31, size); | ||
266 | + clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), false, rn != 31, mop); | ||
267 | |||
268 | if (o3_opc == 014) { | ||
269 | /* | ||
270 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pac(DisasContext *s, uint32_t insn, | ||
271 | |||
272 | /* Note that "clean" and "dirty" here refer to TBI not PAC. */ | ||
273 | clean_addr = gen_mte_check1(s, dirty_addr, false, | ||
274 | - is_wback || rn != 31, size); | ||
275 | + is_wback || rn != 31, memop); | ||
276 | |||
277 | tcg_rt = cpu_reg(s, rt); | ||
278 | do_gpr_ld(s, tcg_rt, clean_addr, memop, | ||
279 | diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c | ||
280 | index XXXXXXX..XXXXXXX 100644 | ||
281 | --- a/target/arm/tcg/translate-sve.c | ||
282 | +++ b/target/arm/tcg/translate-sve.c | ||
283 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1R_zpri(DisasContext *s, arg_rpri_load *a) | ||
284 | unsigned msz = dtype_msz(a->dtype); | ||
285 | TCGLabel *over; | ||
286 | TCGv_i64 temp, clean_addr; | ||
287 | + MemOp memop; | ||
288 | |||
289 | if (!dc_isar_feature(aa64_sve, s)) { | ||
290 | return false; | ||
291 | @@ -XXX,XX +XXX,XX @@ static bool trans_LD1R_zpri(DisasContext *s, arg_rpri_load *a) | ||
292 | /* Load the data. */ | ||
293 | temp = tcg_temp_new_i64(); | ||
294 | tcg_gen_addi_i64(temp, cpu_reg_sp(s, a->rn), a->imm << msz); | ||
295 | - clean_addr = gen_mte_check1(s, temp, false, true, msz); | ||
296 | |||
297 | - tcg_gen_qemu_ld_i64(temp, clean_addr, get_mem_index(s), | ||
298 | - finalize_memop(s, dtype_mop[a->dtype])); | ||
299 | + memop = finalize_memop(s, dtype_mop[a->dtype]); | ||
300 | + clean_addr = gen_mte_check1(s, temp, false, true, memop); | ||
301 | + tcg_gen_qemu_ld_i64(temp, clean_addr, get_mem_index(s), memop); | ||
302 | |||
303 | /* Broadcast to *all* elements. */ | ||
304 | tcg_gen_gvec_dup_i64(esz, vec_full_reg_offset(s, a->rd), | ||
56 | -- | 305 | -- |
57 | 2.25.1 | 306 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Move the checks out of the parsing loop and into the | 3 | Pass the individual memop to gen_mte_checkN. |
4 | restore function. This more closely mirrors the code | 4 | For the moment, do nothing with it. |
5 | structure in the kernel, and is slightly clearer. | ||
6 | |||
7 | Reject rather than silently skip incorrect VL and SVE record sizes, | ||
8 | bringing our checks in to line with those the kernel does. | ||
9 | 5 | ||
10 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
11 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
12 | Message-id: 20220708151540.18136-40-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-14-richard.henderson@linaro.org |
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
14 | --- | 10 | --- |
15 | linux-user/aarch64/signal.c | 51 +++++++++++++++++++++++++------------ | 11 | target/arm/tcg/translate-a64.h | 2 +- |
16 | 1 file changed, 35 insertions(+), 16 deletions(-) | 12 | target/arm/tcg/translate-a64.c | 31 +++++++++++++++++++------------ |
13 | target/arm/tcg/translate-sve.c | 4 ++-- | ||
14 | 3 files changed, 22 insertions(+), 15 deletions(-) | ||
17 | 15 | ||
18 | diff --git a/linux-user/aarch64/signal.c b/linux-user/aarch64/signal.c | 16 | diff --git a/target/arm/tcg/translate-a64.h b/target/arm/tcg/translate-a64.h |
19 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/linux-user/aarch64/signal.c | 18 | --- a/target/arm/tcg/translate-a64.h |
21 | +++ b/linux-user/aarch64/signal.c | 19 | +++ b/target/arm/tcg/translate-a64.h |
22 | @@ -XXX,XX +XXX,XX @@ static void target_restore_fpsimd_record(CPUARMState *env, | 20 | @@ -XXX,XX +XXX,XX @@ TCGv_i64 clean_data_tbi(DisasContext *s, TCGv_i64 addr); |
23 | } | 21 | TCGv_i64 gen_mte_check1(DisasContext *s, TCGv_i64 addr, bool is_write, |
24 | } | 22 | bool tag_checked, MemOp memop); |
25 | 23 | TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, | |
26 | -static void target_restore_sve_record(CPUARMState *env, | 24 | - bool tag_checked, int size); |
27 | - struct target_sve_context *sve, int vq) | 25 | + bool tag_checked, int total_size, MemOp memop); |
28 | +static bool target_restore_sve_record(CPUARMState *env, | 26 | |
29 | + struct target_sve_context *sve, | 27 | /* We should have at some point before trying to access an FP register |
30 | + int size) | 28 | * done the necessary access check, so assert that |
29 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/tcg/translate-a64.c | ||
32 | +++ b/target/arm/tcg/translate-a64.c | ||
33 | @@ -XXX,XX +XXX,XX @@ TCGv_i64 gen_mte_check1(DisasContext *s, TCGv_i64 addr, bool is_write, | ||
34 | * For MTE, check multiple logical sequential accesses. | ||
35 | */ | ||
36 | TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, | ||
37 | - bool tag_checked, int size) | ||
38 | + bool tag_checked, int total_size, MemOp single_mop) | ||
31 | { | 39 | { |
32 | - int i, j; | 40 | if (tag_checked && s->mte_active[0]) { |
33 | + int i, j, vl, vq; | 41 | TCGv_i64 ret; |
34 | 42 | @@ -XXX,XX +XXX,XX @@ TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, | |
35 | - /* Note that SVE regs are stored as a byte stream, with each byte element | 43 | desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); |
36 | + if (!cpu_isar_feature(aa64_sve, env_archcpu(env))) { | 44 | desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); |
37 | + return false; | 45 | desc = FIELD_DP32(desc, MTEDESC, WRITE, is_write); |
38 | + } | 46 | - desc = FIELD_DP32(desc, MTEDESC, SIZEM1, size - 1); |
39 | + | 47 | + desc = FIELD_DP32(desc, MTEDESC, SIZEM1, total_size - 1); |
40 | + __get_user(vl, &sve->vl); | 48 | |
41 | + vq = sve_vq(env); | 49 | ret = tcg_temp_new_i64(); |
42 | + | 50 | gen_helper_mte_check(ret, cpu_env, tcg_constant_i32(desc), addr); |
43 | + /* Reject mismatched VL. */ | 51 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) |
44 | + if (vl != vq * TARGET_SVE_VQ_BYTES) { | 52 | bool is_vector = extract32(insn, 26, 1); |
45 | + return false; | 53 | bool is_load = extract32(insn, 22, 1); |
46 | + } | 54 | int opc = extract32(insn, 30, 2); |
47 | + | 55 | - |
48 | + /* Accept empty record -- used to clear PSTATE.SM. */ | 56 | bool is_signed = false; |
49 | + if (size <= sizeof(*sve)) { | 57 | bool postindex = false; |
50 | + return true; | 58 | bool wback = false; |
51 | + } | 59 | bool set_tag = false; |
52 | + | 60 | - |
53 | + /* Reject non-empty but incomplete record. */ | 61 | TCGv_i64 clean_addr, dirty_addr; |
54 | + if (size < TARGET_SVE_SIG_CONTEXT_SIZE(vq)) { | 62 | - |
55 | + return false; | 63 | + MemOp mop; |
56 | + } | 64 | int size; |
57 | + | 65 | |
58 | + /* | 66 | if (opc == 3) { |
59 | + * Note that SVE regs are stored as a byte stream, with each byte element | 67 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) |
60 | * at a subsequent address. This corresponds to a little-endian load | ||
61 | * of our 64-bit hunks. | ||
62 | */ | ||
63 | @@ -XXX,XX +XXX,XX @@ static void target_restore_sve_record(CPUARMState *env, | ||
64 | } | ||
65 | } | 68 | } |
66 | } | 69 | } |
67 | + return true; | 70 | |
68 | } | 71 | + if (is_vector) { |
69 | 72 | + mop = finalize_memop_asimd(s, size); | |
70 | static int target_restore_sigframe(CPUARMState *env, | 73 | + } else { |
71 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 74 | + mop = finalize_memop(s, size); |
72 | struct target_sve_context *sve = NULL; | 75 | + } |
73 | uint64_t extra_datap = 0; | 76 | clean_addr = gen_mte_checkN(s, dirty_addr, !is_load, |
74 | bool used_extra = false; | 77 | - (wback || rn != 31) && !set_tag, 2 << size); |
75 | - int vq = 0, sve_size = 0; | 78 | + (wback || rn != 31) && !set_tag, |
76 | + int sve_size = 0; | 79 | + 2 << size, mop); |
77 | 80 | ||
78 | target_restore_general_frame(env, sf); | 81 | if (is_vector) { |
79 | 82 | - MemOp mop = finalize_memop_asimd(s, size); | |
80 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 83 | - |
81 | if (sve || size < sizeof(struct target_sve_context)) { | 84 | + /* LSE2 does not merge FP pairs; leave these as separate operations. */ |
82 | goto err; | 85 | if (is_load) { |
83 | } | 86 | do_fp_ld(s, rt, clean_addr, mop); |
84 | - if (cpu_isar_feature(aa64_sve, env_archcpu(env))) { | 87 | } else { |
85 | - vq = sve_vq(env); | 88 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) |
86 | - sve_size = QEMU_ALIGN_UP(TARGET_SVE_SIG_CONTEXT_SIZE(vq), 16); | 89 | } else { |
87 | - if (size == sve_size) { | 90 | TCGv_i64 tcg_rt = cpu_reg(s, rt); |
88 | - sve = (struct target_sve_context *)ctx; | 91 | TCGv_i64 tcg_rt2 = cpu_reg(s, rt2); |
89 | - break; | 92 | - MemOp mop = size + 1; |
90 | - } | 93 | |
91 | - } | 94 | /* |
92 | - goto err; | 95 | + * We built mop above for the single logical access -- rebuild it |
93 | + sve = (struct target_sve_context *)ctx; | 96 | + * now for the paired operation. |
94 | + sve_size = size; | 97 | + * |
95 | + break; | 98 | * With LSE2, non-sign-extending pairs are treated atomically if |
96 | 99 | * aligned, and if unaligned one of the pair will be completely | |
97 | case TARGET_EXTRA_MAGIC: | 100 | * within a 16-byte block and that element will be atomic. |
98 | if (extra || size != sizeof(struct target_extra_context)) { | 101 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_pair(DisasContext *s, uint32_t insn) |
99 | @@ -XXX,XX +XXX,XX @@ static int target_restore_sigframe(CPUARMState *env, | 102 | * This treats sign-extending loads like zero-extending loads, |
100 | } | 103 | * since that reuses the most code below. |
101 | 104 | */ | |
102 | /* SVE data, if present, overwrites FPSIMD data. */ | 105 | + mop = size + 1; |
103 | - if (sve) { | 106 | if (s->align_mem) { |
104 | - target_restore_sve_record(env, sve, vq); | 107 | mop |= (size == 2 ? MO_ALIGN_4 : MO_ALIGN_8); |
105 | + if (sve && !target_restore_sve_record(env, sve, sve_size)) { | 108 | } |
106 | + goto err; | 109 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_multiple_struct(DisasContext *s, uint32_t insn) |
107 | } | 110 | * promote consecutive little-endian elements below. |
108 | unlock_user(extra, extra_datap, 0); | 111 | */ |
109 | return 0; | 112 | clean_addr = gen_mte_checkN(s, tcg_rn, is_store, is_postidx || rn != 31, |
113 | - total); | ||
114 | + total, finalize_memop(s, size)); | ||
115 | |||
116 | /* | ||
117 | * Consecutive little-endian elements from a single register | ||
118 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_single_struct(DisasContext *s, uint32_t insn) | ||
119 | total = selem << scale; | ||
120 | tcg_rn = cpu_reg_sp(s, rn); | ||
121 | |||
122 | - clean_addr = gen_mte_checkN(s, tcg_rn, !is_load, is_postidx || rn != 31, | ||
123 | - total); | ||
124 | mop = finalize_memop(s, scale); | ||
125 | |||
126 | + clean_addr = gen_mte_checkN(s, tcg_rn, !is_load, is_postidx || rn != 31, | ||
127 | + total, mop); | ||
128 | + | ||
129 | tcg_ebytes = tcg_constant_i64(1 << scale); | ||
130 | for (xs = 0; xs < selem; xs++) { | ||
131 | if (replicate) { | ||
132 | diff --git a/target/arm/tcg/translate-sve.c b/target/arm/tcg/translate-sve.c | ||
133 | index XXXXXXX..XXXXXXX 100644 | ||
134 | --- a/target/arm/tcg/translate-sve.c | ||
135 | +++ b/target/arm/tcg/translate-sve.c | ||
136 | @@ -XXX,XX +XXX,XX @@ void gen_sve_ldr(DisasContext *s, TCGv_ptr base, int vofs, | ||
137 | |||
138 | dirty_addr = tcg_temp_new_i64(); | ||
139 | tcg_gen_addi_i64(dirty_addr, cpu_reg_sp(s, rn), imm); | ||
140 | - clean_addr = gen_mte_checkN(s, dirty_addr, false, rn != 31, len); | ||
141 | + clean_addr = gen_mte_checkN(s, dirty_addr, false, rn != 31, len, MO_8); | ||
142 | |||
143 | /* | ||
144 | * Note that unpredicated load/store of vector/predicate registers | ||
145 | @@ -XXX,XX +XXX,XX @@ void gen_sve_str(DisasContext *s, TCGv_ptr base, int vofs, | ||
146 | |||
147 | dirty_addr = tcg_temp_new_i64(); | ||
148 | tcg_gen_addi_i64(dirty_addr, cpu_reg_sp(s, rn), imm); | ||
149 | - clean_addr = gen_mte_checkN(s, dirty_addr, false, rn != 31, len); | ||
150 | + clean_addr = gen_mte_checkN(s, dirty_addr, false, rn != 31, len, MO_8); | ||
151 | |||
152 | /* Note that unpredicated load/store of vector/predicate registers | ||
153 | * are defined as a stream of bytes, which equates to little-endian | ||
110 | -- | 154 | -- |
111 | 2.25.1 | 155 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | We can reuse the SVE functions for LDR and STR, passing in the | 3 | Fixes a bug in that with SCTLR.A set, we should raise any |
4 | base of the ZA vector and a zero offset. | 4 | alignment fault before raising any MTE check fault. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-23-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-15-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme.decode | 7 +++++++ | 11 | target/arm/internals.h | 3 ++- |
12 | target/arm/translate-sme.c | 24 ++++++++++++++++++++++++ | 12 | target/arm/tcg/mte_helper.c | 18 ++++++++++++++++++ |
13 | 2 files changed, 31 insertions(+) | 13 | target/arm/tcg/translate-a64.c | 2 ++ |
14 | 3 files changed, 22 insertions(+), 1 deletion(-) | ||
14 | 15 | ||
15 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | 16 | diff --git a/target/arm/internals.h b/target/arm/internals.h |
16 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme.decode | 18 | --- a/target/arm/internals.h |
18 | +++ b/target/arm/sme.decode | 19 | +++ b/target/arm/internals.h |
19 | @@ -XXX,XX +XXX,XX @@ LDST1 1110000 0 esz:2 st:1 rm:5 v:1 .. pg:3 rn:5 0 za_imm:4 \ | 20 | @@ -XXX,XX +XXX,XX @@ FIELD(MTEDESC, MIDX, 0, 4) |
20 | &ldst rs=%mova_rs | 21 | FIELD(MTEDESC, TBI, 4, 2) |
21 | LDST1 1110000 111 st:1 rm:5 v:1 .. pg:3 rn:5 0 za_imm:4 \ | 22 | FIELD(MTEDESC, TCMA, 6, 2) |
22 | &ldst esz=4 rs=%mova_rs | 23 | FIELD(MTEDESC, WRITE, 8, 1) |
23 | + | 24 | -FIELD(MTEDESC, SIZEM1, 9, SIMD_DATA_BITS - 9) /* size - 1 */ |
24 | +&ldstr rv rn imm | 25 | +FIELD(MTEDESC, ALIGN, 9, 3) |
25 | +@ldstr ....... ... . ...... .. ... rn:5 . imm:4 \ | 26 | +FIELD(MTEDESC, SIZEM1, 12, SIMD_DATA_BITS - 12) /* size - 1 */ |
26 | + &ldstr rv=%mova_rs | 27 | |
27 | + | 28 | bool mte_probe(CPUARMState *env, uint32_t desc, uint64_t ptr); |
28 | +LDR 1110000 100 0 000000 .. 000 ..... 0 .... @ldstr | 29 | uint64_t mte_check(CPUARMState *env, uint32_t desc, uint64_t ptr, uintptr_t ra); |
29 | +STR 1110000 100 1 000000 .. 000 ..... 0 .... @ldstr | 30 | diff --git a/target/arm/tcg/mte_helper.c b/target/arm/tcg/mte_helper.c |
30 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | ||
31 | index XXXXXXX..XXXXXXX 100644 | 31 | index XXXXXXX..XXXXXXX 100644 |
32 | --- a/target/arm/translate-sme.c | 32 | --- a/target/arm/tcg/mte_helper.c |
33 | +++ b/target/arm/translate-sme.c | 33 | +++ b/target/arm/tcg/mte_helper.c |
34 | @@ -XXX,XX +XXX,XX @@ static bool trans_LDST1(DisasContext *s, arg_LDST1 *a) | 34 | @@ -XXX,XX +XXX,XX @@ uint64_t mte_check(CPUARMState *env, uint32_t desc, uint64_t ptr, uintptr_t ra) |
35 | tcg_temp_free_i64(addr); | 35 | |
36 | return true; | 36 | uint64_t HELPER(mte_check)(CPUARMState *env, uint32_t desc, uint64_t ptr) |
37 | } | 37 | { |
38 | + | 38 | + /* |
39 | +typedef void GenLdStR(DisasContext *, TCGv_ptr, int, int, int, int); | 39 | + * R_XCHFJ: Alignment check not caused by memory type is priority 1, |
40 | + | 40 | + * higher than any translation fault. When MTE is disabled, tcg |
41 | +static bool do_ldst_r(DisasContext *s, arg_ldstr *a, GenLdStR *fn) | 41 | + * performs the alignment check during the code generated for the |
42 | +{ | 42 | + * memory access. With MTE enabled, we must check this here before |
43 | + int svl = streaming_vec_reg_size(s); | 43 | + * raising any translation fault in allocation_tag_mem. |
44 | + int imm = a->imm; | 44 | + */ |
45 | + TCGv_ptr base; | 45 | + unsigned align = FIELD_EX32(desc, MTEDESC, ALIGN); |
46 | + | 46 | + if (unlikely(align)) { |
47 | + if (!sme_za_enabled_check(s)) { | 47 | + align = (1u << align) - 1; |
48 | + return true; | 48 | + if (unlikely(ptr & align)) { |
49 | + int idx = FIELD_EX32(desc, MTEDESC, MIDX); | ||
50 | + bool w = FIELD_EX32(desc, MTEDESC, WRITE); | ||
51 | + MMUAccessType type = w ? MMU_DATA_STORE : MMU_DATA_LOAD; | ||
52 | + arm_cpu_do_unaligned_access(env_cpu(env), ptr, type, idx, GETPC()); | ||
53 | + } | ||
49 | + } | 54 | + } |
50 | + | 55 | + |
51 | + /* ZA[n] equates to ZA0H.B[n]. */ | 56 | return mte_check(env, desc, ptr, GETPC()); |
52 | + base = get_tile_rowcol(s, MO_8, a->rv, imm, false); | 57 | } |
53 | + | 58 | |
54 | + fn(s, base, 0, svl, a->rn, imm * svl); | 59 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
55 | + | 60 | index XXXXXXX..XXXXXXX 100644 |
56 | + tcg_temp_free_ptr(base); | 61 | --- a/target/arm/tcg/translate-a64.c |
57 | + return true; | 62 | +++ b/target/arm/tcg/translate-a64.c |
58 | +} | 63 | @@ -XXX,XX +XXX,XX @@ static TCGv_i64 gen_mte_check1_mmuidx(DisasContext *s, TCGv_i64 addr, |
59 | + | 64 | desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); |
60 | +TRANS_FEAT(LDR, aa64_sme, do_ldst_r, a, gen_sve_ldr) | 65 | desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); |
61 | +TRANS_FEAT(STR, aa64_sme, do_ldst_r, a, gen_sve_str) | 66 | desc = FIELD_DP32(desc, MTEDESC, WRITE, is_write); |
67 | + desc = FIELD_DP32(desc, MTEDESC, ALIGN, get_alignment_bits(memop)); | ||
68 | desc = FIELD_DP32(desc, MTEDESC, SIZEM1, memop_size(memop) - 1); | ||
69 | |||
70 | ret = tcg_temp_new_i64(); | ||
71 | @@ -XXX,XX +XXX,XX @@ TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, | ||
72 | desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); | ||
73 | desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); | ||
74 | desc = FIELD_DP32(desc, MTEDESC, WRITE, is_write); | ||
75 | + desc = FIELD_DP32(desc, MTEDESC, ALIGN, get_alignment_bits(single_mop)); | ||
76 | desc = FIELD_DP32(desc, MTEDESC, SIZEM1, total_size - 1); | ||
77 | |||
78 | ret = tcg_temp_new_i64(); | ||
62 | -- | 79 | -- |
63 | 2.25.1 | 80 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | |||
3 | This new behaviour is in the ARM pseudocode function | ||
4 | AArch64.CheckFPAdvSIMDEnabled, which applies to AArch32 | ||
5 | via AArch32.CheckAdvSIMDOrFPEnabled when the EL to which | ||
6 | the trap would be delivered is in AArch64 mode. | ||
7 | |||
8 | Given that ARMv9 drops support for AArch32 outside EL0, the trap EL | ||
9 | detection ought to be trivially true, but the pseudocode still contains | ||
10 | a number of conditions, and QEMU has not yet committed to dropping A32 | ||
11 | support for EL[12] when v9 features are present. | ||
12 | |||
13 | Since the computation of SME_TRAP_NONSTREAMING is necessarily different | ||
14 | for the two modes, we might as well preserve bits within TBFLAG_ANY and | ||
15 | allocate separate bits within TBFLAG_A32 and TBFLAG_A64 instead. | ||
16 | |||
17 | Note that DDI0616A.a has typos for bits [22:21] of LD1RO in the table | ||
18 | of instructions illegal in streaming mode. | ||
19 | 2 | ||
20 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
21 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
22 | Message-id: 20220708151540.18136-4-richard.henderson@linaro.org | 5 | Message-id: 20230530191438.411344-16-richard.henderson@linaro.org |
23 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
24 | --- | 7 | --- |
25 | target/arm/cpu.h | 7 +++ | 8 | target/arm/cpu.h | 3 ++- |
26 | target/arm/translate.h | 4 ++ | 9 | target/arm/tcg/translate.h | 2 ++ |
27 | target/arm/sme-fa64.decode | 90 ++++++++++++++++++++++++++++++++++++++ | 10 | target/arm/tcg/hflags.c | 6 ++++++ |
28 | target/arm/helper.c | 41 +++++++++++++++++ | 11 | target/arm/tcg/translate-a64.c | 1 + |
29 | target/arm/translate-a64.c | 40 ++++++++++++++++- | 12 | 4 files changed, 11 insertions(+), 1 deletion(-) |
30 | target/arm/translate-vfp.c | 12 +++++ | ||
31 | target/arm/translate.c | 2 + | ||
32 | target/arm/meson.build | 1 + | ||
33 | 8 files changed, 195 insertions(+), 2 deletions(-) | ||
34 | create mode 100644 target/arm/sme-fa64.decode | ||
35 | 13 | ||
36 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | 14 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
37 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
38 | --- a/target/arm/cpu.h | 16 | --- a/target/arm/cpu.h |
39 | +++ b/target/arm/cpu.h | 17 | +++ b/target/arm/cpu.h |
40 | @@ -XXX,XX +XXX,XX @@ FIELD(TBFLAG_A32, HSTR_ACTIVE, 9, 1) | 18 | @@ -XXX,XX +XXX,XX @@ void pmu_init(ARMCPU *cpu); |
41 | * the same thing as the current security state of the processor! | 19 | #define SCTLR_D (1U << 5) /* up to v5; RAO in v6 */ |
42 | */ | 20 | #define SCTLR_CP15BEN (1U << 5) /* v7 onward */ |
43 | FIELD(TBFLAG_A32, NS, 10, 1) | 21 | #define SCTLR_L (1U << 6) /* up to v5; RAO in v6 and v7; RAZ in v8 */ |
44 | +/* | 22 | -#define SCTLR_nAA (1U << 6) /* when v8.4-LSE is implemented */ |
45 | + * Indicates that SME Streaming mode is active, and SMCR_ELx.FA64 is not. | 23 | +#define SCTLR_nAA (1U << 6) /* when FEAT_LSE2 is implemented */ |
46 | + * This requires an SME trap from AArch32 mode when using NEON. | 24 | #define SCTLR_B (1U << 7) /* up to v6; RAZ in v7 */ |
47 | + */ | 25 | #define SCTLR_ITD (1U << 7) /* v8 onward */ |
48 | +FIELD(TBFLAG_A32, SME_TRAP_NONSTREAMING, 11, 1) | 26 | #define SCTLR_S (1U << 8) /* up to v6; RAZ in v7 */ |
49 | 27 | @@ -XXX,XX +XXX,XX @@ FIELD(TBFLAG_A64, SVL, 24, 4) | |
50 | /* | 28 | /* Indicates that SME Streaming mode is active, and SMCR_ELx.FA64 is not. */ |
51 | * Bit usage when in AArch32 state, for M-profile only. | 29 | FIELD(TBFLAG_A64, SME_TRAP_NONSTREAMING, 28, 1) |
52 | @@ -XXX,XX +XXX,XX @@ FIELD(TBFLAG_A64, SMEEXC_EL, 20, 2) | 30 | FIELD(TBFLAG_A64, FGT_ERET, 29, 1) |
53 | FIELD(TBFLAG_A64, PSTATE_SM, 22, 1) | 31 | +FIELD(TBFLAG_A64, NAA, 30, 1) |
54 | FIELD(TBFLAG_A64, PSTATE_ZA, 23, 1) | ||
55 | FIELD(TBFLAG_A64, SVL, 24, 4) | ||
56 | +/* Indicates that SME Streaming mode is active, and SMCR_ELx.FA64 is not. */ | ||
57 | +FIELD(TBFLAG_A64, SME_TRAP_NONSTREAMING, 28, 1) | ||
58 | 32 | ||
59 | /* | 33 | /* |
60 | * Helpers for using the above. | 34 | * Helpers for using the above. |
61 | diff --git a/target/arm/translate.h b/target/arm/translate.h | 35 | diff --git a/target/arm/tcg/translate.h b/target/arm/tcg/translate.h |
62 | index XXXXXXX..XXXXXXX 100644 | 36 | index XXXXXXX..XXXXXXX 100644 |
63 | --- a/target/arm/translate.h | 37 | --- a/target/arm/tcg/translate.h |
64 | +++ b/target/arm/translate.h | 38 | +++ b/target/arm/tcg/translate.h |
65 | @@ -XXX,XX +XXX,XX @@ typedef struct DisasContext { | 39 | @@ -XXX,XX +XXX,XX @@ typedef struct DisasContext { |
66 | bool pstate_sm; | 40 | bool fgt_eret; |
67 | /* True if PSTATE.ZA is set. */ | 41 | /* True if fine-grained trap on SVC is enabled */ |
68 | bool pstate_za; | 42 | bool fgt_svc; |
69 | + /* True if non-streaming insns should raise an SME Streaming exception. */ | 43 | + /* True if FEAT_LSE2 SCTLR_ELx.nAA is set */ |
70 | + bool sme_trap_nonstreaming; | 44 | + bool naa; |
71 | + /* True if the current instruction is non-streaming. */ | ||
72 | + bool is_nonstreaming; | ||
73 | /* True if MVE insns are definitely not predicated by VPR or LTPSIZE */ | ||
74 | bool mve_no_pred; | ||
75 | /* | 45 | /* |
76 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 46 | * >= 0, a copy of PSTATE.BTYPE, which will be 0 without v8.5-BTI. |
77 | new file mode 100644 | 47 | * < 0, set by the current instruction. |
78 | index XXXXXXX..XXXXXXX | 48 | diff --git a/target/arm/tcg/hflags.c b/target/arm/tcg/hflags.c |
79 | --- /dev/null | ||
80 | +++ b/target/arm/sme-fa64.decode | ||
81 | @@ -XXX,XX +XXX,XX @@ | ||
82 | +# AArch64 SME allowed instruction decoding | ||
83 | +# | ||
84 | +# Copyright (c) 2022 Linaro, Ltd | ||
85 | +# | ||
86 | +# This library is free software; you can redistribute it and/or | ||
87 | +# modify it under the terms of the GNU Lesser General Public | ||
88 | +# License as published by the Free Software Foundation; either | ||
89 | +# version 2.1 of the License, or (at your option) any later version. | ||
90 | +# | ||
91 | +# This library is distributed in the hope that it will be useful, | ||
92 | +# but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
93 | +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
94 | +# Lesser General Public License for more details. | ||
95 | +# | ||
96 | +# You should have received a copy of the GNU Lesser General Public | ||
97 | +# License along with this library; if not, see <http://www.gnu.org/licenses/>. | ||
98 | + | ||
99 | +# | ||
100 | +# This file is processed by scripts/decodetree.py | ||
101 | +# | ||
102 | + | ||
103 | +# These patterns are taken from Appendix E1.1 of DDI0616 A.a, | ||
104 | +# Arm Architecture Reference Manual Supplement, | ||
105 | +# The Scalable Matrix Extension (SME), for Armv9-A | ||
106 | + | ||
107 | +{ | ||
108 | + [ | ||
109 | + OK 0-00 1110 0000 0001 0010 11-- ---- ---- # SMOV W|Xd,Vn.B[0] | ||
110 | + OK 0-00 1110 0000 0010 0010 11-- ---- ---- # SMOV W|Xd,Vn.H[0] | ||
111 | + OK 0100 1110 0000 0100 0010 11-- ---- ---- # SMOV Xd,Vn.S[0] | ||
112 | + OK 0000 1110 0000 0001 0011 11-- ---- ---- # UMOV Wd,Vn.B[0] | ||
113 | + OK 0000 1110 0000 0010 0011 11-- ---- ---- # UMOV Wd,Vn.H[0] | ||
114 | + OK 0000 1110 0000 0100 0011 11-- ---- ---- # UMOV Wd,Vn.S[0] | ||
115 | + OK 0100 1110 0000 1000 0011 11-- ---- ---- # UMOV Xd,Vn.D[0] | ||
116 | + ] | ||
117 | + FAIL 0--0 111- ---- ---- ---- ---- ---- ---- # Advanced SIMD vector operations | ||
118 | +} | ||
119 | + | ||
120 | +{ | ||
121 | + [ | ||
122 | + OK 0101 1110 --1- ---- 11-1 11-- ---- ---- # FMULX/FRECPS/FRSQRTS (scalar) | ||
123 | + OK 0101 1110 -10- ---- 00-1 11-- ---- ---- # FMULX/FRECPS/FRSQRTS (scalar, FP16) | ||
124 | + OK 01-1 1110 1-10 0001 11-1 10-- ---- ---- # FRECPE/FRSQRTE/FRECPX (scalar) | ||
125 | + OK 01-1 1110 1111 1001 11-1 10-- ---- ---- # FRECPE/FRSQRTE/FRECPX (scalar, FP16) | ||
126 | + ] | ||
127 | + FAIL 01-1 111- ---- ---- ---- ---- ---- ---- # Advanced SIMD single-element operations | ||
128 | +} | ||
129 | + | ||
130 | +FAIL 0-00 110- ---- ---- ---- ---- ---- ---- # Advanced SIMD structure load/store | ||
131 | +FAIL 1100 1110 ---- ---- ---- ---- ---- ---- # Advanced SIMD cryptography extensions | ||
132 | +FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | ||
133 | + | ||
134 | +# These are the "avoidance of doubt" final table of Illegal Advanced SIMD instructions | ||
135 | +# We don't actually need to include these, as the default is OK. | ||
136 | +# -001 111- ---- ---- ---- ---- ---- ---- # Scalar floating-point operations | ||
137 | +# --10 110- ---- ---- ---- ---- ---- ---- # Load/store pair of FP registers | ||
138 | +# --01 1100 ---- ---- ---- ---- ---- ---- # Load FP register (PC-relative literal) | ||
139 | +# --11 1100 --0- ---- ---- ---- ---- ---- # Load/store FP register (unscaled imm) | ||
140 | +# --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | ||
141 | +# --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | ||
142 | + | ||
143 | +FAIL 0000 0100 --1- ---- 1010 ---- ---- ---- # ADR | ||
144 | +FAIL 0000 0100 --1- ---- 1011 -0-- ---- ---- # FTSSEL, FEXPA | ||
145 | +FAIL 0000 0101 --10 0001 100- ---- ---- ---- # COMPACT | ||
146 | +FAIL 0010 0101 --01 100- 1111 000- ---0 ---- # RDFFR, RDFFRS | ||
147 | +FAIL 0010 0101 --10 1--- 1001 ---- ---- ---- # WRFFR, SETFFR | ||
148 | +FAIL 0100 0101 --0- ---- 1011 ---- ---- ---- # BDEP, BEXT, BGRP | ||
149 | +FAIL 0100 0101 000- ---- 0110 1--- ---- ---- # PMULLB, PMULLT (128b result) | ||
150 | +FAIL 0110 0100 --1- ---- 1110 01-- ---- ---- # FMMLA, BFMMLA | ||
151 | +FAIL 0110 0101 --0- ---- 0000 11-- ---- ---- # FTSMUL | ||
152 | +FAIL 0110 0101 --01 0--- 100- ---- ---- ---- # FTMAD | ||
153 | +FAIL 0110 0101 --01 1--- 001- ---- ---- ---- # FADDA | ||
154 | +FAIL 0100 0101 --0- ---- 1001 10-- ---- ---- # SMMLA, UMMLA, USMMLA | ||
155 | +FAIL 0100 0101 --1- ---- 1--- ---- ---- ---- # SVE2 string/histo/crypto instructions | ||
156 | +FAIL 1000 010- -00- ---- 10-- ---- ---- ---- # SVE2 32-bit gather NT load (vector+scalar) | ||
157 | +FAIL 1000 010- -00- ---- 111- ---- ---- ---- # SVE 32-bit gather prefetch (vector+imm) | ||
158 | +FAIL 1000 0100 0-1- ---- 0--- ---- ---- ---- # SVE 32-bit gather prefetch (scalar+vector) | ||
159 | +FAIL 1000 010- -01- ---- 1--- ---- ---- ---- # SVE 32-bit gather load (vector+imm) | ||
160 | +FAIL 1000 0100 0-0- ---- 0--- ---- ---- ---- # SVE 32-bit gather load byte (scalar+vector) | ||
161 | +FAIL 1000 0100 1--- ---- 0--- ---- ---- ---- # SVE 32-bit gather load half (scalar+vector) | ||
162 | +FAIL 1000 0101 0--- ---- 0--- ---- ---- ---- # SVE 32-bit gather load word (scalar+vector) | ||
163 | +FAIL 1010 010- ---- ---- 011- ---- ---- ---- # SVE contiguous FF load (scalar+scalar) | ||
164 | +FAIL 1010 010- ---1 ---- 101- ---- ---- ---- # SVE contiguous NF load (scalar+imm) | ||
165 | +FAIL 1010 010- -01- ---- 000- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+scalar) | ||
166 | +FAIL 1010 010- -010 ---- 001- ---- ---- ---- # SVE load & replicate 32 bytes (scalar+imm) | ||
167 | +FAIL 1100 010- ---- ---- ---- ---- ---- ---- # SVE 64-bit gather load/prefetch | ||
168 | +FAIL 1110 010- -00- ---- 001- ---- ---- ---- # SVE2 64-bit scatter NT store (vector+scalar) | ||
169 | +FAIL 1110 010- -10- ---- 001- ---- ---- ---- # SVE2 32-bit scatter NT store (vector+scalar) | ||
170 | +FAIL 1110 010- ---- ---- 1-0- ---- ---- ---- # SVE scatter store (scalar+32-bit vector) | ||
171 | +FAIL 1110 010- ---- ---- 101- ---- ---- ---- # SVE scatter store (misc) | ||
172 | diff --git a/target/arm/helper.c b/target/arm/helper.c | ||
173 | index XXXXXXX..XXXXXXX 100644 | 49 | index XXXXXXX..XXXXXXX 100644 |
174 | --- a/target/arm/helper.c | 50 | --- a/target/arm/tcg/hflags.c |
175 | +++ b/target/arm/helper.c | 51 | +++ b/target/arm/tcg/hflags.c |
176 | @@ -XXX,XX +XXX,XX @@ int sme_exception_el(CPUARMState *env, int el) | 52 | @@ -XXX,XX +XXX,XX @@ static CPUARMTBFlags rebuild_hflags_a64(CPUARMState *env, int el, int fp_el, |
177 | return 0; | 53 | } |
178 | } | 54 | } |
179 | 55 | ||
180 | +/* This corresponds to the ARM pseudocode function IsFullA64Enabled(). */ | 56 | + if (cpu_isar_feature(aa64_lse2, env_archcpu(env))) { |
181 | +static bool sme_fa64(CPUARMState *env, int el) | 57 | + if (sctlr & SCTLR_nAA) { |
182 | +{ | 58 | + DP_TBFLAG_A64(flags, NAA, 1); |
183 | + if (!cpu_isar_feature(aa64_sme_fa64, env_archcpu(env))) { | ||
184 | + return false; | ||
185 | + } | ||
186 | + | ||
187 | + if (el <= 1 && !el_is_in_host(env, el)) { | ||
188 | + if (!FIELD_EX64(env->vfp.smcr_el[1], SMCR, FA64)) { | ||
189 | + return false; | ||
190 | + } | ||
191 | + } | ||
192 | + if (el <= 2 && arm_is_el2_enabled(env)) { | ||
193 | + if (!FIELD_EX64(env->vfp.smcr_el[2], SMCR, FA64)) { | ||
194 | + return false; | ||
195 | + } | ||
196 | + } | ||
197 | + if (arm_feature(env, ARM_FEATURE_EL3)) { | ||
198 | + if (!FIELD_EX64(env->vfp.smcr_el[3], SMCR, FA64)) { | ||
199 | + return false; | ||
200 | + } | 59 | + } |
201 | + } | 60 | + } |
202 | + | 61 | + |
203 | + return true; | 62 | /* Compute the condition for using AccType_UNPRIV for LDTR et al. */ |
204 | +} | 63 | if (!(env->pstate & PSTATE_UAO)) { |
205 | + | 64 | switch (mmu_idx) { |
206 | /* | 65 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
207 | * Given that SVE is enabled, return the vector length for EL. | ||
208 | */ | ||
209 | @@ -XXX,XX +XXX,XX @@ static CPUARMTBFlags rebuild_hflags_a32(CPUARMState *env, int fp_el, | ||
210 | DP_TBFLAG_ANY(flags, PSTATE__IL, 1); | ||
211 | } | ||
212 | |||
213 | + /* | ||
214 | + * The SME exception we are testing for is raised via | ||
215 | + * AArch64.CheckFPAdvSIMDEnabled(), as called from | ||
216 | + * AArch32.CheckAdvSIMDOrFPEnabled(). | ||
217 | + */ | ||
218 | + if (el == 0 | ||
219 | + && FIELD_EX64(env->svcr, SVCR, SM) | ||
220 | + && (!arm_is_el2_enabled(env) | ||
221 | + || (arm_el_is_aa64(env, 2) && !(env->cp15.hcr_el2 & HCR_TGE))) | ||
222 | + && arm_el_is_aa64(env, 1) | ||
223 | + && !sme_fa64(env, el)) { | ||
224 | + DP_TBFLAG_A32(flags, SME_TRAP_NONSTREAMING, 1); | ||
225 | + } | ||
226 | + | ||
227 | return rebuild_hflags_common_32(env, fp_el, mmu_idx, flags); | ||
228 | } | ||
229 | |||
230 | @@ -XXX,XX +XXX,XX @@ static CPUARMTBFlags rebuild_hflags_a64(CPUARMState *env, int el, int fp_el, | ||
231 | } | ||
232 | if (FIELD_EX64(env->svcr, SVCR, SM)) { | ||
233 | DP_TBFLAG_A64(flags, PSTATE_SM, 1); | ||
234 | + DP_TBFLAG_A64(flags, SME_TRAP_NONSTREAMING, !sme_fa64(env, el)); | ||
235 | } | ||
236 | DP_TBFLAG_A64(flags, PSTATE_ZA, FIELD_EX64(env->svcr, SVCR, ZA)); | ||
237 | } | ||
238 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
239 | index XXXXXXX..XXXXXXX 100644 | 66 | index XXXXXXX..XXXXXXX 100644 |
240 | --- a/target/arm/translate-a64.c | 67 | --- a/target/arm/tcg/translate-a64.c |
241 | +++ b/target/arm/translate-a64.c | 68 | +++ b/target/arm/tcg/translate-a64.c |
242 | @@ -XXX,XX +XXX,XX @@ static void do_vec_ld(DisasContext *s, int destidx, int element, | ||
243 | * unallocated-encoding checks (otherwise the syndrome information | ||
244 | * for the resulting exception will be incorrect). | ||
245 | */ | ||
246 | -static bool fp_access_check(DisasContext *s) | ||
247 | +static bool fp_access_check_only(DisasContext *s) | ||
248 | { | ||
249 | if (s->fp_excp_el) { | ||
250 | assert(!s->fp_access_checked); | ||
251 | @@ -XXX,XX +XXX,XX @@ static bool fp_access_check(DisasContext *s) | ||
252 | return true; | ||
253 | } | ||
254 | |||
255 | +static bool fp_access_check(DisasContext *s) | ||
256 | +{ | ||
257 | + if (!fp_access_check_only(s)) { | ||
258 | + return false; | ||
259 | + } | ||
260 | + if (s->sme_trap_nonstreaming && s->is_nonstreaming) { | ||
261 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
262 | + syn_smetrap(SME_ET_Streaming, false)); | ||
263 | + return false; | ||
264 | + } | ||
265 | + return true; | ||
266 | +} | ||
267 | + | ||
268 | /* Check that SVE access is enabled. If it is, return true. | ||
269 | * If not, emit code to generate an appropriate exception and return false. | ||
270 | */ | ||
271 | @@ -XXX,XX +XXX,XX @@ static void handle_sys(DisasContext *s, uint32_t insn, bool isread, | ||
272 | default: | ||
273 | g_assert_not_reached(); | ||
274 | } | ||
275 | - if ((ri->type & ARM_CP_FPU) && !fp_access_check(s)) { | ||
276 | + if ((ri->type & ARM_CP_FPU) && !fp_access_check_only(s)) { | ||
277 | return; | ||
278 | } else if ((ri->type & ARM_CP_SVE) && !sve_access_check(s)) { | ||
279 | return; | ||
280 | @@ -XXX,XX +XXX,XX @@ static void disas_data_proc_simd_fp(DisasContext *s, uint32_t insn) | ||
281 | } | ||
282 | } | ||
283 | |||
284 | +/* | ||
285 | + * Include the generated SME FA64 decoder. | ||
286 | + */ | ||
287 | + | ||
288 | +#include "decode-sme-fa64.c.inc" | ||
289 | + | ||
290 | +static bool trans_OK(DisasContext *s, arg_OK *a) | ||
291 | +{ | ||
292 | + return true; | ||
293 | +} | ||
294 | + | ||
295 | +static bool trans_FAIL(DisasContext *s, arg_OK *a) | ||
296 | +{ | ||
297 | + s->is_nonstreaming = true; | ||
298 | + return true; | ||
299 | +} | ||
300 | + | ||
301 | /** | ||
302 | * is_guarded_page: | ||
303 | * @env: The cpu environment | ||
304 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_init_disas_context(DisasContextBase *dcbase, | 69 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_init_disas_context(DisasContextBase *dcbase, |
305 | dc->mte_active[1] = EX_TBFLAG_A64(tb_flags, MTE0_ACTIVE); | ||
306 | dc->pstate_sm = EX_TBFLAG_A64(tb_flags, PSTATE_SM); | 70 | dc->pstate_sm = EX_TBFLAG_A64(tb_flags, PSTATE_SM); |
307 | dc->pstate_za = EX_TBFLAG_A64(tb_flags, PSTATE_ZA); | 71 | dc->pstate_za = EX_TBFLAG_A64(tb_flags, PSTATE_ZA); |
308 | + dc->sme_trap_nonstreaming = EX_TBFLAG_A64(tb_flags, SME_TRAP_NONSTREAMING); | 72 | dc->sme_trap_nonstreaming = EX_TBFLAG_A64(tb_flags, SME_TRAP_NONSTREAMING); |
73 | + dc->naa = EX_TBFLAG_A64(tb_flags, NAA); | ||
309 | dc->vec_len = 0; | 74 | dc->vec_len = 0; |
310 | dc->vec_stride = 0; | 75 | dc->vec_stride = 0; |
311 | dc->cp_regs = arm_cpu->cp_regs; | 76 | dc->cp_regs = arm_cpu->cp_regs; |
312 | @@ -XXX,XX +XXX,XX @@ static void aarch64_tr_translate_insn(DisasContextBase *dcbase, CPUState *cpu) | ||
313 | } | ||
314 | } | ||
315 | |||
316 | + s->is_nonstreaming = false; | ||
317 | + if (s->sme_trap_nonstreaming) { | ||
318 | + disas_sme_fa64(s, insn); | ||
319 | + } | ||
320 | + | ||
321 | switch (extract32(insn, 25, 4)) { | ||
322 | case 0x0: | ||
323 | if (!extract32(insn, 31, 1) || !disas_sme(s, insn)) { | ||
324 | diff --git a/target/arm/translate-vfp.c b/target/arm/translate-vfp.c | ||
325 | index XXXXXXX..XXXXXXX 100644 | ||
326 | --- a/target/arm/translate-vfp.c | ||
327 | +++ b/target/arm/translate-vfp.c | ||
328 | @@ -XXX,XX +XXX,XX @@ static bool vfp_access_check_a(DisasContext *s, bool ignore_vfp_enabled) | ||
329 | return false; | ||
330 | } | ||
331 | |||
332 | + /* | ||
333 | + * Note that rebuild_hflags_a32 has already accounted for being in EL0 | ||
334 | + * and the higher EL in A64 mode, etc. Unlike A64 mode, there do not | ||
335 | + * appear to be any insns which touch VFP which are allowed. | ||
336 | + */ | ||
337 | + if (s->sme_trap_nonstreaming) { | ||
338 | + gen_exception_insn(s, s->pc_curr, EXCP_UDEF, | ||
339 | + syn_smetrap(SME_ET_Streaming, | ||
340 | + s->base.pc_next - s->pc_curr == 2)); | ||
341 | + return false; | ||
342 | + } | ||
343 | + | ||
344 | if (!s->vfp_enabled && !ignore_vfp_enabled) { | ||
345 | assert(!arm_dc_feature(s, ARM_FEATURE_M)); | ||
346 | unallocated_encoding(s); | ||
347 | diff --git a/target/arm/translate.c b/target/arm/translate.c | ||
348 | index XXXXXXX..XXXXXXX 100644 | ||
349 | --- a/target/arm/translate.c | ||
350 | +++ b/target/arm/translate.c | ||
351 | @@ -XXX,XX +XXX,XX @@ static void arm_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs) | ||
352 | dc->vec_len = EX_TBFLAG_A32(tb_flags, VECLEN); | ||
353 | dc->vec_stride = EX_TBFLAG_A32(tb_flags, VECSTRIDE); | ||
354 | } | ||
355 | + dc->sme_trap_nonstreaming = | ||
356 | + EX_TBFLAG_A32(tb_flags, SME_TRAP_NONSTREAMING); | ||
357 | } | ||
358 | dc->cp_regs = cpu->cp_regs; | ||
359 | dc->features = env->features; | ||
360 | diff --git a/target/arm/meson.build b/target/arm/meson.build | ||
361 | index XXXXXXX..XXXXXXX 100644 | ||
362 | --- a/target/arm/meson.build | ||
363 | +++ b/target/arm/meson.build | ||
364 | @@ -XXX,XX +XXX,XX @@ | ||
365 | gen = [ | ||
366 | decodetree.process('sve.decode', extra_args: '--decode=disas_sve'), | ||
367 | decodetree.process('sme.decode', extra_args: '--decode=disas_sme'), | ||
368 | + decodetree.process('sme-fa64.decode', extra_args: '--static-decode=disas_sme_fa64'), | ||
369 | decodetree.process('neon-shared.decode', extra_args: '--decode=disas_neon_shared'), | ||
370 | decodetree.process('neon-dp.decode', extra_args: '--decode=disas_neon_dp'), | ||
371 | decodetree.process('neon-ls.decode', extra_args: '--decode=disas_neon_ls'), | ||
372 | -- | 77 | -- |
373 | 2.25.1 | 78 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | FEAT_LSE2 only requires that atomic operations not cross a | ||
4 | 16-byte boundary. Ordered operations may be completely | ||
5 | unaligned if SCTLR.nAA is set. | ||
6 | |||
7 | Because this alignment check is so special, do it by hand. | ||
8 | Make sure not to keep TCG temps live across the branch. | ||
9 | |||
10 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20230530191438.411344-17-richard.henderson@linaro.org | ||
3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20220708151540.18136-19-richard.henderson@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 14 | --- |
8 | target/arm/helper-sme.h | 2 ++ | 15 | target/arm/tcg/helper-a64.h | 3 + |
9 | target/arm/sme.decode | 4 ++++ | 16 | target/arm/tcg/helper-a64.c | 7 ++ |
10 | target/arm/sme_helper.c | 25 +++++++++++++++++++++++++ | 17 | target/arm/tcg/translate-a64.c | 120 ++++++++++++++++++++++++++------- |
11 | target/arm/translate-sme.c | 13 +++++++++++++ | 18 | 3 files changed, 104 insertions(+), 26 deletions(-) |
12 | 4 files changed, 44 insertions(+) | 19 | |
13 | 20 | diff --git a/target/arm/tcg/helper-a64.h b/target/arm/tcg/helper-a64.h | |
14 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | ||
15 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/helper-sme.h | 22 | --- a/target/arm/tcg/helper-a64.h |
17 | +++ b/target/arm/helper-sme.h | 23 | +++ b/target/arm/tcg/helper-a64.h |
18 | @@ -XXX,XX +XXX,XX @@ | 24 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_2(st2g_stub, TCG_CALL_NO_WG, void, env, i64) |
19 | 25 | DEF_HELPER_FLAGS_2(ldgm, TCG_CALL_NO_WG, i64, env, i64) | |
20 | DEF_HELPER_FLAGS_2(set_pstate_sm, TCG_CALL_NO_RWG, void, env, i32) | 26 | DEF_HELPER_FLAGS_3(stgm, TCG_CALL_NO_WG, void, env, i64, i64) |
21 | DEF_HELPER_FLAGS_2(set_pstate_za, TCG_CALL_NO_RWG, void, env, i32) | 27 | DEF_HELPER_FLAGS_3(stzgm_tags, TCG_CALL_NO_WG, void, env, i64, i64) |
22 | + | 28 | + |
23 | +DEF_HELPER_FLAGS_3(sme_zero, TCG_CALL_NO_RWG, void, env, i32, i32) | 29 | +DEF_HELPER_FLAGS_4(unaligned_access, TCG_CALL_NO_WG, |
24 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | 30 | + noreturn, env, i64, i32, i32) |
31 | diff --git a/target/arm/tcg/helper-a64.c b/target/arm/tcg/helper-a64.c | ||
25 | index XXXXXXX..XXXXXXX 100644 | 32 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/target/arm/sme.decode | 33 | --- a/target/arm/tcg/helper-a64.c |
27 | +++ b/target/arm/sme.decode | 34 | +++ b/target/arm/tcg/helper-a64.c |
28 | @@ -XXX,XX +XXX,XX @@ | 35 | @@ -XXX,XX +XXX,XX @@ void HELPER(dc_zva)(CPUARMState *env, uint64_t vaddr_in) |
29 | # | 36 | |
30 | # This file is processed by scripts/decodetree.py | 37 | memset(mem, 0, blocklen); |
31 | # | 38 | } |
32 | + | 39 | + |
33 | +### SME Misc | 40 | +void HELPER(unaligned_access)(CPUARMState *env, uint64_t addr, |
34 | + | 41 | + uint32_t access_type, uint32_t mmu_idx) |
35 | +ZERO 11000000 00 001 00000000000 imm:8 | 42 | +{ |
36 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | 43 | + arm_cpu_do_unaligned_access(env_cpu(env), addr, access_type, |
44 | + mmu_idx, GETPC()); | ||
45 | +} | ||
46 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c | ||
37 | index XXXXXXX..XXXXXXX 100644 | 47 | index XXXXXXX..XXXXXXX 100644 |
38 | --- a/target/arm/sme_helper.c | 48 | --- a/target/arm/tcg/translate-a64.c |
39 | +++ b/target/arm/sme_helper.c | 49 | +++ b/target/arm/tcg/translate-a64.c |
40 | @@ -XXX,XX +XXX,XX @@ void helper_set_pstate_za(CPUARMState *env, uint32_t i) | 50 | @@ -XXX,XX +XXX,XX @@ TCGv_i64 gen_mte_checkN(DisasContext *s, TCGv_i64 addr, bool is_write, |
41 | memset(env->zarray, 0, sizeof(env->zarray)); | 51 | return clean_data_tbi(s, addr); |
42 | } | ||
43 | } | 52 | } |
44 | + | 53 | |
45 | +void helper_sme_zero(CPUARMState *env, uint32_t imm, uint32_t svl) | 54 | +/* |
46 | +{ | 55 | + * Generate the special alignment check that applies to AccType_ATOMIC |
47 | + uint32_t i; | 56 | + * and AccType_ORDERED insns under FEAT_LSE2: the access need not be |
57 | + * naturally aligned, but it must not cross a 16-byte boundary. | ||
58 | + * See AArch64.CheckAlignment(). | ||
59 | + */ | ||
60 | +static void check_lse2_align(DisasContext *s, int rn, int imm, | ||
61 | + bool is_write, MemOp mop) | ||
62 | +{ | ||
63 | + TCGv_i32 tmp; | ||
64 | + TCGv_i64 addr; | ||
65 | + TCGLabel *over_label; | ||
66 | + MMUAccessType type; | ||
67 | + int mmu_idx; | ||
68 | + | ||
69 | + tmp = tcg_temp_new_i32(); | ||
70 | + tcg_gen_extrl_i64_i32(tmp, cpu_reg_sp(s, rn)); | ||
71 | + tcg_gen_addi_i32(tmp, tmp, imm & 15); | ||
72 | + tcg_gen_andi_i32(tmp, tmp, 15); | ||
73 | + tcg_gen_addi_i32(tmp, tmp, memop_size(mop)); | ||
74 | + | ||
75 | + over_label = gen_new_label(); | ||
76 | + tcg_gen_brcondi_i32(TCG_COND_LEU, tmp, 16, over_label); | ||
77 | + | ||
78 | + addr = tcg_temp_new_i64(); | ||
79 | + tcg_gen_addi_i64(addr, cpu_reg_sp(s, rn), imm); | ||
80 | + | ||
81 | + type = is_write ? MMU_DATA_STORE : MMU_DATA_LOAD, | ||
82 | + mmu_idx = get_mem_index(s); | ||
83 | + gen_helper_unaligned_access(cpu_env, addr, tcg_constant_i32(type), | ||
84 | + tcg_constant_i32(mmu_idx)); | ||
85 | + | ||
86 | + gen_set_label(over_label); | ||
87 | + | ||
88 | +} | ||
89 | + | ||
90 | +/* Handle the alignment check for AccType_ATOMIC instructions. */ | ||
91 | +static MemOp check_atomic_align(DisasContext *s, int rn, MemOp mop) | ||
92 | +{ | ||
93 | + MemOp size = mop & MO_SIZE; | ||
94 | + | ||
95 | + if (size == MO_8) { | ||
96 | + return mop; | ||
97 | + } | ||
48 | + | 98 | + |
49 | + /* | 99 | + /* |
50 | + * Special case clearing the entire ZA space. | 100 | + * If size == MO_128, this is a LDXP, and the operation is single-copy |
51 | + * This falls into the CONSTRAINED UNPREDICTABLE zeroing of any | 101 | + * atomic for each doubleword, not the entire quadword; it still must |
52 | + * parts of the ZA storage outside of SVL. | 102 | + * be quadword aligned. |
53 | + */ | 103 | + */ |
54 | + if (imm == 0xff) { | 104 | + if (size == MO_128) { |
55 | + memset(env->zarray, 0, sizeof(env->zarray)); | 105 | + return finalize_memop_atom(s, MO_128 | MO_ALIGN, |
56 | + return; | 106 | + MO_ATOM_IFALIGN_PAIR); |
57 | + } | 107 | + } |
58 | + | 108 | + if (dc_isar_feature(aa64_lse2, s)) { |
59 | + /* | 109 | + check_lse2_align(s, rn, 0, true, mop); |
60 | + * Recall that ZAnH.D[m] is spread across ZA[n+8*m], | 110 | + } else { |
61 | + * so each row is discontiguous within ZA[]. | 111 | + mop |= MO_ALIGN; |
62 | + */ | 112 | + } |
63 | + for (i = 0; i < svl; i++) { | 113 | + return finalize_memop(s, mop); |
64 | + if (imm & (1 << (i % 8))) { | 114 | +} |
65 | + memset(&env->zarray[i], 0, svl); | 115 | + |
66 | + } | 116 | +/* Handle the alignment check for AccType_ORDERED instructions. */ |
67 | + } | 117 | +static MemOp check_ordered_align(DisasContext *s, int rn, int imm, |
68 | +} | 118 | + bool is_write, MemOp mop) |
69 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 119 | +{ |
70 | index XXXXXXX..XXXXXXX 100644 | 120 | + MemOp size = mop & MO_SIZE; |
71 | --- a/target/arm/translate-sme.c | 121 | + |
72 | +++ b/target/arm/translate-sme.c | 122 | + if (size == MO_8) { |
73 | @@ -XXX,XX +XXX,XX @@ | 123 | + return mop; |
74 | */ | 124 | + } |
75 | 125 | + if (size == MO_128) { | |
76 | #include "decode-sme.c.inc" | 126 | + return finalize_memop_atom(s, MO_128 | MO_ALIGN, |
77 | + | 127 | + MO_ATOM_IFALIGN_PAIR); |
78 | + | 128 | + } |
79 | +static bool trans_ZERO(DisasContext *s, arg_ZERO *a) | 129 | + if (!dc_isar_feature(aa64_lse2, s)) { |
80 | +{ | 130 | + mop |= MO_ALIGN; |
81 | + if (!dc_isar_feature(aa64_sme, s)) { | 131 | + } else if (!s->naa) { |
82 | + return false; | 132 | + check_lse2_align(s, rn, imm, is_write, mop); |
83 | + } | 133 | + } |
84 | + if (sme_za_enabled_check(s)) { | 134 | + return finalize_memop(s, mop); |
85 | + gen_helper_sme_zero(cpu_env, tcg_constant_i32(a->imm), | 135 | +} |
86 | + tcg_constant_i32(streaming_vec_reg_size(s))); | 136 | + |
87 | + } | 137 | typedef struct DisasCompare64 { |
88 | + return true; | 138 | TCGCond cond; |
89 | +} | 139 | TCGv_i64 value; |
140 | @@ -XXX,XX +XXX,XX @@ static void gen_load_exclusive(DisasContext *s, int rt, int rt2, int rn, | ||
141 | { | ||
142 | int idx = get_mem_index(s); | ||
143 | TCGv_i64 dirty_addr, clean_addr; | ||
144 | - MemOp memop; | ||
145 | - | ||
146 | - /* | ||
147 | - * For pairs: | ||
148 | - * if size == 2, the operation is single-copy atomic for the doubleword. | ||
149 | - * if size == 3, the operation is single-copy atomic for *each* doubleword, | ||
150 | - * not the entire quadword, however it must be quadword aligned. | ||
151 | - */ | ||
152 | - memop = size + is_pair; | ||
153 | - if (memop == MO_128) { | ||
154 | - memop = finalize_memop_atom(s, MO_128 | MO_ALIGN, | ||
155 | - MO_ATOM_IFALIGN_PAIR); | ||
156 | - } else { | ||
157 | - memop = finalize_memop(s, memop | MO_ALIGN); | ||
158 | - } | ||
159 | + MemOp memop = check_atomic_align(s, rn, size + is_pair); | ||
160 | |||
161 | s->is_ldex = true; | ||
162 | dirty_addr = cpu_reg_sp(s, rn); | ||
163 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap(DisasContext *s, int rs, int rt, | ||
164 | if (rn == 31) { | ||
165 | gen_check_sp_alignment(s); | ||
166 | } | ||
167 | - memop = finalize_memop(s, size | MO_ALIGN); | ||
168 | + memop = check_atomic_align(s, rn, size); | ||
169 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, memop); | ||
170 | tcg_gen_atomic_cmpxchg_i64(tcg_rs, clean_addr, tcg_rs, tcg_rt, | ||
171 | memidx, memop); | ||
172 | @@ -XXX,XX +XXX,XX @@ static void gen_compare_and_swap_pair(DisasContext *s, int rs, int rt, | ||
173 | } | ||
174 | |||
175 | /* This is a single atomic access, despite the "pair". */ | ||
176 | - memop = finalize_memop(s, (size + 1) | MO_ALIGN); | ||
177 | + memop = check_atomic_align(s, rn, size + 1); | ||
178 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, memop); | ||
179 | |||
180 | if (size == 2) { | ||
181 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
182 | gen_check_sp_alignment(s); | ||
183 | } | ||
184 | tcg_gen_mb(TCG_MO_ALL | TCG_BAR_STRL); | ||
185 | - /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
186 | - memop = finalize_memop(s, size | MO_ALIGN); | ||
187 | + memop = check_ordered_align(s, rn, 0, true, size); | ||
188 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
189 | true, rn != 31, memop); | ||
190 | do_gpr_st(s, cpu_reg(s, rt), clean_addr, memop, true, rt, | ||
191 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_excl(DisasContext *s, uint32_t insn) | ||
192 | if (rn == 31) { | ||
193 | gen_check_sp_alignment(s); | ||
194 | } | ||
195 | - /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
196 | - memop = finalize_memop(s, size | MO_ALIGN); | ||
197 | + memop = check_ordered_align(s, rn, 0, false, size); | ||
198 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), | ||
199 | false, rn != 31, memop); | ||
200 | do_gpr_ld(s, cpu_reg(s, rt), clean_addr, memop, false, true, | ||
201 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_atomic(DisasContext *s, uint32_t insn, | ||
202 | bool a = extract32(insn, 23, 1); | ||
203 | TCGv_i64 tcg_rs, tcg_rt, clean_addr; | ||
204 | AtomicThreeOpFn *fn = NULL; | ||
205 | - MemOp mop = finalize_memop(s, size | MO_ALIGN); | ||
206 | + MemOp mop = size; | ||
207 | |||
208 | if (is_vector || !dc_isar_feature(aa64_atomics, s)) { | ||
209 | unallocated_encoding(s); | ||
210 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_atomic(DisasContext *s, uint32_t insn, | ||
211 | if (rn == 31) { | ||
212 | gen_check_sp_alignment(s); | ||
213 | } | ||
214 | + | ||
215 | + mop = check_atomic_align(s, rn, mop); | ||
216 | clean_addr = gen_mte_check1(s, cpu_reg_sp(s, rn), false, rn != 31, mop); | ||
217 | |||
218 | if (o3_opc == 014) { | ||
219 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_ldapr_stlr(DisasContext *s, uint32_t insn) | ||
220 | bool is_store = false; | ||
221 | bool extend = false; | ||
222 | bool iss_sf; | ||
223 | - MemOp mop; | ||
224 | + MemOp mop = size; | ||
225 | |||
226 | if (!dc_isar_feature(aa64_rcpc_8_4, s)) { | ||
227 | unallocated_encoding(s); | ||
228 | return; | ||
229 | } | ||
230 | |||
231 | - /* TODO: ARMv8.4-LSE SCTLR.nAA */ | ||
232 | - mop = finalize_memop(s, size | MO_ALIGN); | ||
233 | - | ||
234 | switch (opc) { | ||
235 | case 0: /* STLURB */ | ||
236 | is_store = true; | ||
237 | @@ -XXX,XX +XXX,XX @@ static void disas_ldst_ldapr_stlr(DisasContext *s, uint32_t insn) | ||
238 | gen_check_sp_alignment(s); | ||
239 | } | ||
240 | |||
241 | + mop = check_ordered_align(s, rn, offset, is_store, mop); | ||
242 | + | ||
243 | dirty_addr = read_cpu_reg_sp(s, rn, 1); | ||
244 | tcg_gen_addi_i64(dirty_addr, dirty_addr, offset); | ||
245 | clean_addr = clean_data_tbi(s, dirty_addr); | ||
90 | -- | 246 | -- |
91 | 2.25.1 | 247 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as non-streaming instructions, which should trap | 3 | Push the mte check behind the exclusive_addr check. |
4 | if full a64 support is not enabled in streaming mode. | 4 | Document the several ways that we are still out of spec |
5 | with this implementation. | ||
5 | 6 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-11-richard.henderson@linaro.org | 9 | Message-id: 20230530191438.411344-18-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | target/arm/sme-fa64.decode | 1 - | 12 | target/arm/tcg/translate-a64.c | 42 +++++++++++++++++++++++++++++----- |
12 | target/arm/translate-sve.c | 35 ++++++++++++++++++----------------- | 13 | 1 file changed, 36 insertions(+), 6 deletions(-) |
13 | 2 files changed, 18 insertions(+), 18 deletions(-) | ||
14 | 14 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 15 | diff --git a/target/arm/tcg/translate-a64.c b/target/arm/tcg/translate-a64.c |
16 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 17 | --- a/target/arm/tcg/translate-a64.c |
18 | +++ b/target/arm/sme-fa64.decode | 18 | +++ b/target/arm/tcg/translate-a64.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 19 | @@ -XXX,XX +XXX,XX @@ static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2, |
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 20 | */ |
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 21 | TCGLabel *fail_label = gen_new_label(); |
22 | 22 | TCGLabel *done_label = gen_new_label(); | |
23 | -FAIL 0100 0101 --1- ---- 1--- ---- ---- ---- # SVE2 string/histo/crypto instructions | 23 | - TCGv_i64 tmp, dirty_addr, clean_addr; |
24 | FAIL 1000 010- -00- ---- 10-- ---- ---- ---- # SVE2 32-bit gather NT load (vector+scalar) | 24 | + TCGv_i64 tmp, clean_addr; |
25 | FAIL 1000 010- -00- ---- 111- ---- ---- ---- # SVE 32-bit gather prefetch (vector+imm) | 25 | MemOp memop; |
26 | FAIL 1000 0100 0-1- ---- 0--- ---- ---- ---- # SVE 32-bit gather prefetch (scalar+vector) | 26 | |
27 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 27 | - memop = (size + is_pair) | MO_ALIGN; |
28 | index XXXXXXX..XXXXXXX 100644 | 28 | - memop = finalize_memop(s, memop); |
29 | --- a/target/arm/translate-sve.c | 29 | - |
30 | +++ b/target/arm/translate-sve.c | 30 | - dirty_addr = cpu_reg_sp(s, rn); |
31 | @@ -XXX,XX +XXX,XX @@ DO_SVE2_ZZZ_NARROW(RSUBHNT, rsubhnt) | 31 | - clean_addr = gen_mte_check1(s, dirty_addr, true, rn != 31, memop); |
32 | static gen_helper_gvec_flags_4 * const match_fns[4] = { | 32 | + /* |
33 | gen_helper_sve2_match_ppzz_b, gen_helper_sve2_match_ppzz_h, NULL, NULL | 33 | + * FIXME: We are out of spec here. We have recorded only the address |
34 | }; | 34 | + * from load_exclusive, not the entire range, and we assume that the |
35 | -TRANS_FEAT(MATCH, aa64_sve2, do_ppzz_flags, a, match_fns[a->esz]) | 35 | + * size of the access on both sides match. The architecture allows the |
36 | +TRANS_FEAT_NONSTREAMING(MATCH, aa64_sve2, do_ppzz_flags, a, match_fns[a->esz]) | 36 | + * store to be smaller than the load, so long as the stored bytes are |
37 | 37 | + * within the range recorded by the load. | |
38 | static gen_helper_gvec_flags_4 * const nmatch_fns[4] = { | 38 | + */ |
39 | gen_helper_sve2_nmatch_ppzz_b, gen_helper_sve2_nmatch_ppzz_h, NULL, NULL | 39 | |
40 | }; | 40 | + /* See AArch64.ExclusiveMonitorsPass() and AArch64.IsExclusiveVA(). */ |
41 | -TRANS_FEAT(NMATCH, aa64_sve2, do_ppzz_flags, a, nmatch_fns[a->esz]) | 41 | + clean_addr = clean_data_tbi(s, cpu_reg_sp(s, rn)); |
42 | +TRANS_FEAT_NONSTREAMING(NMATCH, aa64_sve2, do_ppzz_flags, a, nmatch_fns[a->esz]) | 42 | tcg_gen_brcond_i64(TCG_COND_NE, clean_addr, cpu_exclusive_addr, fail_label); |
43 | 43 | ||
44 | static gen_helper_gvec_4 * const histcnt_fns[4] = { | 44 | + /* |
45 | NULL, NULL, gen_helper_sve2_histcnt_s, gen_helper_sve2_histcnt_d | 45 | + * The write, and any associated faults, only happen if the virtual |
46 | }; | 46 | + * and physical addresses pass the exclusive monitor check. These |
47 | -TRANS_FEAT(HISTCNT, aa64_sve2, gen_gvec_ool_arg_zpzz, | 47 | + * faults are exceedingly unlikely, because normally the guest uses |
48 | - histcnt_fns[a->esz], a, 0) | 48 | + * the exact same address register for the load_exclusive, and we |
49 | +TRANS_FEAT_NONSTREAMING(HISTCNT, aa64_sve2, gen_gvec_ool_arg_zpzz, | 49 | + * would have recognized these faults there. |
50 | + histcnt_fns[a->esz], a, 0) | 50 | + * |
51 | 51 | + * It is possible to trigger an alignment fault pre-LSE2, e.g. with an | |
52 | -TRANS_FEAT(HISTSEG, aa64_sve2, gen_gvec_ool_arg_zzz, | 52 | + * unaligned 4-byte write within the range of an aligned 8-byte load. |
53 | - a->esz == 0 ? gen_helper_sve2_histseg : NULL, a, 0) | 53 | + * With LSE2, the store would need to cross a 16-byte boundary when the |
54 | +TRANS_FEAT_NONSTREAMING(HISTSEG, aa64_sve2, gen_gvec_ool_arg_zzz, | 54 | + * load did not, which would mean the store is outside the range |
55 | + a->esz == 0 ? gen_helper_sve2_histseg : NULL, a, 0) | 55 | + * recorded for the monitor, which would have failed a corrected monitor |
56 | 56 | + * check above. For now, we assume no size change and retain the | |
57 | DO_ZPZZ_FP(FADDP, aa64_sve2, sve2_faddp_zpzz) | 57 | + * MO_ALIGN to let tcg know what we checked in the load_exclusive. |
58 | DO_ZPZZ_FP(FMAXNMP, aa64_sve2, sve2_fmaxnmp_zpzz) | 58 | + * |
59 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(SQRDCMLAH_zzzz, aa64_sve2, gen_gvec_ool_zzzz, | 59 | + * It is possible to trigger an MTE fault, by performing the load with |
60 | TRANS_FEAT(USDOT_zzzz, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | 60 | + * a virtual address with a valid tag and performing the store with the |
61 | a->esz == 2 ? gen_helper_gvec_usdot_b : NULL, a, 0) | 61 | + * same virtual address and a different invalid tag. |
62 | 62 | + */ | |
63 | -TRANS_FEAT(AESMC, aa64_sve2_aes, gen_gvec_ool_zz, | 63 | + memop = size + is_pair; |
64 | - gen_helper_crypto_aesmc, a->rd, a->rd, a->decrypt) | 64 | + if (memop == MO_128 || !dc_isar_feature(aa64_lse2, s)) { |
65 | +TRANS_FEAT_NONSTREAMING(AESMC, aa64_sve2_aes, gen_gvec_ool_zz, | 65 | + memop |= MO_ALIGN; |
66 | + gen_helper_crypto_aesmc, a->rd, a->rd, a->decrypt) | 66 | + } |
67 | 67 | + memop = finalize_memop(s, memop); | |
68 | -TRANS_FEAT(AESE, aa64_sve2_aes, gen_gvec_ool_arg_zzz, | 68 | + gen_mte_check1(s, cpu_reg_sp(s, rn), true, rn != 31, memop); |
69 | - gen_helper_crypto_aese, a, false) | 69 | + |
70 | -TRANS_FEAT(AESD, aa64_sve2_aes, gen_gvec_ool_arg_zzz, | 70 | tmp = tcg_temp_new_i64(); |
71 | - gen_helper_crypto_aese, a, true) | 71 | if (is_pair) { |
72 | +TRANS_FEAT_NONSTREAMING(AESE, aa64_sve2_aes, gen_gvec_ool_arg_zzz, | 72 | if (size == 2) { |
73 | + gen_helper_crypto_aese, a, false) | ||
74 | +TRANS_FEAT_NONSTREAMING(AESD, aa64_sve2_aes, gen_gvec_ool_arg_zzz, | ||
75 | + gen_helper_crypto_aese, a, true) | ||
76 | |||
77 | -TRANS_FEAT(SM4E, aa64_sve2_sm4, gen_gvec_ool_arg_zzz, | ||
78 | - gen_helper_crypto_sm4e, a, 0) | ||
79 | -TRANS_FEAT(SM4EKEY, aa64_sve2_sm4, gen_gvec_ool_arg_zzz, | ||
80 | - gen_helper_crypto_sm4ekey, a, 0) | ||
81 | +TRANS_FEAT_NONSTREAMING(SM4E, aa64_sve2_sm4, gen_gvec_ool_arg_zzz, | ||
82 | + gen_helper_crypto_sm4e, a, 0) | ||
83 | +TRANS_FEAT_NONSTREAMING(SM4EKEY, aa64_sve2_sm4, gen_gvec_ool_arg_zzz, | ||
84 | + gen_helper_crypto_sm4ekey, a, 0) | ||
85 | |||
86 | -TRANS_FEAT(RAX1, aa64_sve2_sha3, gen_gvec_fn_arg_zzz, gen_gvec_rax1, a) | ||
87 | +TRANS_FEAT_NONSTREAMING(RAX1, aa64_sve2_sha3, gen_gvec_fn_arg_zzz, | ||
88 | + gen_gvec_rax1, a) | ||
89 | |||
90 | TRANS_FEAT(FCVTNT_sh, aa64_sve2, gen_gvec_fpst_arg_zpz, | ||
91 | gen_helper_sve2_fcvtnt_sh, a, 0, FPST_FPCR) | ||
92 | -- | 73 | -- |
93 | 2.25.1 | 74 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | We have many other instances of stg in the testsuite; |
4 | if full a64 support is not enabled in streaming mode. | 4 | change these to provide an instance of stz2g. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-10-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-19-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme-fa64.decode | 1 - | 11 | tests/tcg/aarch64/mte-7.c | 3 +-- |
12 | target/arm/translate-sve.c | 12 ++++++------ | 12 | 1 file changed, 1 insertion(+), 2 deletions(-) |
13 | 2 files changed, 6 insertions(+), 7 deletions(-) | ||
14 | 13 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 14 | diff --git a/tests/tcg/aarch64/mte-7.c b/tests/tcg/aarch64/mte-7.c |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 16 | --- a/tests/tcg/aarch64/mte-7.c |
18 | +++ b/target/arm/sme-fa64.decode | 17 | +++ b/tests/tcg/aarch64/mte-7.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 18 | @@ -XXX,XX +XXX,XX @@ int main(int ac, char **av) |
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 19 | p = (void *)((unsigned long)p | (1ul << 56)); |
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 20 | |
22 | 21 | /* Store tag in sequential granules. */ | |
23 | -FAIL 0100 0101 --0- ---- 1001 10-- ---- ---- # SMMLA, UMMLA, USMMLA | 22 | - asm("stg %0, [%0]" : : "r"(p + 0x0ff0)); |
24 | FAIL 0100 0101 --1- ---- 1--- ---- ---- ---- # SVE2 string/histo/crypto instructions | 23 | - asm("stg %0, [%0]" : : "r"(p + 0x1000)); |
25 | FAIL 1000 010- -00- ---- 10-- ---- ---- ---- # SVE2 32-bit gather NT load (vector+scalar) | 24 | + asm("stz2g %0, [%0]" : : "r"(p + 0x0ff0)); |
26 | FAIL 1000 010- -00- ---- 111- ---- ---- ---- # SVE 32-bit gather prefetch (vector+imm) | 25 | |
27 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 26 | /* |
28 | index XXXXXXX..XXXXXXX 100644 | 27 | * Perform an unaligned store with tag 1 crossing the pages. |
29 | --- a/target/arm/translate-sve.c | ||
30 | +++ b/target/arm/translate-sve.c | ||
31 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(FMLALT_zzxw, aa64_sve2, do_FMLAL_zzxw, a, false, true) | ||
32 | TRANS_FEAT(FMLSLB_zzxw, aa64_sve2, do_FMLAL_zzxw, a, true, false) | ||
33 | TRANS_FEAT(FMLSLT_zzxw, aa64_sve2, do_FMLAL_zzxw, a, true, true) | ||
34 | |||
35 | -TRANS_FEAT(SMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
36 | - gen_helper_gvec_smmla_b, a, 0) | ||
37 | -TRANS_FEAT(USMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
38 | - gen_helper_gvec_usmmla_b, a, 0) | ||
39 | -TRANS_FEAT(UMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
40 | - gen_helper_gvec_ummla_b, a, 0) | ||
41 | +TRANS_FEAT_NONSTREAMING(SMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
42 | + gen_helper_gvec_smmla_b, a, 0) | ||
43 | +TRANS_FEAT_NONSTREAMING(USMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
44 | + gen_helper_gvec_usmmla_b, a, 0) | ||
45 | +TRANS_FEAT_NONSTREAMING(UMMLA, aa64_sve_i8mm, gen_gvec_ool_arg_zzzz, | ||
46 | + gen_helper_gvec_ummla_b, a, 0) | ||
47 | |||
48 | TRANS_FEAT(BFDOT_zzzz, aa64_sve_bf16, gen_gvec_ool_arg_zzzz, | ||
49 | gen_helper_gvec_bfdot, a, 0) | ||
50 | -- | 28 | -- |
51 | 2.25.1 | 29 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Mark these as a non-streaming instructions, which should trap | 3 | With -cpu max and FEAT_LSE2, the __aarch64__ section will only raise |
4 | if full a64 support is not enabled in streaming mode. | 4 | an alignment exception when the load crosses a 16-byte boundary. |
5 | 5 | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-9-richard.henderson@linaro.org | 8 | Message-id: 20230530191438.411344-20-richard.henderson@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 10 | --- |
11 | target/arm/sme-fa64.decode | 3 --- | 11 | tests/tcg/multiarch/sigbus.c | 13 +++++++++---- |
12 | target/arm/translate-sve.c | 15 +++++++++++---- | 12 | 1 file changed, 9 insertions(+), 4 deletions(-) |
13 | 2 files changed, 11 insertions(+), 7 deletions(-) | ||
14 | 13 | ||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | 14 | diff --git a/tests/tcg/multiarch/sigbus.c b/tests/tcg/multiarch/sigbus.c |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/sme-fa64.decode | 16 | --- a/tests/tcg/multiarch/sigbus.c |
18 | +++ b/target/arm/sme-fa64.decode | 17 | +++ b/tests/tcg/multiarch/sigbus.c |
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | 18 | @@ -XXX,XX +XXX,XX @@ |
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | 19 | #include <endian.h> |
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | 20 | |
22 | 21 | ||
23 | -FAIL 0110 0101 --0- ---- 0000 11-- ---- ---- # FTSMUL | 22 | -unsigned long long x = 0x8877665544332211ull; |
24 | -FAIL 0110 0101 --01 0--- 100- ---- ---- ---- # FTMAD | 23 | -void * volatile p = (void *)&x + 1; |
25 | -FAIL 0110 0101 --01 1--- 001- ---- ---- ---- # FADDA | 24 | +char x[32] __attribute__((aligned(16))) = { |
26 | FAIL 0100 0101 --0- ---- 1001 10-- ---- ---- # SMMLA, UMMLA, USMMLA | 25 | + 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, |
27 | FAIL 0100 0101 --1- ---- 1--- ---- ---- ---- # SVE2 string/histo/crypto instructions | 26 | + 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, 0x10, |
28 | FAIL 1000 010- -00- ---- 10-- ---- ---- ---- # SVE2 32-bit gather NT load (vector+scalar) | 27 | + 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, 0x18, |
29 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | 28 | + 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f, 0x20, |
30 | index XXXXXXX..XXXXXXX 100644 | 29 | +}; |
31 | --- a/target/arm/translate-sve.c | 30 | +void * volatile p = (void *)&x + 15; |
32 | +++ b/target/arm/translate-sve.c | 31 | |
33 | @@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3_ptr * const ftmad_fns[4] = { | 32 | void sigbus(int sig, siginfo_t *info, void *uc) |
34 | NULL, gen_helper_sve_ftmad_h, | 33 | { |
35 | gen_helper_sve_ftmad_s, gen_helper_sve_ftmad_d, | 34 | @@ -XXX,XX +XXX,XX @@ int main() |
36 | }; | 35 | * We might as well validate the unaligned load worked. |
37 | -TRANS_FEAT(FTMAD, aa64_sve, gen_gvec_fpst_zzz, | 36 | */ |
38 | - ftmad_fns[a->esz], a->rd, a->rn, a->rm, a->imm, | 37 | if (BYTE_ORDER == LITTLE_ENDIAN) { |
39 | - a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR) | 38 | - assert(tmp == 0x55443322); |
40 | +TRANS_FEAT_NONSTREAMING(FTMAD, aa64_sve, gen_gvec_fpst_zzz, | 39 | + assert(tmp == 0x13121110); |
41 | + ftmad_fns[a->esz], a->rd, a->rn, a->rm, a->imm, | 40 | } else { |
42 | + a->esz == MO_16 ? FPST_FPCR_F16 : FPST_FPCR) | 41 | - assert(tmp == 0x77665544); |
43 | 42 | + assert(tmp == 0x10111213); | |
44 | /* | ||
45 | *** SVE Floating Point Accumulating Reduction Group | ||
46 | @@ -XXX,XX +XXX,XX @@ static bool trans_FADDA(DisasContext *s, arg_rprr_esz *a) | ||
47 | if (a->esz == 0 || !dc_isar_feature(aa64_sve, s)) { | ||
48 | return false; | ||
49 | } | 43 | } |
50 | + s->is_nonstreaming = true; | 44 | return EXIT_SUCCESS; |
51 | if (!sve_access_check(s)) { | 45 | } |
52 | return true; | ||
53 | } | ||
54 | @@ -XXX,XX +XXX,XX @@ static bool trans_FADDA(DisasContext *s, arg_rprr_esz *a) | ||
55 | DO_FP3(FADD_zzz, fadd) | ||
56 | DO_FP3(FSUB_zzz, fsub) | ||
57 | DO_FP3(FMUL_zzz, fmul) | ||
58 | -DO_FP3(FTSMUL, ftsmul) | ||
59 | DO_FP3(FRECPS, recps) | ||
60 | DO_FP3(FRSQRTS, rsqrts) | ||
61 | |||
62 | #undef DO_FP3 | ||
63 | |||
64 | +static gen_helper_gvec_3_ptr * const ftsmul_fns[4] = { | ||
65 | + NULL, gen_helper_gvec_ftsmul_h, | ||
66 | + gen_helper_gvec_ftsmul_s, gen_helper_gvec_ftsmul_d | ||
67 | +}; | ||
68 | +TRANS_FEAT_NONSTREAMING(FTSMUL, aa64_sve, gen_gvec_fpst_arg_zzz, | ||
69 | + ftsmul_fns[a->esz], a, 0) | ||
70 | + | ||
71 | /* | ||
72 | *** SVE Floating Point Arithmetic - Predicated Group | ||
73 | */ | ||
74 | -- | 46 | -- |
75 | 2.25.1 | 47 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | |||
3 | Note that SME remains effectively disabled for user-only, | ||
4 | because we do not yet set CPACR_EL1.SMEN. This needs to | ||
5 | wait until the kernel ABI is implemented. | ||
6 | 2 | ||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
9 | Message-id: 20220708151540.18136-33-richard.henderson@linaro.org | 5 | Message-id: 20230530191438.411344-21-richard.henderson@linaro.org |
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 7 | --- |
12 | docs/system/arm/emulation.rst | 4 ++++ | 8 | docs/system/arm/emulation.rst | 1 + |
13 | target/arm/cpu64.c | 11 +++++++++++ | 9 | target/arm/tcg/cpu64.c | 1 + |
14 | 2 files changed, 15 insertions(+) | 10 | 2 files changed, 2 insertions(+) |
15 | 11 | ||
16 | diff --git a/docs/system/arm/emulation.rst b/docs/system/arm/emulation.rst | 12 | diff --git a/docs/system/arm/emulation.rst b/docs/system/arm/emulation.rst |
17 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/docs/system/arm/emulation.rst | 14 | --- a/docs/system/arm/emulation.rst |
19 | +++ b/docs/system/arm/emulation.rst | 15 | +++ b/docs/system/arm/emulation.rst |
20 | @@ -XXX,XX +XXX,XX @@ the following architecture extensions: | 16 | @@ -XXX,XX +XXX,XX @@ the following architecture extensions: |
21 | - FEAT_SHA512 (Advanced SIMD SHA512 instructions) | 17 | - FEAT_LRCPC (Load-acquire RCpc instructions) |
22 | - FEAT_SM3 (Advanced SIMD SM3 instructions) | 18 | - FEAT_LRCPC2 (Load-acquire RCpc instructions v2) |
23 | - FEAT_SM4 (Advanced SIMD SM4 instructions) | 19 | - FEAT_LSE (Large System Extensions) |
24 | +- FEAT_SME (Scalable Matrix Extension) | 20 | +- FEAT_LSE2 (Large System Extensions v2) |
25 | +- FEAT_SME_FA64 (Full A64 instruction set in Streaming SVE mode) | 21 | - FEAT_LVA (Large Virtual Address space) |
26 | +- FEAT_SME_F64F64 (Double-precision floating-point outer product instructions) | 22 | - FEAT_MTE (Memory Tagging Extension) |
27 | +- FEAT_SME_I16I64 (16-bit to 64-bit integer widening outer product instructions) | 23 | - FEAT_MTE2 (Memory Tagging Extension) |
28 | - FEAT_SPECRES (Speculation restriction instructions) | 24 | diff --git a/target/arm/tcg/cpu64.c b/target/arm/tcg/cpu64.c |
29 | - FEAT_SSBS (Speculative Store Bypass Safe) | ||
30 | - FEAT_TLBIOS (TLB invalidate instructions in Outer Shareable domain) | ||
31 | diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c | ||
32 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
33 | --- a/target/arm/cpu64.c | 26 | --- a/target/arm/tcg/cpu64.c |
34 | +++ b/target/arm/cpu64.c | 27 | +++ b/target/arm/tcg/cpu64.c |
35 | @@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj) | 28 | @@ -XXX,XX +XXX,XX @@ void aarch64_max_tcg_initfn(Object *obj) |
36 | */ | 29 | t = FIELD_DP64(t, ID_AA64MMFR2, IESB, 1); /* FEAT_IESB */ |
37 | t = FIELD_DP64(t, ID_AA64PFR1, MTE, 3); /* FEAT_MTE3 */ | 30 | t = FIELD_DP64(t, ID_AA64MMFR2, VARANGE, 1); /* FEAT_LVA */ |
38 | t = FIELD_DP64(t, ID_AA64PFR1, RAS_FRAC, 0); /* FEAT_RASv1p1 + FEAT_DoubleFault */ | 31 | t = FIELD_DP64(t, ID_AA64MMFR2, ST, 1); /* FEAT_TTST */ |
39 | + t = FIELD_DP64(t, ID_AA64PFR1, SME, 1); /* FEAT_SME */ | 32 | + t = FIELD_DP64(t, ID_AA64MMFR2, AT, 1); /* FEAT_LSE2 */ |
40 | t = FIELD_DP64(t, ID_AA64PFR1, CSV2_FRAC, 0); /* FEAT_CSV2_2 */ | 33 | t = FIELD_DP64(t, ID_AA64MMFR2, IDS, 1); /* FEAT_IDST */ |
41 | cpu->isar.id_aa64pfr1 = t; | 34 | t = FIELD_DP64(t, ID_AA64MMFR2, FWB, 1); /* FEAT_S2FWB */ |
42 | 35 | t = FIELD_DP64(t, ID_AA64MMFR2, TTL, 1); /* FEAT_TTL */ | |
43 | @@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj) | ||
44 | t = FIELD_DP64(t, ID_AA64DFR0, PMUVER, 5); /* FEAT_PMUv3p4 */ | ||
45 | cpu->isar.id_aa64dfr0 = t; | ||
46 | |||
47 | + t = cpu->isar.id_aa64smfr0; | ||
48 | + t = FIELD_DP64(t, ID_AA64SMFR0, F32F32, 1); /* FEAT_SME */ | ||
49 | + t = FIELD_DP64(t, ID_AA64SMFR0, B16F32, 1); /* FEAT_SME */ | ||
50 | + t = FIELD_DP64(t, ID_AA64SMFR0, F16F32, 1); /* FEAT_SME */ | ||
51 | + t = FIELD_DP64(t, ID_AA64SMFR0, I8I32, 0xf); /* FEAT_SME */ | ||
52 | + t = FIELD_DP64(t, ID_AA64SMFR0, F64F64, 1); /* FEAT_SME_F64F64 */ | ||
53 | + t = FIELD_DP64(t, ID_AA64SMFR0, I16I64, 0xf); /* FEAT_SME_I16I64 */ | ||
54 | + t = FIELD_DP64(t, ID_AA64SMFR0, FA64, 1); /* FEAT_SME_FA64 */ | ||
55 | + cpu->isar.id_aa64smfr0 = t; | ||
56 | + | ||
57 | /* Replicate the same data to the 32-bit id registers. */ | ||
58 | aa32_max_features(cpu); | ||
59 | |||
60 | -- | 36 | -- |
61 | 2.25.1 | 37 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Zhuojia Shen <chaosdefinition@hotmail.com> |
---|---|---|---|
2 | 2 | ||
3 | We can handle both exception entry and exception return by | 3 | DC CVAP and DC CVADP instructions can be executed in EL0 on Linux, |
4 | hooking into aarch64_sve_change_el. | 4 | either directly when SCTLR_EL1.UCI == 1 or emulated by the kernel (see |
5 | user_cache_maint_handler() in arch/arm64/kernel/traps.c). | ||
5 | 6 | ||
7 | This patch enables execution of the two instructions in user mode | ||
8 | emulation. | ||
9 | |||
10 | Signed-off-by: Zhuojia Shen <chaosdefinition@hotmail.com> | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 12 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20220708151540.18136-32-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 14 | --- |
11 | target/arm/helper.c | 15 +++++++++++++-- | 15 | target/arm/helper.c | 6 ++---- |
12 | 1 file changed, 13 insertions(+), 2 deletions(-) | 16 | 1 file changed, 2 insertions(+), 4 deletions(-) |
13 | 17 | ||
14 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 18 | diff --git a/target/arm/helper.c b/target/arm/helper.c |
15 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/helper.c | 20 | --- a/target/arm/helper.c |
17 | +++ b/target/arm/helper.c | 21 | +++ b/target/arm/helper.c |
18 | @@ -XXX,XX +XXX,XX @@ void aarch64_sve_change_el(CPUARMState *env, int old_el, | 22 | @@ -XXX,XX +XXX,XX @@ static const ARMCPRegInfo rndr_reginfo[] = { |
19 | return; | 23 | .access = PL0_R, .readfn = rndr_readfn }, |
24 | }; | ||
25 | |||
26 | -#ifndef CONFIG_USER_ONLY | ||
27 | static void dccvap_writefn(CPUARMState *env, const ARMCPRegInfo *opaque, | ||
28 | uint64_t value) | ||
29 | { | ||
30 | @@ -XXX,XX +XXX,XX @@ static void dccvap_writefn(CPUARMState *env, const ARMCPRegInfo *opaque, | ||
31 | /* This won't be crossing page boundaries */ | ||
32 | haddr = probe_read(env, vaddr, dline_size, mem_idx, GETPC()); | ||
33 | if (haddr) { | ||
34 | +#ifndef CONFIG_USER_ONLY | ||
35 | |||
36 | ram_addr_t offset; | ||
37 | MemoryRegion *mr; | ||
38 | @@ -XXX,XX +XXX,XX @@ static void dccvap_writefn(CPUARMState *env, const ARMCPRegInfo *opaque, | ||
39 | if (mr) { | ||
40 | memory_region_writeback(mr, offset, dline_size); | ||
41 | } | ||
42 | +#endif /*CONFIG_USER_ONLY*/ | ||
20 | } | 43 | } |
21 | 44 | } | |
22 | + old_a64 = old_el ? arm_el_is_aa64(env, old_el) : el0_a64; | 45 | |
23 | + new_a64 = new_el ? arm_el_is_aa64(env, new_el) : el0_a64; | 46 | @@ -XXX,XX +XXX,XX @@ static const ARMCPRegInfo dcpodp_reg[] = { |
24 | + | 47 | .fgt = FGT_DCCVADP, |
25 | + /* | 48 | .accessfn = aa64_cacheop_poc_access, .writefn = dccvap_writefn }, |
26 | + * Both AArch64.TakeException and AArch64.ExceptionReturn | 49 | }; |
27 | + * invoke ResetSVEState when taking an exception from, or | 50 | -#endif /*CONFIG_USER_ONLY*/ |
28 | + * returning to, AArch32 state when PSTATE.SM is enabled. | 51 | |
29 | + */ | 52 | static CPAccessResult access_aa64_tid5(CPUARMState *env, const ARMCPRegInfo *ri, |
30 | + if (old_a64 != new_a64 && FIELD_EX64(env->svcr, SVCR, SM)) { | 53 | bool isread) |
31 | + arm_reset_sve_state(env); | 54 | @@ -XXX,XX +XXX,XX @@ void register_cp_regs_for_features(ARMCPU *cpu) |
32 | + return; | 55 | if (cpu_isar_feature(aa64_tlbios, cpu)) { |
33 | + } | 56 | define_arm_cp_regs(cpu, tlbios_reginfo); |
34 | + | 57 | } |
58 | -#ifndef CONFIG_USER_ONLY | ||
59 | /* Data Cache clean instructions up to PoP */ | ||
60 | if (cpu_isar_feature(aa64_dcpop, cpu)) { | ||
61 | define_one_arm_cp_reg(cpu, dcpop_reg); | ||
62 | @@ -XXX,XX +XXX,XX @@ void register_cp_regs_for_features(ARMCPU *cpu) | ||
63 | define_one_arm_cp_reg(cpu, dcpodp_reg); | ||
64 | } | ||
65 | } | ||
66 | -#endif /*CONFIG_USER_ONLY*/ | ||
67 | |||
35 | /* | 68 | /* |
36 | * DDI0584A.d sec 3.2: "If SVE instructions are disabled or trapped | 69 | * If full MTE is enabled, add all of the system registers. |
37 | * at ELx, or not available because the EL is in AArch32 state, then | ||
38 | @@ -XXX,XX +XXX,XX @@ void aarch64_sve_change_el(CPUARMState *env, int old_el, | ||
39 | * we already have the correct register contents when encountering the | ||
40 | * vq0->vq0 transition between EL0->EL1. | ||
41 | */ | ||
42 | - old_a64 = old_el ? arm_el_is_aa64(env, old_el) : el0_a64; | ||
43 | old_len = (old_a64 && !sve_exception_el(env, old_el) | ||
44 | ? sve_vqm1_for_el(env, old_el) : 0); | ||
45 | - new_a64 = new_el ? arm_el_is_aa64(env, new_el) : el0_a64; | ||
46 | new_len = (new_a64 && !sve_exception_el(env, new_el) | ||
47 | ? sve_vqm1_for_el(env, new_el) : 0); | ||
48 | |||
49 | -- | 70 | -- |
50 | 2.25.1 | 71 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Zhuojia Shen <chaosdefinition@hotmail.com> |
---|---|---|---|
2 | 2 | ||
3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 3 | Test execution of DC CVAP and DC CVADP instructions under user mode |
4 | Message-id: 20220708151540.18136-25-richard.henderson@linaro.org | 4 | emulation. |
5 | |||
6 | Signed-off-by: Zhuojia Shen <chaosdefinition@hotmail.com> | ||
7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | --- | 10 | --- |
8 | target/arm/helper-sme.h | 5 +++ | 11 | tests/tcg/aarch64/dcpodp.c | 63 +++++++++++++++++++++++++++++++ |
9 | target/arm/sme.decode | 9 +++++ | 12 | tests/tcg/aarch64/dcpop.c | 63 +++++++++++++++++++++++++++++++ |
10 | target/arm/sme_helper.c | 69 ++++++++++++++++++++++++++++++++++++++ | 13 | tests/tcg/aarch64/Makefile.target | 11 ++++++ |
11 | target/arm/translate-sme.c | 32 ++++++++++++++++++ | 14 | 3 files changed, 137 insertions(+) |
12 | 4 files changed, 115 insertions(+) | 15 | create mode 100644 tests/tcg/aarch64/dcpodp.c |
16 | create mode 100644 tests/tcg/aarch64/dcpop.c | ||
13 | 17 | ||
14 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | 18 | diff --git a/tests/tcg/aarch64/dcpodp.c b/tests/tcg/aarch64/dcpodp.c |
15 | index XXXXXXX..XXXXXXX 100644 | 19 | new file mode 100644 |
16 | --- a/target/arm/helper-sme.h | 20 | index XXXXXXX..XXXXXXX |
17 | +++ b/target/arm/helper-sme.h | 21 | --- /dev/null |
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(sme_addha_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 22 | +++ b/tests/tcg/aarch64/dcpodp.c |
19 | DEF_HELPER_FLAGS_5(sme_addva_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 23 | @@ -XXX,XX +XXX,XX @@ |
20 | DEF_HELPER_FLAGS_5(sme_addha_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 24 | +/* |
21 | DEF_HELPER_FLAGS_5(sme_addva_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | 25 | + * Test execution of DC CVADP instruction. |
26 | + * | ||
27 | + * Copyright (c) 2023 Zhuojia Shen <chaosdefinition@hotmail.com> | ||
28 | + * SPDX-License-Identifier: GPL-2.0-or-later | ||
29 | + */ | ||
22 | + | 30 | + |
23 | +DEF_HELPER_FLAGS_7(sme_fmopa_s, TCG_CALL_NO_RWG, | 31 | +#include <asm/hwcap.h> |
24 | + void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | 32 | +#include <sys/auxv.h> |
25 | +DEF_HELPER_FLAGS_7(sme_fmopa_d, TCG_CALL_NO_RWG, | ||
26 | + void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | ||
27 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/sme.decode | ||
30 | +++ b/target/arm/sme.decode | ||
31 | @@ -XXX,XX +XXX,XX @@ ADDHA_s 11000000 10 01000 0 ... ... ..... 000 .. @adda_32 | ||
32 | ADDVA_s 11000000 10 01000 1 ... ... ..... 000 .. @adda_32 | ||
33 | ADDHA_d 11000000 11 01000 0 ... ... ..... 00 ... @adda_64 | ||
34 | ADDVA_d 11000000 11 01000 1 ... ... ..... 00 ... @adda_64 | ||
35 | + | 33 | + |
36 | +### SME Outer Product | 34 | +#include <signal.h> |
35 | +#include <stdbool.h> | ||
36 | +#include <stdio.h> | ||
37 | +#include <stdlib.h> | ||
37 | + | 38 | + |
38 | +&op zad zn zm pm pn sub:bool | 39 | +#ifndef HWCAP2_DCPODP |
39 | +@op_32 ........ ... zm:5 pm:3 pn:3 zn:5 sub:1 .. zad:2 &op | 40 | +#define HWCAP2_DCPODP (1 << 0) |
40 | +@op_64 ........ ... zm:5 pm:3 pn:3 zn:5 sub:1 . zad:3 &op | 41 | +#endif |
41 | + | 42 | + |
42 | +FMOPA_s 10000000 100 ..... ... ... ..... . 00 .. @op_32 | 43 | +bool should_fail = false; |
43 | +FMOPA_d 10000000 110 ..... ... ... ..... . 0 ... @op_64 | ||
44 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | ||
45 | index XXXXXXX..XXXXXXX 100644 | ||
46 | --- a/target/arm/sme_helper.c | ||
47 | +++ b/target/arm/sme_helper.c | ||
48 | @@ -XXX,XX +XXX,XX @@ | ||
49 | #include "exec/cpu_ldst.h" | ||
50 | #include "exec/exec-all.h" | ||
51 | #include "qemu/int128.h" | ||
52 | +#include "fpu/softfloat.h" | ||
53 | #include "vec_internal.h" | ||
54 | #include "sve_ldst_internal.h" | ||
55 | |||
56 | @@ -XXX,XX +XXX,XX @@ void HELPER(sme_addva_d)(void *vzda, void *vzn, void *vpn, | ||
57 | } | ||
58 | } | ||
59 | } | ||
60 | + | 44 | + |
61 | +void HELPER(sme_fmopa_s)(void *vza, void *vzn, void *vzm, void *vpn, | 45 | +static void signal_handler(int sig, siginfo_t *si, void *data) |
62 | + void *vpm, void *vst, uint32_t desc) | ||
63 | +{ | 46 | +{ |
64 | + intptr_t row, col, oprsz = simd_maxsz(desc); | 47 | + ucontext_t *uc = (ucontext_t *)data; |
65 | + uint32_t neg = simd_data(desc) << 31; | ||
66 | + uint16_t *pn = vpn, *pm = vpm; | ||
67 | + float_status fpst; | ||
68 | + | 48 | + |
69 | + /* | 49 | + if (should_fail) { |
70 | + * Make a copy of float_status because this operation does not | 50 | + uc->uc_mcontext.pc += 4; |
71 | + * update the cumulative fp exception status. It also produces | 51 | + } else { |
72 | + * default nans. | 52 | + exit(EXIT_FAILURE); |
73 | + */ | ||
74 | + fpst = *(float_status *)vst; | ||
75 | + set_default_nan_mode(true, &fpst); | ||
76 | + | ||
77 | + for (row = 0; row < oprsz; ) { | ||
78 | + uint16_t pa = pn[H2(row >> 4)]; | ||
79 | + do { | ||
80 | + if (pa & 1) { | ||
81 | + void *vza_row = vza + tile_vslice_offset(row); | ||
82 | + uint32_t n = *(uint32_t *)(vzn + H1_4(row)) ^ neg; | ||
83 | + | ||
84 | + for (col = 0; col < oprsz; ) { | ||
85 | + uint16_t pb = pm[H2(col >> 4)]; | ||
86 | + do { | ||
87 | + if (pb & 1) { | ||
88 | + uint32_t *a = vza_row + H1_4(col); | ||
89 | + uint32_t *m = vzm + H1_4(col); | ||
90 | + *a = float32_muladd(n, *m, *a, 0, vst); | ||
91 | + } | ||
92 | + col += 4; | ||
93 | + pb >>= 4; | ||
94 | + } while (col & 15); | ||
95 | + } | ||
96 | + } | ||
97 | + row += 4; | ||
98 | + pa >>= 4; | ||
99 | + } while (row & 15); | ||
100 | + } | 53 | + } |
101 | +} | 54 | +} |
102 | + | 55 | + |
103 | +void HELPER(sme_fmopa_d)(void *vza, void *vzn, void *vzm, void *vpn, | 56 | +static int do_dc_cvadp(void) |
104 | + void *vpm, void *vst, uint32_t desc) | ||
105 | +{ | 57 | +{ |
106 | + intptr_t row, col, oprsz = simd_oprsz(desc) / 8; | 58 | + struct sigaction sa = { |
107 | + uint64_t neg = (uint64_t)simd_data(desc) << 63; | 59 | + .sa_flags = SA_SIGINFO, |
108 | + uint64_t *za = vza, *zn = vzn, *zm = vzm; | 60 | + .sa_sigaction = signal_handler, |
109 | + uint8_t *pn = vpn, *pm = vpm; | 61 | + }; |
110 | + float_status fpst = *(float_status *)vst; | ||
111 | + | 62 | + |
112 | + set_default_nan_mode(true, &fpst); | 63 | + sigemptyset(&sa.sa_mask); |
64 | + if (sigaction(SIGSEGV, &sa, NULL) < 0) { | ||
65 | + perror("sigaction"); | ||
66 | + return EXIT_FAILURE; | ||
67 | + } | ||
113 | + | 68 | + |
114 | + for (row = 0; row < oprsz; ++row) { | 69 | + asm volatile("dc cvadp, %0\n\t" :: "r"(&sa)); |
115 | + if (pn[H1(row)] & 1) { | ||
116 | + uint64_t *za_row = &za[tile_vslice_index(row)]; | ||
117 | + uint64_t n = zn[row] ^ neg; | ||
118 | + | 70 | + |
119 | + for (col = 0; col < oprsz; ++col) { | 71 | + should_fail = true; |
120 | + if (pm[H1(col)] & 1) { | 72 | + asm volatile("dc cvadp, %0\n\t" :: "r"(NULL)); |
121 | + uint64_t *a = &za_row[col]; | 73 | + should_fail = false; |
122 | + *a = float64_muladd(n, zm[col], *a, 0, &fpst); | 74 | + |
123 | + } | 75 | + return EXIT_SUCCESS; |
124 | + } | 76 | +} |
125 | + } | 77 | + |
78 | +int main(void) | ||
79 | +{ | ||
80 | + if (getauxval(AT_HWCAP2) & HWCAP2_DCPODP) { | ||
81 | + return do_dc_cvadp(); | ||
82 | + } else { | ||
83 | + printf("SKIP: no HWCAP2_DCPODP on this system\n"); | ||
84 | + return EXIT_SUCCESS; | ||
126 | + } | 85 | + } |
127 | +} | 86 | +} |
128 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | 87 | diff --git a/tests/tcg/aarch64/dcpop.c b/tests/tcg/aarch64/dcpop.c |
129 | index XXXXXXX..XXXXXXX 100644 | 88 | new file mode 100644 |
130 | --- a/target/arm/translate-sme.c | 89 | index XXXXXXX..XXXXXXX |
131 | +++ b/target/arm/translate-sme.c | 90 | --- /dev/null |
132 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(ADDHA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addha_s) | 91 | +++ b/tests/tcg/aarch64/dcpop.c |
133 | TRANS_FEAT(ADDVA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addva_s) | 92 | @@ -XXX,XX +XXX,XX @@ |
134 | TRANS_FEAT(ADDHA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addha_d) | 93 | +/* |
135 | TRANS_FEAT(ADDVA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addva_d) | 94 | + * Test execution of DC CVAP instruction. |
95 | + * | ||
96 | + * Copyright (c) 2023 Zhuojia Shen <chaosdefinition@hotmail.com> | ||
97 | + * SPDX-License-Identifier: GPL-2.0-or-later | ||
98 | + */ | ||
136 | + | 99 | + |
137 | +static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz, | 100 | +#include <asm/hwcap.h> |
138 | + gen_helper_gvec_5_ptr *fn) | 101 | +#include <sys/auxv.h> |
102 | + | ||
103 | +#include <signal.h> | ||
104 | +#include <stdbool.h> | ||
105 | +#include <stdio.h> | ||
106 | +#include <stdlib.h> | ||
107 | + | ||
108 | +#ifndef HWCAP_DCPOP | ||
109 | +#define HWCAP_DCPOP (1 << 16) | ||
110 | +#endif | ||
111 | + | ||
112 | +bool should_fail = false; | ||
113 | + | ||
114 | +static void signal_handler(int sig, siginfo_t *si, void *data) | ||
139 | +{ | 115 | +{ |
140 | + int svl = streaming_vec_reg_size(s); | 116 | + ucontext_t *uc = (ucontext_t *)data; |
141 | + uint32_t desc = simd_desc(svl, svl, a->sub); | ||
142 | + TCGv_ptr za, zn, zm, pn, pm, fpst; | ||
143 | + | 117 | + |
144 | + if (!sme_smza_enabled_check(s)) { | 118 | + if (should_fail) { |
145 | + return true; | 119 | + uc->uc_mcontext.pc += 4; |
120 | + } else { | ||
121 | + exit(EXIT_FAILURE); | ||
122 | + } | ||
123 | +} | ||
124 | + | ||
125 | +static int do_dc_cvap(void) | ||
126 | +{ | ||
127 | + struct sigaction sa = { | ||
128 | + .sa_flags = SA_SIGINFO, | ||
129 | + .sa_sigaction = signal_handler, | ||
130 | + }; | ||
131 | + | ||
132 | + sigemptyset(&sa.sa_mask); | ||
133 | + if (sigaction(SIGSEGV, &sa, NULL) < 0) { | ||
134 | + perror("sigaction"); | ||
135 | + return EXIT_FAILURE; | ||
146 | + } | 136 | + } |
147 | + | 137 | + |
148 | + /* Sum XZR+zad to find ZAd. */ | 138 | + asm volatile("dc cvap, %0\n\t" :: "r"(&sa)); |
149 | + za = get_tile_rowcol(s, esz, 31, a->zad, false); | ||
150 | + zn = vec_full_reg_ptr(s, a->zn); | ||
151 | + zm = vec_full_reg_ptr(s, a->zm); | ||
152 | + pn = pred_full_reg_ptr(s, a->pn); | ||
153 | + pm = pred_full_reg_ptr(s, a->pm); | ||
154 | + fpst = fpstatus_ptr(FPST_FPCR); | ||
155 | + | 139 | + |
156 | + fn(za, zn, zm, pn, pm, fpst, tcg_constant_i32(desc)); | 140 | + should_fail = true; |
141 | + asm volatile("dc cvap, %0\n\t" :: "r"(NULL)); | ||
142 | + should_fail = false; | ||
157 | + | 143 | + |
158 | + tcg_temp_free_ptr(za); | 144 | + return EXIT_SUCCESS; |
159 | + tcg_temp_free_ptr(zn); | ||
160 | + tcg_temp_free_ptr(pn); | ||
161 | + tcg_temp_free_ptr(pm); | ||
162 | + tcg_temp_free_ptr(fpst); | ||
163 | + return true; | ||
164 | +} | 145 | +} |
165 | + | 146 | + |
166 | +TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_s) | 147 | +int main(void) |
167 | +TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_fmopa_d) | 148 | +{ |
149 | + if (getauxval(AT_HWCAP) & HWCAP_DCPOP) { | ||
150 | + return do_dc_cvap(); | ||
151 | + } else { | ||
152 | + printf("SKIP: no HWCAP_DCPOP on this system\n"); | ||
153 | + return EXIT_SUCCESS; | ||
154 | + } | ||
155 | +} | ||
156 | diff --git a/tests/tcg/aarch64/Makefile.target b/tests/tcg/aarch64/Makefile.target | ||
157 | index XXXXXXX..XXXXXXX 100644 | ||
158 | --- a/tests/tcg/aarch64/Makefile.target | ||
159 | +++ b/tests/tcg/aarch64/Makefile.target | ||
160 | @@ -XXX,XX +XXX,XX @@ config-cc.mak: Makefile | ||
161 | $(quiet-@)( \ | ||
162 | $(call cc-option,-march=armv8.1-a+sve, CROSS_CC_HAS_SVE); \ | ||
163 | $(call cc-option,-march=armv8.1-a+sve2, CROSS_CC_HAS_SVE2); \ | ||
164 | + $(call cc-option,-march=armv8.2-a, CROSS_CC_HAS_ARMV8_2); \ | ||
165 | $(call cc-option,-march=armv8.3-a, CROSS_CC_HAS_ARMV8_3); \ | ||
166 | + $(call cc-option,-march=armv8.5-a, CROSS_CC_HAS_ARMV8_5); \ | ||
167 | $(call cc-option,-mbranch-protection=standard, CROSS_CC_HAS_ARMV8_BTI); \ | ||
168 | $(call cc-option,-march=armv8.5-a+memtag, CROSS_CC_HAS_ARMV8_MTE); \ | ||
169 | $(call cc-option,-march=armv9-a+sme, CROSS_CC_HAS_ARMV9_SME)) 3> config-cc.mak | ||
170 | -include config-cc.mak | ||
171 | |||
172 | +ifneq ($(CROSS_CC_HAS_ARMV8_2),) | ||
173 | +AARCH64_TESTS += dcpop | ||
174 | +dcpop: CFLAGS += -march=armv8.2-a | ||
175 | +endif | ||
176 | +ifneq ($(CROSS_CC_HAS_ARMV8_5),) | ||
177 | +AARCH64_TESTS += dcpodp | ||
178 | +dcpodp: CFLAGS += -march=armv8.5-a | ||
179 | +endif | ||
180 | + | ||
181 | # Pauth Tests | ||
182 | ifneq ($(CROSS_CC_HAS_ARMV8_3),) | ||
183 | AARCH64_TESTS += pauth-1 pauth-2 pauth-4 pauth-5 | ||
168 | -- | 184 | -- |
169 | 2.25.1 | 185 | 2.34.1 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Zhuojia Shen <chaosdefinition@hotmail.com> |
---|---|---|---|
2 | 2 | ||
3 | Dump SVCR, plus use the correct access check for Streaming Mode. | 3 | Accessing EL0-accessible Debug Communication Channel (DCC) registers in |
4 | user mode emulation is currently enabled. However, it does not match | ||
5 | Linux behavior as Linux sets MDSCR_EL1.TDCC on startup to disable EL0 | ||
6 | access to DCC (see __cpu_setup() in arch/arm64/mm/proc.S). | ||
4 | 7 | ||
5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 8 | This patch fixes access_tdcc() to check MDSCR_EL1.TDCC for EL0 and sets |
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 9 | MDSCR_EL1.TDCC for user mode emulation to match Linux. |
7 | Message-id: 20220708151540.18136-2-richard.henderson@linaro.org | 10 | |
11 | Signed-off-by: Zhuojia Shen <chaosdefinition@hotmail.com> | ||
12 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
13 | Message-id: DS7PR12MB630905198DD8E69F6817544CAC4EA@DS7PR12MB6309.namprd12.prod.outlook.com | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 15 | --- |
10 | target/arm/cpu.c | 17 ++++++++++++++++- | 16 | target/arm/cpu.c | 2 ++ |
11 | 1 file changed, 16 insertions(+), 1 deletion(-) | 17 | target/arm/debug_helper.c | 5 +++++ |
18 | 2 files changed, 7 insertions(+) | ||
12 | 19 | ||
13 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | 20 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c |
14 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/cpu.c | 22 | --- a/target/arm/cpu.c |
16 | +++ b/target/arm/cpu.c | 23 | +++ b/target/arm/cpu.c |
17 | @@ -XXX,XX +XXX,XX @@ static void aarch64_cpu_dump_state(CPUState *cs, FILE *f, int flags) | 24 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset_hold(Object *obj) |
18 | int i; | 25 | * This is not yet exposed from the Linux kernel in any way. |
26 | */ | ||
27 | env->cp15.sctlr_el[1] |= SCTLR_TSCXT; | ||
28 | + /* Disable access to Debug Communication Channel (DCC). */ | ||
29 | + env->cp15.mdscr_el1 |= 1 << 12; | ||
30 | #else | ||
31 | /* Reset into the highest available EL */ | ||
32 | if (arm_feature(env, ARM_FEATURE_EL3)) { | ||
33 | diff --git a/target/arm/debug_helper.c b/target/arm/debug_helper.c | ||
34 | index XXXXXXX..XXXXXXX 100644 | ||
35 | --- a/target/arm/debug_helper.c | ||
36 | +++ b/target/arm/debug_helper.c | ||
37 | @@ -XXX,XX +XXX,XX @@ static CPAccessResult access_tda(CPUARMState *env, const ARMCPRegInfo *ri, | ||
38 | * is implemented then these are controlled by MDCR_EL2.TDCC for | ||
39 | * EL2 and MDCR_EL3.TDCC for EL3. They are also controlled by | ||
40 | * the general debug access trap bits MDCR_EL2.TDA and MDCR_EL3.TDA. | ||
41 | + * For EL0, they are also controlled by MDSCR_EL1.TDCC. | ||
42 | */ | ||
43 | static CPAccessResult access_tdcc(CPUARMState *env, const ARMCPRegInfo *ri, | ||
44 | bool isread) | ||
45 | { | ||
19 | int el = arm_current_el(env); | 46 | int el = arm_current_el(env); |
20 | const char *ns_status; | 47 | uint64_t mdcr_el2 = arm_mdcr_el2_eff(env); |
21 | + bool sve; | 48 | + bool mdscr_el1_tdcc = extract32(env->cp15.mdscr_el1, 12, 1); |
22 | 49 | bool mdcr_el2_tda = (mdcr_el2 & MDCR_TDA) || (mdcr_el2 & MDCR_TDE) || | |
23 | qemu_fprintf(f, " PC=%016" PRIx64 " ", env->pc); | 50 | (arm_hcr_el2_eff(env) & HCR_TGE); |
24 | for (i = 0; i < 32; i++) { | 51 | bool mdcr_el2_tdcc = cpu_isar_feature(aa64_fgt, env_archcpu(env)) && |
25 | @@ -XXX,XX +XXX,XX @@ static void aarch64_cpu_dump_state(CPUState *cs, FILE *f, int flags) | 52 | @@ -XXX,XX +XXX,XX @@ static CPAccessResult access_tdcc(CPUARMState *env, const ARMCPRegInfo *ri, |
26 | el, | 53 | bool mdcr_el3_tdcc = cpu_isar_feature(aa64_fgt, env_archcpu(env)) && |
27 | psr & PSTATE_SP ? 'h' : 't'); | 54 | (env->cp15.mdcr_el3 & MDCR_TDCC); |
28 | 55 | ||
29 | + if (cpu_isar_feature(aa64_sme, cpu)) { | 56 | + if (el < 1 && mdscr_el1_tdcc) { |
30 | + qemu_fprintf(f, " SVCR=%08" PRIx64 " %c%c", | 57 | + return CP_ACCESS_TRAP; |
31 | + env->svcr, | ||
32 | + (FIELD_EX64(env->svcr, SVCR, ZA) ? 'Z' : '-'), | ||
33 | + (FIELD_EX64(env->svcr, SVCR, SM) ? 'S' : '-')); | ||
34 | + } | 58 | + } |
35 | if (cpu_isar_feature(aa64_bti, cpu)) { | 59 | if (el < 2 && (mdcr_el2_tda || mdcr_el2_tdcc)) { |
36 | qemu_fprintf(f, " BTYPE=%d", (psr & PSTATE_BTYPE) >> 10); | 60 | return CP_ACCESS_TRAP_EL2; |
37 | } | 61 | } |
38 | @@ -XXX,XX +XXX,XX @@ static void aarch64_cpu_dump_state(CPUState *cs, FILE *f, int flags) | ||
39 | qemu_fprintf(f, " FPCR=%08x FPSR=%08x\n", | ||
40 | vfp_get_fpcr(env), vfp_get_fpsr(env)); | ||
41 | |||
42 | - if (cpu_isar_feature(aa64_sve, cpu) && sve_exception_el(env, el) == 0) { | ||
43 | + if (cpu_isar_feature(aa64_sme, cpu) && FIELD_EX64(env->svcr, SVCR, SM)) { | ||
44 | + sve = sme_exception_el(env, el) == 0; | ||
45 | + } else if (cpu_isar_feature(aa64_sve, cpu)) { | ||
46 | + sve = sve_exception_el(env, el) == 0; | ||
47 | + } else { | ||
48 | + sve = false; | ||
49 | + } | ||
50 | + | ||
51 | + if (sve) { | ||
52 | int j, zcr_len = sve_vqm1_for_el(env, el); | ||
53 | |||
54 | for (i = 0; i <= FFR_PRED_NUM; i++) { | ||
55 | -- | 62 | -- |
56 | 2.25.1 | 63 | 2.34.1 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Richard Henderson <richard.henderson@linaro.org> | ||
2 | 1 | ||
3 | Mark these as a non-streaming instructions, which should trap | ||
4 | if full a64 support is not enabled in streaming mode. | ||
5 | |||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20220708151540.18136-7-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/sme-fa64.decode | 3 --- | ||
12 | target/arm/translate-sve.c | 22 ++++++++++++---------- | ||
13 | 2 files changed, 12 insertions(+), 13 deletions(-) | ||
14 | |||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/target/arm/sme-fa64.decode | ||
18 | +++ b/target/arm/sme-fa64.decode | ||
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | ||
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | ||
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | ||
22 | |||
23 | -FAIL 0000 0100 --1- ---- 1011 -0-- ---- ---- # FTSSEL, FEXPA | ||
24 | -FAIL 0000 0101 --10 0001 100- ---- ---- ---- # COMPACT | ||
25 | -FAIL 0100 0101 --0- ---- 1011 ---- ---- ---- # BDEP, BEXT, BGRP | ||
26 | FAIL 0100 0101 000- ---- 0110 1--- ---- ---- # PMULLB, PMULLT (128b result) | ||
27 | FAIL 0110 0100 --1- ---- 1110 01-- ---- ---- # FMMLA, BFMMLA | ||
28 | FAIL 0110 0101 --0- ---- 0000 11-- ---- ---- # FTSMUL | ||
29 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/translate-sve.c | ||
32 | +++ b/target/arm/translate-sve.c | ||
33 | @@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_2 * const fexpa_fns[4] = { | ||
34 | NULL, gen_helper_sve_fexpa_h, | ||
35 | gen_helper_sve_fexpa_s, gen_helper_sve_fexpa_d, | ||
36 | }; | ||
37 | -TRANS_FEAT(FEXPA, aa64_sve, gen_gvec_ool_zz, | ||
38 | - fexpa_fns[a->esz], a->rd, a->rn, 0) | ||
39 | +TRANS_FEAT_NONSTREAMING(FEXPA, aa64_sve, gen_gvec_ool_zz, | ||
40 | + fexpa_fns[a->esz], a->rd, a->rn, 0) | ||
41 | |||
42 | static gen_helper_gvec_3 * const ftssel_fns[4] = { | ||
43 | NULL, gen_helper_sve_ftssel_h, | ||
44 | gen_helper_sve_ftssel_s, gen_helper_sve_ftssel_d, | ||
45 | }; | ||
46 | -TRANS_FEAT(FTSSEL, aa64_sve, gen_gvec_ool_arg_zzz, ftssel_fns[a->esz], a, 0) | ||
47 | +TRANS_FEAT_NONSTREAMING(FTSSEL, aa64_sve, gen_gvec_ool_arg_zzz, | ||
48 | + ftssel_fns[a->esz], a, 0) | ||
49 | |||
50 | /* | ||
51 | *** SVE Predicate Logical Operations Group | ||
52 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(TRN2_q, aa64_sve_f64mm, gen_gvec_ool_arg_zzz, | ||
53 | static gen_helper_gvec_3 * const compact_fns[4] = { | ||
54 | NULL, NULL, gen_helper_sve_compact_s, gen_helper_sve_compact_d | ||
55 | }; | ||
56 | -TRANS_FEAT(COMPACT, aa64_sve, gen_gvec_ool_arg_zpz, compact_fns[a->esz], a, 0) | ||
57 | +TRANS_FEAT_NONSTREAMING(COMPACT, aa64_sve, gen_gvec_ool_arg_zpz, | ||
58 | + compact_fns[a->esz], a, 0) | ||
59 | |||
60 | /* Call the helper that computes the ARM LastActiveElement pseudocode | ||
61 | * function, scaled by the element size. This includes the not found | ||
62 | @@ -XXX,XX +XXX,XX @@ static gen_helper_gvec_3 * const bext_fns[4] = { | ||
63 | gen_helper_sve2_bext_b, gen_helper_sve2_bext_h, | ||
64 | gen_helper_sve2_bext_s, gen_helper_sve2_bext_d, | ||
65 | }; | ||
66 | -TRANS_FEAT(BEXT, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
67 | - bext_fns[a->esz], a, 0) | ||
68 | +TRANS_FEAT_NONSTREAMING(BEXT, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
69 | + bext_fns[a->esz], a, 0) | ||
70 | |||
71 | static gen_helper_gvec_3 * const bdep_fns[4] = { | ||
72 | gen_helper_sve2_bdep_b, gen_helper_sve2_bdep_h, | ||
73 | gen_helper_sve2_bdep_s, gen_helper_sve2_bdep_d, | ||
74 | }; | ||
75 | -TRANS_FEAT(BDEP, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
76 | - bdep_fns[a->esz], a, 0) | ||
77 | +TRANS_FEAT_NONSTREAMING(BDEP, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
78 | + bdep_fns[a->esz], a, 0) | ||
79 | |||
80 | static gen_helper_gvec_3 * const bgrp_fns[4] = { | ||
81 | gen_helper_sve2_bgrp_b, gen_helper_sve2_bgrp_h, | ||
82 | gen_helper_sve2_bgrp_s, gen_helper_sve2_bgrp_d, | ||
83 | }; | ||
84 | -TRANS_FEAT(BGRP, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
85 | - bgrp_fns[a->esz], a, 0) | ||
86 | +TRANS_FEAT_NONSTREAMING(BGRP, aa64_sve2_bitperm, gen_gvec_ool_arg_zzz, | ||
87 | + bgrp_fns[a->esz], a, 0) | ||
88 | |||
89 | static gen_helper_gvec_3 * const cadd_fns[4] = { | ||
90 | gen_helper_sve2_cadd_b, gen_helper_sve2_cadd_h, | ||
91 | -- | ||
92 | 2.25.1 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Richard Henderson <richard.henderson@linaro.org> | ||
2 | 1 | ||
3 | Mark these as a non-streaming instructions, which should trap | ||
4 | if full a64 support is not enabled in streaming mode. | ||
5 | |||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20220708151540.18136-8-richard.henderson@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/sme-fa64.decode | 2 -- | ||
12 | target/arm/translate-sve.c | 24 +++++++++++++++--------- | ||
13 | 2 files changed, 15 insertions(+), 11 deletions(-) | ||
14 | |||
15 | diff --git a/target/arm/sme-fa64.decode b/target/arm/sme-fa64.decode | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/target/arm/sme-fa64.decode | ||
18 | +++ b/target/arm/sme-fa64.decode | ||
19 | @@ -XXX,XX +XXX,XX @@ FAIL 0001 1110 0111 1110 0000 00-- ---- ---- # FJCVTZS | ||
20 | # --11 1100 --1- ---- ---- ---- ---- --10 # Load/store FP register (register offset) | ||
21 | # --11 1101 ---- ---- ---- ---- ---- ---- # Load/store FP register (scaled imm) | ||
22 | |||
23 | -FAIL 0100 0101 000- ---- 0110 1--- ---- ---- # PMULLB, PMULLT (128b result) | ||
24 | -FAIL 0110 0100 --1- ---- 1110 01-- ---- ---- # FMMLA, BFMMLA | ||
25 | FAIL 0110 0101 --0- ---- 0000 11-- ---- ---- # FTSMUL | ||
26 | FAIL 0110 0101 --01 0--- 100- ---- ---- ---- # FTMAD | ||
27 | FAIL 0110 0101 --01 1--- 001- ---- ---- ---- # FADDA | ||
28 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | ||
29 | index XXXXXXX..XXXXXXX 100644 | ||
30 | --- a/target/arm/translate-sve.c | ||
31 | +++ b/target/arm/translate-sve.c | ||
32 | @@ -XXX,XX +XXX,XX @@ static bool do_trans_pmull(DisasContext *s, arg_rrr_esz *a, bool sel) | ||
33 | gen_helper_gvec_pmull_q, gen_helper_sve2_pmull_h, | ||
34 | NULL, gen_helper_sve2_pmull_d, | ||
35 | }; | ||
36 | - if (a->esz == 0 | ||
37 | - ? !dc_isar_feature(aa64_sve2_pmull128, s) | ||
38 | - : !dc_isar_feature(aa64_sve, s)) { | ||
39 | + | ||
40 | + if (a->esz == 0) { | ||
41 | + if (!dc_isar_feature(aa64_sve2_pmull128, s)) { | ||
42 | + return false; | ||
43 | + } | ||
44 | + s->is_nonstreaming = true; | ||
45 | + } else if (!dc_isar_feature(aa64_sve, s)) { | ||
46 | return false; | ||
47 | } | ||
48 | return gen_gvec_ool_arg_zzz(s, fns[a->esz], a, sel); | ||
49 | @@ -XXX,XX +XXX,XX @@ DO_ZPZZ_FP(FMINP, aa64_sve2, sve2_fminp_zpzz) | ||
50 | * SVE Integer Multiply-Add (unpredicated) | ||
51 | */ | ||
52 | |||
53 | -TRANS_FEAT(FMMLA_s, aa64_sve_f32mm, gen_gvec_fpst_zzzz, gen_helper_fmmla_s, | ||
54 | - a->rd, a->rn, a->rm, a->ra, 0, FPST_FPCR) | ||
55 | -TRANS_FEAT(FMMLA_d, aa64_sve_f64mm, gen_gvec_fpst_zzzz, gen_helper_fmmla_d, | ||
56 | - a->rd, a->rn, a->rm, a->ra, 0, FPST_FPCR) | ||
57 | +TRANS_FEAT_NONSTREAMING(FMMLA_s, aa64_sve_f32mm, gen_gvec_fpst_zzzz, | ||
58 | + gen_helper_fmmla_s, a->rd, a->rn, a->rm, a->ra, | ||
59 | + 0, FPST_FPCR) | ||
60 | +TRANS_FEAT_NONSTREAMING(FMMLA_d, aa64_sve_f64mm, gen_gvec_fpst_zzzz, | ||
61 | + gen_helper_fmmla_d, a->rd, a->rn, a->rm, a->ra, | ||
62 | + 0, FPST_FPCR) | ||
63 | |||
64 | static gen_helper_gvec_4 * const sqdmlal_zzzw_fns[] = { | ||
65 | NULL, gen_helper_sve2_sqdmlal_zzzw_h, | ||
66 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(BFDOT_zzzz, aa64_sve_bf16, gen_gvec_ool_arg_zzzz, | ||
67 | TRANS_FEAT(BFDOT_zzxz, aa64_sve_bf16, gen_gvec_ool_arg_zzxz, | ||
68 | gen_helper_gvec_bfdot_idx, a) | ||
69 | |||
70 | -TRANS_FEAT(BFMMLA, aa64_sve_bf16, gen_gvec_ool_arg_zzzz, | ||
71 | - gen_helper_gvec_bfmmla, a, 0) | ||
72 | +TRANS_FEAT_NONSTREAMING(BFMMLA, aa64_sve_bf16, gen_gvec_ool_arg_zzzz, | ||
73 | + gen_helper_gvec_bfmmla, a, 0) | ||
74 | |||
75 | static bool do_BFMLAL_zzzw(DisasContext *s, arg_rrrr_esz *a, bool sel) | ||
76 | { | ||
77 | -- | ||
78 | 2.25.1 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Richard Henderson <richard.henderson@linaro.org> | ||
2 | 1 | ||
3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
4 | Message-id: 20220708151540.18136-26-richard.henderson@linaro.org | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | --- | ||
8 | target/arm/helper-sme.h | 2 ++ | ||
9 | target/arm/sme.decode | 2 ++ | ||
10 | target/arm/sme_helper.c | 56 ++++++++++++++++++++++++++++++++++++++ | ||
11 | target/arm/translate-sme.c | 30 ++++++++++++++++++++ | ||
12 | 4 files changed, 90 insertions(+) | ||
13 | |||
14 | diff --git a/target/arm/helper-sme.h b/target/arm/helper-sme.h | ||
15 | index XXXXXXX..XXXXXXX 100644 | ||
16 | --- a/target/arm/helper-sme.h | ||
17 | +++ b/target/arm/helper-sme.h | ||
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_7(sme_fmopa_s, TCG_CALL_NO_RWG, | ||
19 | void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | ||
20 | DEF_HELPER_FLAGS_7(sme_fmopa_d, TCG_CALL_NO_RWG, | ||
21 | void, ptr, ptr, ptr, ptr, ptr, ptr, i32) | ||
22 | +DEF_HELPER_FLAGS_6(sme_bfmopa, TCG_CALL_NO_RWG, | ||
23 | + void, ptr, ptr, ptr, ptr, ptr, i32) | ||
24 | diff --git a/target/arm/sme.decode b/target/arm/sme.decode | ||
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/target/arm/sme.decode | ||
27 | +++ b/target/arm/sme.decode | ||
28 | @@ -XXX,XX +XXX,XX @@ ADDVA_d 11000000 11 01000 1 ... ... ..... 00 ... @adda_64 | ||
29 | |||
30 | FMOPA_s 10000000 100 ..... ... ... ..... . 00 .. @op_32 | ||
31 | FMOPA_d 10000000 110 ..... ... ... ..... . 0 ... @op_64 | ||
32 | + | ||
33 | +BFMOPA 10000001 100 ..... ... ... ..... . 00 .. @op_32 | ||
34 | diff --git a/target/arm/sme_helper.c b/target/arm/sme_helper.c | ||
35 | index XXXXXXX..XXXXXXX 100644 | ||
36 | --- a/target/arm/sme_helper.c | ||
37 | +++ b/target/arm/sme_helper.c | ||
38 | @@ -XXX,XX +XXX,XX @@ void HELPER(sme_fmopa_d)(void *vza, void *vzn, void *vzm, void *vpn, | ||
39 | } | ||
40 | } | ||
41 | } | ||
42 | + | ||
43 | +/* | ||
44 | + * Alter PAIR as needed for controlling predicates being false, | ||
45 | + * and for NEG on an enabled row element. | ||
46 | + */ | ||
47 | +static inline uint32_t f16mop_adj_pair(uint32_t pair, uint32_t pg, uint32_t neg) | ||
48 | +{ | ||
49 | + /* | ||
50 | + * The pseudocode uses a conditional negate after the conditional zero. | ||
51 | + * It is simpler here to unconditionally negate before conditional zero. | ||
52 | + */ | ||
53 | + pair ^= neg; | ||
54 | + if (!(pg & 1)) { | ||
55 | + pair &= 0xffff0000u; | ||
56 | + } | ||
57 | + if (!(pg & 4)) { | ||
58 | + pair &= 0x0000ffffu; | ||
59 | + } | ||
60 | + return pair; | ||
61 | +} | ||
62 | + | ||
63 | +void HELPER(sme_bfmopa)(void *vza, void *vzn, void *vzm, void *vpn, | ||
64 | + void *vpm, uint32_t desc) | ||
65 | +{ | ||
66 | + intptr_t row, col, oprsz = simd_maxsz(desc); | ||
67 | + uint32_t neg = simd_data(desc) * 0x80008000u; | ||
68 | + uint16_t *pn = vpn, *pm = vpm; | ||
69 | + | ||
70 | + for (row = 0; row < oprsz; ) { | ||
71 | + uint16_t prow = pn[H2(row >> 4)]; | ||
72 | + do { | ||
73 | + void *vza_row = vza + tile_vslice_offset(row); | ||
74 | + uint32_t n = *(uint32_t *)(vzn + H1_4(row)); | ||
75 | + | ||
76 | + n = f16mop_adj_pair(n, prow, neg); | ||
77 | + | ||
78 | + for (col = 0; col < oprsz; ) { | ||
79 | + uint16_t pcol = pm[H2(col >> 4)]; | ||
80 | + do { | ||
81 | + if (prow & pcol & 0b0101) { | ||
82 | + uint32_t *a = vza_row + H1_4(col); | ||
83 | + uint32_t m = *(uint32_t *)(vzm + H1_4(col)); | ||
84 | + | ||
85 | + m = f16mop_adj_pair(m, pcol, 0); | ||
86 | + *a = bfdotadd(*a, n, m); | ||
87 | + | ||
88 | + col += 4; | ||
89 | + pcol >>= 4; | ||
90 | + } | ||
91 | + } while (col & 15); | ||
92 | + } | ||
93 | + row += 4; | ||
94 | + prow >>= 4; | ||
95 | + } while (row & 15); | ||
96 | + } | ||
97 | +} | ||
98 | diff --git a/target/arm/translate-sme.c b/target/arm/translate-sme.c | ||
99 | index XXXXXXX..XXXXXXX 100644 | ||
100 | --- a/target/arm/translate-sme.c | ||
101 | +++ b/target/arm/translate-sme.c | ||
102 | @@ -XXX,XX +XXX,XX @@ TRANS_FEAT(ADDVA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addva_s) | ||
103 | TRANS_FEAT(ADDHA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addha_d) | ||
104 | TRANS_FEAT(ADDVA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addva_d) | ||
105 | |||
106 | +static bool do_outprod(DisasContext *s, arg_op *a, MemOp esz, | ||
107 | + gen_helper_gvec_5 *fn) | ||
108 | +{ | ||
109 | + int svl = streaming_vec_reg_size(s); | ||
110 | + uint32_t desc = simd_desc(svl, svl, a->sub); | ||
111 | + TCGv_ptr za, zn, zm, pn, pm; | ||
112 | + | ||
113 | + if (!sme_smza_enabled_check(s)) { | ||
114 | + return true; | ||
115 | + } | ||
116 | + | ||
117 | + /* Sum XZR+zad to find ZAd. */ | ||
118 | + za = get_tile_rowcol(s, esz, 31, a->zad, false); | ||
119 | + zn = vec_full_reg_ptr(s, a->zn); | ||
120 | + zm = vec_full_reg_ptr(s, a->zm); | ||
121 | + pn = pred_full_reg_ptr(s, a->pn); | ||
122 | + pm = pred_full_reg_ptr(s, a->pm); | ||
123 | + | ||
124 | + fn(za, zn, zm, pn, pm, tcg_constant_i32(desc)); | ||
125 | + | ||
126 | + tcg_temp_free_ptr(za); | ||
127 | + tcg_temp_free_ptr(zn); | ||
128 | + tcg_temp_free_ptr(pn); | ||
129 | + tcg_temp_free_ptr(pm); | ||
130 | + return true; | ||
131 | +} | ||
132 | + | ||
133 | static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz, | ||
134 | gen_helper_gvec_5_ptr *fn) | ||
135 | { | ||
136 | @@ -XXX,XX +XXX,XX @@ static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz, | ||
137 | |||
138 | TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_s) | ||
139 | TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_fmopa_d) | ||
140 | + | ||
141 | +/* TODO: FEAT_EBF16 */ | ||
142 | +TRANS_FEAT(BFMOPA, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_bfmopa) | ||
143 | -- | ||
144 | 2.25.1 | diff view generated by jsdifflib |