1 | arm queue; dunno if this will be the last before softfreeze | 1 | Just my fp16 work, plus some small stuff for the sbsa-ref board; |
---|---|---|---|
2 | or not, but anyway probably the last large one. New orangepi-pc | 2 | but my rule of thumb is to send a pullreq once I get over about |
3 | board model is the big item here. | 3 | 30 patches... |
4 | 4 | ||
5 | thanks | ||
6 | -- PMM | 5 | -- PMM |
7 | 6 | ||
8 | The following changes since commit 67d9ef7d541c3d21a25796c51c26da096a433565: | 7 | The following changes since commit 2f4c51c0f384d7888a04b4815861e6d5fd244d75: |
9 | 8 | ||
10 | Merge remote-tracking branch 'remotes/pmaydell/tags/pull-docs-20200312' into staging (2020-03-12 15:20:52 +0000) | 9 | Merge remote-tracking branch 'remotes/kraxel/tags/usb-20200831-pull-request' into staging (2020-08-31 19:39:13 +0100) |
11 | 10 | ||
12 | are available in the Git repository at: | 11 | are available in the Git repository at: |
13 | 12 | ||
14 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20200312 | 13 | https://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20200901 |
15 | 14 | ||
16 | for you to fetch changes up to aca53be34ac3e7cac5f39396a51a338860a5a837: | 15 | for you to fetch changes up to 3f462bf0f6ea6382dd1502d4eb1fcd33c8e774f5: |
17 | 16 | ||
18 | target/arm: kvm: Inject events at the last stage of sync (2020-03-12 16:31:10 +0000) | 17 | hw/arm/sbsa-ref : Add embedded controller in secure memory (2020-09-01 14:01:34 +0100) |
19 | 18 | ||
20 | ---------------------------------------------------------------- | 19 | ---------------------------------------------------------------- |
21 | target-arm queue: | 20 | target-arm queue: |
22 | * Fix various bugs that might result in an assert() due to | 21 | * Implement fp16 support for AArch32 VFP and Neon |
23 | incorrect hflags for M-profile CPUs | 22 | * hw/arm/sbsa-ref: add "reg" property to DT cpu nodes |
24 | * Fix Aspeed SMC Controller user-mode select handling | 23 | * hw/arm/sbsa-ref : Add embedded controller in secure memory |
25 | * Report correct (with-tag) address in fault address register | ||
26 | when TBI is enabled | ||
27 | * cubieboard: make sure SOC object isn't leaked | ||
28 | * fsl-imx25: Wire up eSDHC controllers | ||
29 | * fsl-imx25: Wire up USB controllers | ||
30 | * New board model: orangepi-pc (OrangePi PC) | ||
31 | * ARM/KVM: if user doesn't select GIC version and the | ||
32 | host kernel can only provide GICv3, use that, rather | ||
33 | than defaulting to "fail because GICv2 isn't possible" | ||
34 | * kvm: Only do KVM_SET_VCPU_EVENTS at the last stage of sync | ||
35 | 24 | ||
36 | ---------------------------------------------------------------- | 25 | ---------------------------------------------------------------- |
37 | Beata Michalska (1): | 26 | Graeme Gregory (2): |
38 | target/arm: kvm: Inject events at the last stage of sync | 27 | hw/misc/sbsa_ec : Add an embedded controller for sbsa-ref |
28 | hw/arm/sbsa-ref : Add embedded controller in secure memory | ||
39 | 29 | ||
40 | Cédric Le Goater (2): | 30 | Leif Lindholm (1): |
41 | aspeed/smc: Add some tracing | 31 | hw/arm/sbsa-ref: add "reg" property to DT cpu nodes |
42 | aspeed/smc: Fix User mode select/unselect scheme | ||
43 | 32 | ||
44 | Eric Auger (6): | 33 | Peter Maydell (44): |
45 | hw/arm/virt: Document 'max' value in gic-version property description | 34 | target/arm: Remove local definitions of float constants |
46 | hw/arm/virt: Introduce VirtGICType enum type | 35 | target/arm: Use correct ID register check for aa32_fp16_arith |
47 | hw/arm/virt: Introduce finalize_gic_version() | 36 | target/arm: Implement VFP fp16 for VFP_BINOP operations |
48 | target/arm/kvm: Let kvm_arm_vgic_probe() return a bitmap | 37 | target/arm: Implement VFP fp16 VMLA, VMLS, VNMLS, VNMLA, VNMUL |
49 | hw/arm/virt: kvm: Restructure finalize_gic_version() | 38 | target/arm: Macroify trans functions for VFMA, VFMS, VFNMA, VFNMS |
50 | hw/arm/virt: kvm: allow gicv3 by default if v2 cannot work | 39 | target/arm: Implement VFP fp16 for fused-multiply-add |
40 | target/arm: Macroify uses of do_vfp_2op_sp() and do_vfp_2op_dp() | ||
41 | target/arm: Implement VFP fp16 for VABS, VNEG, VSQRT | ||
42 | target/arm: Implement VFP fp16 for VMOV immediate | ||
43 | target/arm: Implement VFP fp16 VCMP | ||
44 | target/arm: Implement VFP fp16 VLDR and VSTR | ||
45 | target/arm: Implement VFP fp16 VCVT between float and integer | ||
46 | target/arm: Make VFP_CONV_FIX macros take separate float type and float size | ||
47 | target/arm: Use macros instead of open-coding fp16 conversion helpers | ||
48 | target/arm: Implement VFP fp16 VCVT between float and fixed-point | ||
49 | target/arm: Implement VFP vp16 VCVT-with-specified-rounding-mode | ||
50 | target/arm: Implement VFP fp16 VSEL | ||
51 | target/arm: Implement VFP fp16 VRINT* | ||
52 | target/arm: Implement new VFP fp16 insn VINS | ||
53 | target/arm: Implement new VFP fp16 insn VMOVX | ||
54 | target/arm: Implement VFP fp16 VMOV between gp and halfprec registers | ||
55 | target/arm: Implement FP16 for Neon VADD, VSUB, VABD, VMUL | ||
56 | target/arm: Implement fp16 for Neon VRECPE, VRSQRTE using gvec | ||
57 | target/arm: Implement fp16 for Neon VABS, VNEG of floats | ||
58 | target/arm: Implement fp16 for VCEQ, VCGE, VCGT comparisons | ||
59 | target/arm: Implement fp16 for VACGE, VACGT | ||
60 | target/arm: Implement fp16 for Neon VMAX, VMIN | ||
61 | target/arm: Implement fp16 for Neon VMAXNM, VMINNM | ||
62 | target/arm: Implement fp16 for Neon VMLA, VMLS operations | ||
63 | target/arm: Implement fp16 for Neon VFMA, VMFS | ||
64 | target/arm: Implement fp16 for Neon fp compare-vs-0 | ||
65 | target/arm: Implement fp16 for Neon VRECPS | ||
66 | target/arm: Implement fp16 for Neon VRSQRTS | ||
67 | target/arm: Implement fp16 for Neon pairwise fp ops | ||
68 | target/arm: Implement fp16 for Neon float-integer VCVT | ||
69 | target/arm: Convert Neon VCVT fixed-point to gvec | ||
70 | target/arm: Implement fp16 for Neon VCVT fixed-point | ||
71 | target/arm: Implement fp16 for Neon VCVT with rounding modes | ||
72 | target/arm: Implement fp16 for Neon VRINT-with-specified-rounding-mode | ||
73 | target/arm: Implement fp16 for Neon VRINTX | ||
74 | target/arm/vec_helper: Handle oprsz less than 16 bytes in indexed operations | ||
75 | target/arm/vec_helper: Add gvec fp indexed multiply-and-add operations | ||
76 | target/arm: Implement fp16 for Neon VMUL, VMLA, VMLS | ||
77 | target/arm: Enable FP16 in '-cpu max' | ||
51 | 78 | ||
52 | Guenter Roeck (2): | 79 | target/arm/cpu.h | 7 +- |
53 | hw/arm/fsl-imx25: Wire up eSDHC controllers | 80 | target/arm/helper.h | 133 ++++++- |
54 | hw/arm/fsl-imx25: Wire up USB controllers | 81 | target/arm/neon-dp.decode | 8 +- |
82 | target/arm/vfp-uncond.decode | 27 +- | ||
83 | target/arm/vfp.decode | 34 +- | ||
84 | hw/arm/sbsa-ref.c | 43 ++- | ||
85 | hw/misc/sbsa_ec.c | 98 +++++ | ||
86 | target/arm/cpu.c | 3 +- | ||
87 | target/arm/cpu64.c | 10 +- | ||
88 | target/arm/helper-a64.c | 11 - | ||
89 | target/arm/translate-sve.c | 4 - | ||
90 | target/arm/vec_helper.c | 431 ++++++++++++++++++++- | ||
91 | target/arm/vfp_helper.c | 244 +++++------- | ||
92 | hw/misc/meson.build | 2 + | ||
93 | target/arm/translate-neon.c.inc | 755 +++++++++++++------------------------ | ||
94 | target/arm/translate-vfp.c.inc | 810 ++++++++++++++++++++++++++++++++++++---- | ||
95 | 16 files changed, 1819 insertions(+), 801 deletions(-) | ||
96 | create mode 100644 hw/misc/sbsa_ec.c | ||
55 | 97 | ||
56 | Igor Mammedov (1): | ||
57 | hw/arm/cubieboard: make sure SOC object isn't leaked | ||
58 | |||
59 | Niek Linnenbank (13): | ||
60 | hw/arm: add Allwinner H3 System-on-Chip | ||
61 | hw/arm: add Xunlong Orange Pi PC machine | ||
62 | hw/arm/allwinner-h3: add Clock Control Unit | ||
63 | hw/arm/allwinner-h3: add USB host controller | ||
64 | hw/arm/allwinner-h3: add System Control module | ||
65 | hw/arm/allwinner: add CPU Configuration module | ||
66 | hw/arm/allwinner: add Security Identifier device | ||
67 | hw/arm/allwinner: add SD/MMC host controller | ||
68 | hw/arm/allwinner-h3: add EMAC ethernet device | ||
69 | hw/arm/allwinner-h3: add Boot ROM support | ||
70 | hw/arm/allwinner-h3: add SDRAM controller device | ||
71 | hw/arm/allwinner: add RTC device support | ||
72 | docs: add Orange Pi PC document | ||
73 | |||
74 | Peter Maydell (4): | ||
75 | hw/intc/armv7m_nvic: Rebuild hflags on reset | ||
76 | target/arm: Update hflags in trans_CPS_v7m() | ||
77 | target/arm: Recalculate hflags correctly after writes to CONTROL | ||
78 | target/arm: Fix some comment typos | ||
79 | |||
80 | Philippe Mathieu-Daudé (5): | ||
81 | tests/boot_linux_console: Add a quick test for the OrangePi PC board | ||
82 | tests/boot_linux_console: Add initrd test for the Orange Pi PC board | ||
83 | tests/boot_linux_console: Add a SD card test for the OrangePi PC board | ||
84 | tests/boot_linux_console: Add a SLOW test booting Ubuntu on OrangePi PC | ||
85 | tests/boot_linux_console: Test booting NetBSD via U-Boot on OrangePi PC | ||
86 | |||
87 | Richard Henderson (2): | ||
88 | target/arm: Check addresses for disabled regimes | ||
89 | target/arm: Disable clean_data_tbi for system mode | ||
90 | |||
91 | Makefile.objs | 1 + | ||
92 | hw/arm/Makefile.objs | 1 + | ||
93 | hw/misc/Makefile.objs | 5 + | ||
94 | hw/net/Makefile.objs | 1 + | ||
95 | hw/rtc/Makefile.objs | 1 + | ||
96 | hw/sd/Makefile.objs | 1 + | ||
97 | hw/usb/hcd-ehci.h | 1 + | ||
98 | include/hw/arm/allwinner-a10.h | 4 + | ||
99 | include/hw/arm/allwinner-h3.h | 161 ++++++ | ||
100 | include/hw/arm/fsl-imx25.h | 18 + | ||
101 | include/hw/arm/virt.h | 12 +- | ||
102 | include/hw/misc/allwinner-cpucfg.h | 52 ++ | ||
103 | include/hw/misc/allwinner-h3-ccu.h | 66 +++ | ||
104 | include/hw/misc/allwinner-h3-dramc.h | 106 ++++ | ||
105 | include/hw/misc/allwinner-h3-sysctrl.h | 67 +++ | ||
106 | include/hw/misc/allwinner-sid.h | 60 +++ | ||
107 | include/hw/net/allwinner-sun8i-emac.h | 99 ++++ | ||
108 | include/hw/rtc/allwinner-rtc.h | 134 +++++ | ||
109 | include/hw/sd/allwinner-sdhost.h | 135 +++++ | ||
110 | target/arm/helper.h | 1 + | ||
111 | target/arm/kvm_arm.h | 3 + | ||
112 | hw/arm/allwinner-a10.c | 19 + | ||
113 | hw/arm/allwinner-h3.c | 465 ++++++++++++++++++ | ||
114 | hw/arm/cubieboard.c | 18 + | ||
115 | hw/arm/fsl-imx25.c | 56 +++ | ||
116 | hw/arm/imx25_pdk.c | 16 + | ||
117 | hw/arm/orangepi.c | 130 +++++ | ||
118 | hw/arm/virt.c | 145 ++++-- | ||
119 | hw/intc/armv7m_nvic.c | 6 + | ||
120 | hw/misc/allwinner-cpucfg.c | 282 +++++++++++ | ||
121 | hw/misc/allwinner-h3-ccu.c | 242 +++++++++ | ||
122 | hw/misc/allwinner-h3-dramc.c | 358 ++++++++++++++ | ||
123 | hw/misc/allwinner-h3-sysctrl.c | 140 ++++++ | ||
124 | hw/misc/allwinner-sid.c | 168 +++++++ | ||
125 | hw/net/allwinner-sun8i-emac.c | 871 +++++++++++++++++++++++++++++++++ | ||
126 | hw/rtc/allwinner-rtc.c | 411 ++++++++++++++++ | ||
127 | hw/sd/allwinner-sdhost.c | 854 ++++++++++++++++++++++++++++++++ | ||
128 | hw/ssi/aspeed_smc.c | 56 ++- | ||
129 | hw/usb/hcd-ehci-sysbus.c | 17 + | ||
130 | target/arm/helper.c | 49 +- | ||
131 | target/arm/kvm.c | 14 +- | ||
132 | target/arm/kvm32.c | 15 +- | ||
133 | target/arm/kvm64.c | 15 +- | ||
134 | target/arm/translate-a64.c | 11 + | ||
135 | target/arm/translate.c | 14 +- | ||
136 | MAINTAINERS | 9 + | ||
137 | default-configs/arm-softmmu.mak | 1 + | ||
138 | docs/system/arm/orangepi.rst | 253 ++++++++++ | ||
139 | docs/system/target-arm.rst | 2 + | ||
140 | hw/arm/Kconfig | 12 + | ||
141 | hw/misc/trace-events | 19 + | ||
142 | hw/net/Kconfig | 3 + | ||
143 | hw/net/trace-events | 10 + | ||
144 | hw/rtc/trace-events | 4 + | ||
145 | hw/sd/trace-events | 7 + | ||
146 | hw/ssi/trace-events | 10 + | ||
147 | tests/acceptance/boot_linux_console.py | 230 +++++++++ | ||
148 | 57 files changed, 5787 insertions(+), 74 deletions(-) | ||
149 | create mode 100644 include/hw/arm/allwinner-h3.h | ||
150 | create mode 100644 include/hw/misc/allwinner-cpucfg.h | ||
151 | create mode 100644 include/hw/misc/allwinner-h3-ccu.h | ||
152 | create mode 100644 include/hw/misc/allwinner-h3-dramc.h | ||
153 | create mode 100644 include/hw/misc/allwinner-h3-sysctrl.h | ||
154 | create mode 100644 include/hw/misc/allwinner-sid.h | ||
155 | create mode 100644 include/hw/net/allwinner-sun8i-emac.h | ||
156 | create mode 100644 include/hw/rtc/allwinner-rtc.h | ||
157 | create mode 100644 include/hw/sd/allwinner-sdhost.h | ||
158 | create mode 100644 hw/arm/allwinner-h3.c | ||
159 | create mode 100644 hw/arm/orangepi.c | ||
160 | create mode 100644 hw/misc/allwinner-cpucfg.c | ||
161 | create mode 100644 hw/misc/allwinner-h3-ccu.c | ||
162 | create mode 100644 hw/misc/allwinner-h3-dramc.c | ||
163 | create mode 100644 hw/misc/allwinner-h3-sysctrl.c | ||
164 | create mode 100644 hw/misc/allwinner-sid.c | ||
165 | create mode 100644 hw/net/allwinner-sun8i-emac.c | ||
166 | create mode 100644 hw/rtc/allwinner-rtc.c | ||
167 | create mode 100644 hw/sd/allwinner-sdhost.c | ||
168 | create mode 100644 docs/system/arm/orangepi.rst | ||
169 | create mode 100644 hw/ssi/trace-events | ||
170 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | In several places the target/arm code defines local float constants | ||
2 | for 2, 3 and 1.5, which are also provided by include/fpu/softfloat.h. | ||
3 | Remove the unnecessary local duplicate versions. | ||
1 | 4 | ||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20200828183354.27913-2-peter.maydell@linaro.org | ||
8 | --- | ||
9 | target/arm/helper-a64.c | 11 ----------- | ||
10 | target/arm/translate-sve.c | 4 ---- | ||
11 | target/arm/vfp_helper.c | 4 ---- | ||
12 | 3 files changed, 19 deletions(-) | ||
13 | |||
14 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | ||
16 | --- a/target/arm/helper-a64.c | ||
17 | +++ b/target/arm/helper-a64.c | ||
18 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_cgt_f64)(float64 a, float64 b, void *fpstp) | ||
19 | * versions, these do a fully fused multiply-add or | ||
20 | * multiply-add-and-halve. | ||
21 | */ | ||
22 | -#define float16_two make_float16(0x4000) | ||
23 | -#define float16_three make_float16(0x4200) | ||
24 | -#define float16_one_point_five make_float16(0x3e00) | ||
25 | - | ||
26 | -#define float32_two make_float32(0x40000000) | ||
27 | -#define float32_three make_float32(0x40400000) | ||
28 | -#define float32_one_point_five make_float32(0x3fc00000) | ||
29 | - | ||
30 | -#define float64_two make_float64(0x4000000000000000ULL) | ||
31 | -#define float64_three make_float64(0x4008000000000000ULL) | ||
32 | -#define float64_one_point_five make_float64(0x3FF8000000000000ULL) | ||
33 | |||
34 | uint32_t HELPER(recpsf_f16)(uint32_t a, uint32_t b, void *fpstp) | ||
35 | { | ||
36 | diff --git a/target/arm/translate-sve.c b/target/arm/translate-sve.c | ||
37 | index XXXXXXX..XXXXXXX 100644 | ||
38 | --- a/target/arm/translate-sve.c | ||
39 | +++ b/target/arm/translate-sve.c | ||
40 | @@ -XXX,XX +XXX,XX @@ static bool trans_##NAME##_zpzi(DisasContext *s, arg_rpri_esz *a) \ | ||
41 | return true; \ | ||
42 | } | ||
43 | |||
44 | -#define float16_two make_float16(0x4000) | ||
45 | -#define float32_two make_float32(0x40000000) | ||
46 | -#define float64_two make_float64(0x4000000000000000ULL) | ||
47 | - | ||
48 | DO_FP_IMM(FADD, fadds, half, one) | ||
49 | DO_FP_IMM(FSUB, fsubs, half, one) | ||
50 | DO_FP_IMM(FMUL, fmuls, half, two) | ||
51 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
52 | index XXXXXXX..XXXXXXX 100644 | ||
53 | --- a/target/arm/vfp_helper.c | ||
54 | +++ b/target/arm/vfp_helper.c | ||
55 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(vfp_fcvt_f64_to_f16)(float64 a, void *fpstp, uint32_t ahp_mode) | ||
56 | return r; | ||
57 | } | ||
58 | |||
59 | -#define float32_two make_float32(0x40000000) | ||
60 | -#define float32_three make_float32(0x40400000) | ||
61 | -#define float32_one_point_five make_float32(0x3fc00000) | ||
62 | - | ||
63 | float32 HELPER(recps_f32)(CPUARMState *env, float32 a, float32 b) | ||
64 | { | ||
65 | float_status *s = &env->vfp.standard_fp_status; | ||
66 | -- | ||
67 | 2.20.1 | ||
68 | |||
69 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | The aa32_fp16_arith feature check function currently looks at the | ||
2 | AArch64 ID_AA64PFR0 register. This is (as the comment notes) not | ||
3 | correct. The bogus check was put in mostly to allow testing of the | ||
4 | fp16 variants of the VCMLA instructions and it was something of | ||
5 | a mistake that we allowed them to exist in master. | ||
1 | 6 | ||
7 | Switch the feature check function to testing VMFR1.FPHP, which is | ||
8 | what it ought to be. | ||
9 | |||
10 | This will remove emulation of the VCMLA and VCADD insns from | ||
11 | AArch32 code running on an AArch64 '-cpu max' using system emulation. | ||
12 | (They were never enabled for aarch32 linux-user and system-emulation.) | ||
13 | Since we weren't advertising their existence via the AArch32 ID | ||
14 | register, well-behaved guests wouldn't have been using them anyway. | ||
15 | |||
16 | Once we have implemented all the AArch32 support for the FP16 extension | ||
17 | we will advertise it in the MVFR1 ID register field, which will reenable | ||
18 | these insns along with all the others. | ||
19 | |||
20 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
21 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
22 | Message-id: 20200828183354.27913-3-peter.maydell@linaro.org | ||
23 | --- | ||
24 | target/arm/cpu.h | 7 +------ | ||
25 | 1 file changed, 1 insertion(+), 6 deletions(-) | ||
26 | |||
27 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/cpu.h | ||
30 | +++ b/target/arm/cpu.h | ||
31 | @@ -XXX,XX +XXX,XX @@ static inline bool isar_feature_aa32_predinv(const ARMISARegisters *id) | ||
32 | |||
33 | static inline bool isar_feature_aa32_fp16_arith(const ARMISARegisters *id) | ||
34 | { | ||
35 | - /* | ||
36 | - * This is a placeholder for use by VCMA until the rest of | ||
37 | - * the ARMv8.2-FP16 extension is implemented for aa32 mode. | ||
38 | - * At which point we can properly set and check MVFR1.FPHP. | ||
39 | - */ | ||
40 | - return FIELD_EX64(id->id_aa64pfr0, ID_AA64PFR0, FP) == 1; | ||
41 | + return FIELD_EX32(id->mvfr1, MVFR1, FPHP) >= 3; | ||
42 | } | ||
43 | |||
44 | static inline bool isar_feature_aa32_vfp_simd(const ARMISARegisters *id) | ||
45 | -- | ||
46 | 2.20.1 | ||
47 | |||
48 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | 1 | Implmeent VFP fp16 support for simple binary-operator VFP insns VADD, | |
2 | VSUB, VMUL, VDIV, VMINNM and VMAXNM: | ||
3 | |||
4 | * make the VFP_BINOP() macro generate float16 helpers as well as | ||
5 | float32 and float64 | ||
6 | * implement a do_vfp_3op_hp() function similar to the existing | ||
7 | do_vfp_3op_sp() | ||
8 | * add decode for the half-precision insn patterns | ||
9 | |||
10 | Note that the VFP_BINOP macro use creates a couple of unused helper | ||
11 | functions vfp_maxh and vfp_minh, but they're small so it's not worth | ||
12 | splitting the BINOP operations into "needs halfprec" and "no | ||
13 | halfprec" groups. | ||
14 | |||
15 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
16 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
17 | Message-id: 20200828183354.27913-4-peter.maydell@linaro.org | ||
18 | --- | ||
19 | target/arm/helper.h | 8 ++++ | ||
20 | target/arm/vfp-uncond.decode | 3 ++ | ||
21 | target/arm/vfp.decode | 4 ++ | ||
22 | target/arm/vfp_helper.c | 5 ++ | ||
23 | target/arm/translate-vfp.c.inc | 86 ++++++++++++++++++++++++++++++++++ | ||
24 | 5 files changed, 106 insertions(+) | ||
25 | |||
26 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
27 | index XXXXXXX..XXXXXXX 100644 | ||
28 | --- a/target/arm/helper.h | ||
29 | +++ b/target/arm/helper.h | ||
30 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(probe_access, TCG_CALL_NO_WG, void, env, tl, i32, i32, i32) | ||
31 | DEF_HELPER_1(vfp_get_fpscr, i32, env) | ||
32 | DEF_HELPER_2(vfp_set_fpscr, void, env, i32) | ||
33 | |||
34 | +DEF_HELPER_3(vfp_addh, f16, f16, f16, ptr) | ||
35 | DEF_HELPER_3(vfp_adds, f32, f32, f32, ptr) | ||
36 | DEF_HELPER_3(vfp_addd, f64, f64, f64, ptr) | ||
37 | +DEF_HELPER_3(vfp_subh, f16, f16, f16, ptr) | ||
38 | DEF_HELPER_3(vfp_subs, f32, f32, f32, ptr) | ||
39 | DEF_HELPER_3(vfp_subd, f64, f64, f64, ptr) | ||
40 | +DEF_HELPER_3(vfp_mulh, f16, f16, f16, ptr) | ||
41 | DEF_HELPER_3(vfp_muls, f32, f32, f32, ptr) | ||
42 | DEF_HELPER_3(vfp_muld, f64, f64, f64, ptr) | ||
43 | +DEF_HELPER_3(vfp_divh, f16, f16, f16, ptr) | ||
44 | DEF_HELPER_3(vfp_divs, f32, f32, f32, ptr) | ||
45 | DEF_HELPER_3(vfp_divd, f64, f64, f64, ptr) | ||
46 | +DEF_HELPER_3(vfp_maxh, f16, f16, f16, ptr) | ||
47 | DEF_HELPER_3(vfp_maxs, f32, f32, f32, ptr) | ||
48 | DEF_HELPER_3(vfp_maxd, f64, f64, f64, ptr) | ||
49 | +DEF_HELPER_3(vfp_minh, f16, f16, f16, ptr) | ||
50 | DEF_HELPER_3(vfp_mins, f32, f32, f32, ptr) | ||
51 | DEF_HELPER_3(vfp_mind, f64, f64, f64, ptr) | ||
52 | +DEF_HELPER_3(vfp_maxnumh, f16, f16, f16, ptr) | ||
53 | DEF_HELPER_3(vfp_maxnums, f32, f32, f32, ptr) | ||
54 | DEF_HELPER_3(vfp_maxnumd, f64, f64, f64, ptr) | ||
55 | +DEF_HELPER_3(vfp_minnumh, f16, f16, f16, ptr) | ||
56 | DEF_HELPER_3(vfp_minnums, f32, f32, f32, ptr) | ||
57 | DEF_HELPER_3(vfp_minnumd, f64, f64, f64, ptr) | ||
58 | DEF_HELPER_1(vfp_negs, f32, f32) | ||
59 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode | ||
60 | index XXXXXXX..XXXXXXX 100644 | ||
61 | --- a/target/arm/vfp-uncond.decode | ||
62 | +++ b/target/arm/vfp-uncond.decode | ||
63 | @@ -XXX,XX +XXX,XX @@ VSEL 1111 1110 0. cc:2 .... .... 1010 .0.0 .... \ | ||
64 | VSEL 1111 1110 0. cc:2 .... .... 1011 .0.0 .... \ | ||
65 | vm=%vm_dp vn=%vn_dp vd=%vd_dp dp=1 | ||
66 | |||
67 | +VMAXNM_hp 1111 1110 1.00 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
68 | +VMINNM_hp 1111 1110 1.00 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
69 | + | ||
70 | VMAXNM_sp 1111 1110 1.00 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
71 | VMINNM_sp 1111 1110 1.00 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
72 | |||
73 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
74 | index XXXXXXX..XXXXXXX 100644 | ||
75 | --- a/target/arm/vfp.decode | ||
76 | +++ b/target/arm/vfp.decode | ||
77 | @@ -XXX,XX +XXX,XX @@ VNMLS_dp ---- 1110 0.01 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
78 | VNMLA_sp ---- 1110 0.01 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
79 | VNMLA_dp ---- 1110 0.01 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
80 | |||
81 | +VMUL_hp ---- 1110 0.10 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
82 | VMUL_sp ---- 1110 0.10 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
83 | VMUL_dp ---- 1110 0.10 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
84 | |||
85 | VNMUL_sp ---- 1110 0.10 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
86 | VNMUL_dp ---- 1110 0.10 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
87 | |||
88 | +VADD_hp ---- 1110 0.11 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
89 | VADD_sp ---- 1110 0.11 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
90 | VADD_dp ---- 1110 0.11 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
91 | |||
92 | +VSUB_hp ---- 1110 0.11 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
93 | VSUB_sp ---- 1110 0.11 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
94 | VSUB_dp ---- 1110 0.11 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
95 | |||
96 | +VDIV_hp ---- 1110 1.00 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
97 | VDIV_sp ---- 1110 1.00 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
98 | VDIV_dp ---- 1110 1.00 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
99 | |||
100 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
101 | index XXXXXXX..XXXXXXX 100644 | ||
102 | --- a/target/arm/vfp_helper.c | ||
103 | +++ b/target/arm/vfp_helper.c | ||
104 | @@ -XXX,XX +XXX,XX @@ void vfp_set_fpscr(CPUARMState *env, uint32_t val) | ||
105 | #define VFP_HELPER(name, p) HELPER(glue(glue(vfp_,name),p)) | ||
106 | |||
107 | #define VFP_BINOP(name) \ | ||
108 | +dh_ctype_f16 VFP_HELPER(name, h)(dh_ctype_f16 a, dh_ctype_f16 b, void *fpstp) \ | ||
109 | +{ \ | ||
110 | + float_status *fpst = fpstp; \ | ||
111 | + return float16_ ## name(a, b, fpst); \ | ||
112 | +} \ | ||
113 | float32 VFP_HELPER(name, s)(float32 a, float32 b, void *fpstp) \ | ||
114 | { \ | ||
115 | float_status *fpst = fpstp; \ | ||
116 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
117 | index XXXXXXX..XXXXXXX 100644 | ||
118 | --- a/target/arm/translate-vfp.c.inc | ||
119 | +++ b/target/arm/translate-vfp.c.inc | ||
120 | @@ -XXX,XX +XXX,XX @@ static bool do_vfp_3op_sp(DisasContext *s, VFPGen3OpSPFn *fn, | ||
121 | return true; | ||
122 | } | ||
123 | |||
124 | +static bool do_vfp_3op_hp(DisasContext *s, VFPGen3OpSPFn *fn, | ||
125 | + int vd, int vn, int vm, bool reads_vd) | ||
126 | +{ | ||
127 | + /* | ||
128 | + * Do a half-precision operation. Functionally this is | ||
129 | + * the same as do_vfp_3op_sp(), except: | ||
130 | + * - it uses the FPST_FPCR_F16 | ||
131 | + * - it doesn't need the VFP vector handling (fp16 is a | ||
132 | + * v8 feature, and in v8 VFP vectors don't exist) | ||
133 | + * - it does the aa32_fp16_arith feature test | ||
134 | + */ | ||
135 | + TCGv_i32 f0, f1, fd; | ||
136 | + TCGv_ptr fpst; | ||
137 | + | ||
138 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
139 | + return false; | ||
140 | + } | ||
141 | + | ||
142 | + if (s->vec_len != 0 || s->vec_stride != 0) { | ||
143 | + return false; | ||
144 | + } | ||
145 | + | ||
146 | + if (!vfp_access_check(s)) { | ||
147 | + return true; | ||
148 | + } | ||
149 | + | ||
150 | + f0 = tcg_temp_new_i32(); | ||
151 | + f1 = tcg_temp_new_i32(); | ||
152 | + fd = tcg_temp_new_i32(); | ||
153 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
154 | + | ||
155 | + neon_load_reg32(f0, vn); | ||
156 | + neon_load_reg32(f1, vm); | ||
157 | + | ||
158 | + if (reads_vd) { | ||
159 | + neon_load_reg32(fd, vd); | ||
160 | + } | ||
161 | + fn(fd, f0, f1, fpst); | ||
162 | + neon_store_reg32(fd, vd); | ||
163 | + | ||
164 | + tcg_temp_free_i32(f0); | ||
165 | + tcg_temp_free_i32(f1); | ||
166 | + tcg_temp_free_i32(fd); | ||
167 | + tcg_temp_free_ptr(fpst); | ||
168 | + | ||
169 | + return true; | ||
170 | +} | ||
171 | + | ||
172 | static bool do_vfp_3op_dp(DisasContext *s, VFPGen3OpDPFn *fn, | ||
173 | int vd, int vn, int vm, bool reads_vd) | ||
174 | { | ||
175 | @@ -XXX,XX +XXX,XX @@ static bool trans_VNMLA_dp(DisasContext *s, arg_VNMLA_dp *a) | ||
176 | return do_vfp_3op_dp(s, gen_VNMLA_dp, a->vd, a->vn, a->vm, true); | ||
177 | } | ||
178 | |||
179 | +static bool trans_VMUL_hp(DisasContext *s, arg_VMUL_sp *a) | ||
180 | +{ | ||
181 | + return do_vfp_3op_hp(s, gen_helper_vfp_mulh, a->vd, a->vn, a->vm, false); | ||
182 | +} | ||
183 | + | ||
184 | static bool trans_VMUL_sp(DisasContext *s, arg_VMUL_sp *a) | ||
185 | { | ||
186 | return do_vfp_3op_sp(s, gen_helper_vfp_muls, a->vd, a->vn, a->vm, false); | ||
187 | @@ -XXX,XX +XXX,XX @@ static bool trans_VNMUL_dp(DisasContext *s, arg_VNMUL_dp *a) | ||
188 | return do_vfp_3op_dp(s, gen_VNMUL_dp, a->vd, a->vn, a->vm, false); | ||
189 | } | ||
190 | |||
191 | +static bool trans_VADD_hp(DisasContext *s, arg_VADD_sp *a) | ||
192 | +{ | ||
193 | + return do_vfp_3op_hp(s, gen_helper_vfp_addh, a->vd, a->vn, a->vm, false); | ||
194 | +} | ||
195 | + | ||
196 | static bool trans_VADD_sp(DisasContext *s, arg_VADD_sp *a) | ||
197 | { | ||
198 | return do_vfp_3op_sp(s, gen_helper_vfp_adds, a->vd, a->vn, a->vm, false); | ||
199 | @@ -XXX,XX +XXX,XX @@ static bool trans_VADD_dp(DisasContext *s, arg_VADD_dp *a) | ||
200 | return do_vfp_3op_dp(s, gen_helper_vfp_addd, a->vd, a->vn, a->vm, false); | ||
201 | } | ||
202 | |||
203 | +static bool trans_VSUB_hp(DisasContext *s, arg_VSUB_sp *a) | ||
204 | +{ | ||
205 | + return do_vfp_3op_hp(s, gen_helper_vfp_subh, a->vd, a->vn, a->vm, false); | ||
206 | +} | ||
207 | + | ||
208 | static bool trans_VSUB_sp(DisasContext *s, arg_VSUB_sp *a) | ||
209 | { | ||
210 | return do_vfp_3op_sp(s, gen_helper_vfp_subs, a->vd, a->vn, a->vm, false); | ||
211 | @@ -XXX,XX +XXX,XX @@ static bool trans_VSUB_dp(DisasContext *s, arg_VSUB_dp *a) | ||
212 | return do_vfp_3op_dp(s, gen_helper_vfp_subd, a->vd, a->vn, a->vm, false); | ||
213 | } | ||
214 | |||
215 | +static bool trans_VDIV_hp(DisasContext *s, arg_VDIV_sp *a) | ||
216 | +{ | ||
217 | + return do_vfp_3op_hp(s, gen_helper_vfp_divh, a->vd, a->vn, a->vm, false); | ||
218 | +} | ||
219 | + | ||
220 | static bool trans_VDIV_sp(DisasContext *s, arg_VDIV_sp *a) | ||
221 | { | ||
222 | return do_vfp_3op_sp(s, gen_helper_vfp_divs, a->vd, a->vn, a->vm, false); | ||
223 | @@ -XXX,XX +XXX,XX @@ static bool trans_VDIV_dp(DisasContext *s, arg_VDIV_dp *a) | ||
224 | return do_vfp_3op_dp(s, gen_helper_vfp_divd, a->vd, a->vn, a->vm, false); | ||
225 | } | ||
226 | |||
227 | +static bool trans_VMINNM_hp(DisasContext *s, arg_VMINNM_sp *a) | ||
228 | +{ | ||
229 | + if (!dc_isar_feature(aa32_vminmaxnm, s)) { | ||
230 | + return false; | ||
231 | + } | ||
232 | + return do_vfp_3op_hp(s, gen_helper_vfp_minnumh, | ||
233 | + a->vd, a->vn, a->vm, false); | ||
234 | +} | ||
235 | + | ||
236 | +static bool trans_VMAXNM_hp(DisasContext *s, arg_VMAXNM_sp *a) | ||
237 | +{ | ||
238 | + if (!dc_isar_feature(aa32_vminmaxnm, s)) { | ||
239 | + return false; | ||
240 | + } | ||
241 | + return do_vfp_3op_hp(s, gen_helper_vfp_maxnumh, | ||
242 | + a->vd, a->vn, a->vm, false); | ||
243 | +} | ||
244 | + | ||
245 | static bool trans_VMINNM_sp(DisasContext *s, arg_VMINNM_sp *a) | ||
246 | { | ||
247 | if (!dc_isar_feature(aa32_vminmaxnm, s)) { | ||
248 | -- | ||
249 | 2.20.1 | ||
250 | |||
251 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | 1 | Implement fp16 versions of the VFP VMLA, VMLS, VNMLS, VNMLA, VNMUL | |
2 | instructions. (These are all the remaining ones which we implement | ||
3 | via do_vfp_3op_[hsd]p().) | ||
4 | |||
5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20200828183354.27913-5-peter.maydell@linaro.org | ||
8 | --- | ||
9 | target/arm/helper.h | 1 + | ||
10 | target/arm/vfp.decode | 5 ++ | ||
11 | target/arm/vfp_helper.c | 5 ++ | ||
12 | target/arm/translate-vfp.c.inc | 84 ++++++++++++++++++++++++++++++++++ | ||
13 | 4 files changed, 95 insertions(+) | ||
14 | |||
15 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/target/arm/helper.h | ||
18 | +++ b/target/arm/helper.h | ||
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_maxnumd, f64, f64, f64, ptr) | ||
20 | DEF_HELPER_3(vfp_minnumh, f16, f16, f16, ptr) | ||
21 | DEF_HELPER_3(vfp_minnums, f32, f32, f32, ptr) | ||
22 | DEF_HELPER_3(vfp_minnumd, f64, f64, f64, ptr) | ||
23 | +DEF_HELPER_1(vfp_negh, f16, f16) | ||
24 | DEF_HELPER_1(vfp_negs, f32, f32) | ||
25 | DEF_HELPER_1(vfp_negd, f64, f64) | ||
26 | DEF_HELPER_1(vfp_abss, f32, f32) | ||
27 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/vfp.decode | ||
30 | +++ b/target/arm/vfp.decode | ||
31 | @@ -XXX,XX +XXX,XX @@ VLDM_VSTM_dp ---- 1101 0.1 l:1 rn:4 .... 1011 imm:8 \ | ||
32 | vd=%vd_dp p=1 u=0 w=1 | ||
33 | |||
34 | # 3-register VFP data-processing; bits [23,21:20,6] identify the operation. | ||
35 | +VMLA_hp ---- 1110 0.00 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
36 | VMLA_sp ---- 1110 0.00 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
37 | VMLA_dp ---- 1110 0.00 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
38 | |||
39 | +VMLS_hp ---- 1110 0.00 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
40 | VMLS_sp ---- 1110 0.00 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
41 | VMLS_dp ---- 1110 0.00 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
42 | |||
43 | +VNMLS_hp ---- 1110 0.01 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
44 | VNMLS_sp ---- 1110 0.01 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
45 | VNMLS_dp ---- 1110 0.01 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
46 | |||
47 | +VNMLA_hp ---- 1110 0.01 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
48 | VNMLA_sp ---- 1110 0.01 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
49 | VNMLA_dp ---- 1110 0.01 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
50 | |||
51 | @@ -XXX,XX +XXX,XX @@ VMUL_hp ---- 1110 0.10 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
52 | VMUL_sp ---- 1110 0.10 .... .... 1010 .0.0 .... @vfp_dnm_s | ||
53 | VMUL_dp ---- 1110 0.10 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
54 | |||
55 | +VNMUL_hp ---- 1110 0.10 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
56 | VNMUL_sp ---- 1110 0.10 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
57 | VNMUL_dp ---- 1110 0.10 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
58 | |||
59 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
60 | index XXXXXXX..XXXXXXX 100644 | ||
61 | --- a/target/arm/vfp_helper.c | ||
62 | +++ b/target/arm/vfp_helper.c | ||
63 | @@ -XXX,XX +XXX,XX @@ VFP_BINOP(minnum) | ||
64 | VFP_BINOP(maxnum) | ||
65 | #undef VFP_BINOP | ||
66 | |||
67 | +dh_ctype_f16 VFP_HELPER(neg, h)(dh_ctype_f16 a) | ||
68 | +{ | ||
69 | + return float16_chs(a); | ||
70 | +} | ||
71 | + | ||
72 | float32 VFP_HELPER(neg, s)(float32 a) | ||
73 | { | ||
74 | return float32_chs(a); | ||
75 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
76 | index XXXXXXX..XXXXXXX 100644 | ||
77 | --- a/target/arm/translate-vfp.c.inc | ||
78 | +++ b/target/arm/translate-vfp.c.inc | ||
79 | @@ -XXX,XX +XXX,XX @@ static bool do_vfp_2op_dp(DisasContext *s, VFPGen2OpDPFn *fn, int vd, int vm) | ||
80 | return true; | ||
81 | } | ||
82 | |||
83 | +static void gen_VMLA_hp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
84 | +{ | ||
85 | + /* Note that order of inputs to the add matters for NaNs */ | ||
86 | + TCGv_i32 tmp = tcg_temp_new_i32(); | ||
87 | + | ||
88 | + gen_helper_vfp_mulh(tmp, vn, vm, fpst); | ||
89 | + gen_helper_vfp_addh(vd, vd, tmp, fpst); | ||
90 | + tcg_temp_free_i32(tmp); | ||
91 | +} | ||
92 | + | ||
93 | +static bool trans_VMLA_hp(DisasContext *s, arg_VMLA_sp *a) | ||
94 | +{ | ||
95 | + return do_vfp_3op_hp(s, gen_VMLA_hp, a->vd, a->vn, a->vm, true); | ||
96 | +} | ||
97 | + | ||
98 | static void gen_VMLA_sp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
99 | { | ||
100 | /* Note that order of inputs to the add matters for NaNs */ | ||
101 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMLA_dp(DisasContext *s, arg_VMLA_dp *a) | ||
102 | return do_vfp_3op_dp(s, gen_VMLA_dp, a->vd, a->vn, a->vm, true); | ||
103 | } | ||
104 | |||
105 | +static void gen_VMLS_hp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
106 | +{ | ||
107 | + /* | ||
108 | + * VMLS: vd = vd + -(vn * vm) | ||
109 | + * Note that order of inputs to the add matters for NaNs. | ||
110 | + */ | ||
111 | + TCGv_i32 tmp = tcg_temp_new_i32(); | ||
112 | + | ||
113 | + gen_helper_vfp_mulh(tmp, vn, vm, fpst); | ||
114 | + gen_helper_vfp_negh(tmp, tmp); | ||
115 | + gen_helper_vfp_addh(vd, vd, tmp, fpst); | ||
116 | + tcg_temp_free_i32(tmp); | ||
117 | +} | ||
118 | + | ||
119 | +static bool trans_VMLS_hp(DisasContext *s, arg_VMLS_sp *a) | ||
120 | +{ | ||
121 | + return do_vfp_3op_hp(s, gen_VMLS_hp, a->vd, a->vn, a->vm, true); | ||
122 | +} | ||
123 | + | ||
124 | static void gen_VMLS_sp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
125 | { | ||
126 | /* | ||
127 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMLS_dp(DisasContext *s, arg_VMLS_dp *a) | ||
128 | return do_vfp_3op_dp(s, gen_VMLS_dp, a->vd, a->vn, a->vm, true); | ||
129 | } | ||
130 | |||
131 | +static void gen_VNMLS_hp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
132 | +{ | ||
133 | + /* | ||
134 | + * VNMLS: -fd + (fn * fm) | ||
135 | + * Note that it isn't valid to replace (-A + B) with (B - A) or similar | ||
136 | + * plausible looking simplifications because this will give wrong results | ||
137 | + * for NaNs. | ||
138 | + */ | ||
139 | + TCGv_i32 tmp = tcg_temp_new_i32(); | ||
140 | + | ||
141 | + gen_helper_vfp_mulh(tmp, vn, vm, fpst); | ||
142 | + gen_helper_vfp_negh(vd, vd); | ||
143 | + gen_helper_vfp_addh(vd, vd, tmp, fpst); | ||
144 | + tcg_temp_free_i32(tmp); | ||
145 | +} | ||
146 | + | ||
147 | +static bool trans_VNMLS_hp(DisasContext *s, arg_VNMLS_sp *a) | ||
148 | +{ | ||
149 | + return do_vfp_3op_hp(s, gen_VNMLS_hp, a->vd, a->vn, a->vm, true); | ||
150 | +} | ||
151 | + | ||
152 | static void gen_VNMLS_sp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
153 | { | ||
154 | /* | ||
155 | @@ -XXX,XX +XXX,XX @@ static bool trans_VNMLS_dp(DisasContext *s, arg_VNMLS_dp *a) | ||
156 | return do_vfp_3op_dp(s, gen_VNMLS_dp, a->vd, a->vn, a->vm, true); | ||
157 | } | ||
158 | |||
159 | +static void gen_VNMLA_hp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
160 | +{ | ||
161 | + /* VNMLA: -fd + -(fn * fm) */ | ||
162 | + TCGv_i32 tmp = tcg_temp_new_i32(); | ||
163 | + | ||
164 | + gen_helper_vfp_mulh(tmp, vn, vm, fpst); | ||
165 | + gen_helper_vfp_negh(tmp, tmp); | ||
166 | + gen_helper_vfp_negh(vd, vd); | ||
167 | + gen_helper_vfp_addh(vd, vd, tmp, fpst); | ||
168 | + tcg_temp_free_i32(tmp); | ||
169 | +} | ||
170 | + | ||
171 | +static bool trans_VNMLA_hp(DisasContext *s, arg_VNMLA_sp *a) | ||
172 | +{ | ||
173 | + return do_vfp_3op_hp(s, gen_VNMLA_hp, a->vd, a->vn, a->vm, true); | ||
174 | +} | ||
175 | + | ||
176 | static void gen_VNMLA_sp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
177 | { | ||
178 | /* VNMLA: -fd + -(fn * fm) */ | ||
179 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMUL_dp(DisasContext *s, arg_VMUL_dp *a) | ||
180 | return do_vfp_3op_dp(s, gen_helper_vfp_muld, a->vd, a->vn, a->vm, false); | ||
181 | } | ||
182 | |||
183 | +static void gen_VNMUL_hp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
184 | +{ | ||
185 | + /* VNMUL: -(fn * fm) */ | ||
186 | + gen_helper_vfp_mulh(vd, vn, vm, fpst); | ||
187 | + gen_helper_vfp_negh(vd, vd); | ||
188 | +} | ||
189 | + | ||
190 | +static bool trans_VNMUL_hp(DisasContext *s, arg_VNMUL_sp *a) | ||
191 | +{ | ||
192 | + return do_vfp_3op_hp(s, gen_VNMUL_hp, a->vd, a->vn, a->vm, false); | ||
193 | +} | ||
194 | + | ||
195 | static void gen_VNMUL_sp(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, TCGv_ptr fpst) | ||
196 | { | ||
197 | /* VNMUL: -(fn * fm) */ | ||
198 | -- | ||
199 | 2.20.1 | ||
200 | |||
201 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Macroify creation of the trans functions for single and double | ||
2 | precision VFMA, VFMS, VFNMA, VFNMS. The repetition was OK for | ||
3 | two sizes, but we're about to add halfprec and it will get a bit | ||
4 | more than seems reasonable. | ||
1 | 5 | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20200828183354.27913-6-peter.maydell@linaro.org | ||
9 | --- | ||
10 | target/arm/translate-vfp.c.inc | 50 +++++++++------------------------- | ||
11 | 1 file changed, 13 insertions(+), 37 deletions(-) | ||
12 | |||
13 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
14 | index XXXXXXX..XXXXXXX 100644 | ||
15 | --- a/target/arm/translate-vfp.c.inc | ||
16 | +++ b/target/arm/translate-vfp.c.inc | ||
17 | @@ -XXX,XX +XXX,XX @@ static bool do_vfm_sp(DisasContext *s, arg_VFMA_sp *a, bool neg_n, bool neg_d) | ||
18 | return true; | ||
19 | } | ||
20 | |||
21 | -static bool trans_VFMA_sp(DisasContext *s, arg_VFMA_sp *a) | ||
22 | -{ | ||
23 | - return do_vfm_sp(s, a, false, false); | ||
24 | -} | ||
25 | - | ||
26 | -static bool trans_VFMS_sp(DisasContext *s, arg_VFMS_sp *a) | ||
27 | -{ | ||
28 | - return do_vfm_sp(s, a, true, false); | ||
29 | -} | ||
30 | - | ||
31 | -static bool trans_VFNMA_sp(DisasContext *s, arg_VFNMA_sp *a) | ||
32 | -{ | ||
33 | - return do_vfm_sp(s, a, false, true); | ||
34 | -} | ||
35 | - | ||
36 | -static bool trans_VFNMS_sp(DisasContext *s, arg_VFNMS_sp *a) | ||
37 | -{ | ||
38 | - return do_vfm_sp(s, a, true, true); | ||
39 | -} | ||
40 | - | ||
41 | static bool do_vfm_dp(DisasContext *s, arg_VFMA_dp *a, bool neg_n, bool neg_d) | ||
42 | { | ||
43 | /* | ||
44 | @@ -XXX,XX +XXX,XX @@ static bool do_vfm_dp(DisasContext *s, arg_VFMA_dp *a, bool neg_n, bool neg_d) | ||
45 | return true; | ||
46 | } | ||
47 | |||
48 | -static bool trans_VFMA_dp(DisasContext *s, arg_VFMA_dp *a) | ||
49 | -{ | ||
50 | - return do_vfm_dp(s, a, false, false); | ||
51 | -} | ||
52 | +#define MAKE_ONE_VFM_TRANS_FN(INSN, PREC, NEGN, NEGD) \ | ||
53 | + static bool trans_##INSN##_##PREC(DisasContext *s, \ | ||
54 | + arg_##INSN##_##PREC *a) \ | ||
55 | + { \ | ||
56 | + return do_vfm_##PREC(s, a, NEGN, NEGD); \ | ||
57 | + } | ||
58 | |||
59 | -static bool trans_VFMS_dp(DisasContext *s, arg_VFMS_dp *a) | ||
60 | -{ | ||
61 | - return do_vfm_dp(s, a, true, false); | ||
62 | -} | ||
63 | +#define MAKE_VFM_TRANS_FNS(PREC) \ | ||
64 | + MAKE_ONE_VFM_TRANS_FN(VFMA, PREC, false, false) \ | ||
65 | + MAKE_ONE_VFM_TRANS_FN(VFMS, PREC, true, false) \ | ||
66 | + MAKE_ONE_VFM_TRANS_FN(VFNMA, PREC, false, true) \ | ||
67 | + MAKE_ONE_VFM_TRANS_FN(VFNMS, PREC, true, true) | ||
68 | |||
69 | -static bool trans_VFNMA_dp(DisasContext *s, arg_VFNMA_dp *a) | ||
70 | -{ | ||
71 | - return do_vfm_dp(s, a, false, true); | ||
72 | -} | ||
73 | - | ||
74 | -static bool trans_VFNMS_dp(DisasContext *s, arg_VFNMS_dp *a) | ||
75 | -{ | ||
76 | - return do_vfm_dp(s, a, true, true); | ||
77 | -} | ||
78 | +MAKE_VFM_TRANS_FNS(sp) | ||
79 | +MAKE_VFM_TRANS_FNS(dp) | ||
80 | |||
81 | static bool trans_VMOV_imm_sp(DisasContext *s, arg_VMOV_imm_sp *a) | ||
82 | { | ||
83 | -- | ||
84 | 2.20.1 | ||
85 | |||
86 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement VFP fp16 support for fused multiply-add insns |
---|---|---|---|
2 | VFNMA, VFNMS, VFMA, VFMS. | ||
2 | 3 | ||
3 | In the Allwinner H3 SoC the SDRAM controller is responsible | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | for interfacing with the external Synchronous Dynamic Random | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Access Memory (SDRAM). Types of memory that the SDRAM controller | 6 | Message-id: 20200828183354.27913-7-peter.maydell@linaro.org |
6 | supports are DDR2/DDR3 and capacities of up to 2GiB. This commit | 7 | --- |
7 | adds emulation support of the Allwinner H3 SDRAM controller. | 8 | target/arm/helper.h | 1 + |
9 | target/arm/vfp.decode | 5 +++ | ||
10 | target/arm/vfp_helper.c | 7 ++++ | ||
11 | target/arm/translate-vfp.c.inc | 64 ++++++++++++++++++++++++++++++++++ | ||
12 | 4 files changed, 77 insertions(+) | ||
8 | 13 | ||
9 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 14 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
10 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
11 | Message-id: 20200311221854.30370-12-nieklinnenbank@gmail.com | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | --- | ||
14 | hw/misc/Makefile.objs | 1 + | ||
15 | include/hw/arm/allwinner-h3.h | 5 + | ||
16 | include/hw/misc/allwinner-h3-dramc.h | 106 ++++++++ | ||
17 | hw/arm/allwinner-h3.c | 19 +- | ||
18 | hw/arm/orangepi.c | 6 + | ||
19 | hw/misc/allwinner-h3-dramc.c | 358 +++++++++++++++++++++++++++ | ||
20 | hw/misc/trace-events | 10 + | ||
21 | 7 files changed, 502 insertions(+), 3 deletions(-) | ||
22 | create mode 100644 include/hw/misc/allwinner-h3-dramc.h | ||
23 | create mode 100644 hw/misc/allwinner-h3-dramc.c | ||
24 | |||
25 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | ||
26 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
27 | --- a/hw/misc/Makefile.objs | 16 | --- a/target/arm/helper.h |
28 | +++ b/hw/misc/Makefile.objs | 17 | +++ b/target/arm/helper.h |
29 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_IVSHMEM_DEVICE) += ivshmem.o | 18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(vfp_fcvt_f64_to_f16, TCG_CALL_NO_RWG, f16, f64, ptr, i32) |
30 | 19 | ||
31 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-ccu.o | 20 | DEF_HELPER_4(vfp_muladdd, f64, f64, f64, f64, ptr) |
32 | obj-$(CONFIG_ALLWINNER_H3) += allwinner-cpucfg.o | 21 | DEF_HELPER_4(vfp_muladds, f32, f32, f32, f32, ptr) |
33 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-dramc.o | 22 | +DEF_HELPER_4(vfp_muladdh, f16, f16, f16, f16, ptr) |
34 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-sysctrl.o | 23 | |
35 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-sid.o | 24 | DEF_HELPER_3(recps_f32, f32, env, f32, f32) |
36 | common-obj-$(CONFIG_REALVIEW) += arm_sysctl.o | 25 | DEF_HELPER_3(rsqrts_f32, f32, env, f32, f32) |
37 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 26 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode |
38 | index XXXXXXX..XXXXXXX 100644 | 27 | index XXXXXXX..XXXXXXX 100644 |
39 | --- a/include/hw/arm/allwinner-h3.h | 28 | --- a/target/arm/vfp.decode |
40 | +++ b/include/hw/arm/allwinner-h3.h | 29 | +++ b/target/arm/vfp.decode |
41 | @@ -XXX,XX +XXX,XX @@ | 30 | @@ -XXX,XX +XXX,XX @@ VDIV_hp ---- 1110 1.00 .... .... 1001 .0.0 .... @vfp_dnm_s |
42 | #include "hw/intc/arm_gic.h" | 31 | VDIV_sp ---- 1110 1.00 .... .... 1010 .0.0 .... @vfp_dnm_s |
43 | #include "hw/misc/allwinner-h3-ccu.h" | 32 | VDIV_dp ---- 1110 1.00 .... .... 1011 .0.0 .... @vfp_dnm_d |
44 | #include "hw/misc/allwinner-cpucfg.h" | 33 | |
45 | +#include "hw/misc/allwinner-h3-dramc.h" | 34 | +VFMA_hp ---- 1110 1.10 .... .... 1001 .0. 0 .... @vfp_dnm_s |
46 | #include "hw/misc/allwinner-h3-sysctrl.h" | 35 | +VFMS_hp ---- 1110 1.10 .... .... 1001 .1. 0 .... @vfp_dnm_s |
47 | #include "hw/misc/allwinner-sid.h" | 36 | +VFNMA_hp ---- 1110 1.01 .... .... 1001 .0. 0 .... @vfp_dnm_s |
48 | #include "hw/sd/allwinner-sdhost.h" | 37 | +VFNMS_hp ---- 1110 1.01 .... .... 1001 .1. 0 .... @vfp_dnm_s |
49 | @@ -XXX,XX +XXX,XX @@ enum { | ||
50 | AW_H3_UART2, | ||
51 | AW_H3_UART3, | ||
52 | AW_H3_EMAC, | ||
53 | + AW_H3_DRAMCOM, | ||
54 | + AW_H3_DRAMCTL, | ||
55 | + AW_H3_DRAMPHY, | ||
56 | AW_H3_GIC_DIST, | ||
57 | AW_H3_GIC_CPU, | ||
58 | AW_H3_GIC_HYP, | ||
59 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
60 | AwA10PITState timer; | ||
61 | AwH3ClockCtlState ccu; | ||
62 | AwCpuCfgState cpucfg; | ||
63 | + AwH3DramCtlState dramc; | ||
64 | AwH3SysCtrlState sysctrl; | ||
65 | AwSidState sid; | ||
66 | AwSdHostState mmc0; | ||
67 | diff --git a/include/hw/misc/allwinner-h3-dramc.h b/include/hw/misc/allwinner-h3-dramc.h | ||
68 | new file mode 100644 | ||
69 | index XXXXXXX..XXXXXXX | ||
70 | --- /dev/null | ||
71 | +++ b/include/hw/misc/allwinner-h3-dramc.h | ||
72 | @@ -XXX,XX +XXX,XX @@ | ||
73 | +/* | ||
74 | + * Allwinner H3 SDRAM Controller emulation | ||
75 | + * | ||
76 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
77 | + * | ||
78 | + * This program is free software: you can redistribute it and/or modify | ||
79 | + * it under the terms of the GNU General Public License as published by | ||
80 | + * the Free Software Foundation, either version 2 of the License, or | ||
81 | + * (at your option) any later version. | ||
82 | + * | ||
83 | + * This program is distributed in the hope that it will be useful, | ||
84 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
85 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
86 | + * GNU General Public License for more details. | ||
87 | + * | ||
88 | + * You should have received a copy of the GNU General Public License | ||
89 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
90 | + */ | ||
91 | + | 38 | + |
92 | +#ifndef HW_MISC_ALLWINNER_H3_DRAMC_H | 39 | VFMA_sp ---- 1110 1.10 .... .... 1010 .0. 0 .... @vfp_dnm_s |
93 | +#define HW_MISC_ALLWINNER_H3_DRAMC_H | 40 | VFMS_sp ---- 1110 1.10 .... .... 1010 .1. 0 .... @vfp_dnm_s |
41 | VFNMA_sp ---- 1110 1.01 .... .... 1010 .0. 0 .... @vfp_dnm_s | ||
42 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
43 | index XXXXXXX..XXXXXXX 100644 | ||
44 | --- a/target/arm/vfp_helper.c | ||
45 | +++ b/target/arm/vfp_helper.c | ||
46 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(rsqrte_u32)(uint32_t a) | ||
47 | } | ||
48 | |||
49 | /* VFPv4 fused multiply-accumulate */ | ||
50 | +dh_ctype_f16 VFP_HELPER(muladd, h)(dh_ctype_f16 a, dh_ctype_f16 b, | ||
51 | + dh_ctype_f16 c, void *fpstp) | ||
52 | +{ | ||
53 | + float_status *fpst = fpstp; | ||
54 | + return float16_muladd(a, b, c, 0, fpst); | ||
55 | +} | ||
94 | + | 56 | + |
95 | +#include "qom/object.h" | 57 | float32 VFP_HELPER(muladd, s)(float32 a, float32 b, float32 c, void *fpstp) |
96 | +#include "hw/sysbus.h" | 58 | { |
97 | +#include "exec/hwaddr.h" | 59 | float_status *fpst = fpstp; |
98 | + | 60 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
99 | +/** | ||
100 | + * Constants | ||
101 | + * @{ | ||
102 | + */ | ||
103 | + | ||
104 | +/** Highest register address used by DRAMCOM module */ | ||
105 | +#define AW_H3_DRAMCOM_REGS_MAXADDR (0x804) | ||
106 | + | ||
107 | +/** Total number of known DRAMCOM registers */ | ||
108 | +#define AW_H3_DRAMCOM_REGS_NUM (AW_H3_DRAMCOM_REGS_MAXADDR / \ | ||
109 | + sizeof(uint32_t)) | ||
110 | + | ||
111 | +/** Highest register address used by DRAMCTL module */ | ||
112 | +#define AW_H3_DRAMCTL_REGS_MAXADDR (0x88c) | ||
113 | + | ||
114 | +/** Total number of known DRAMCTL registers */ | ||
115 | +#define AW_H3_DRAMCTL_REGS_NUM (AW_H3_DRAMCTL_REGS_MAXADDR / \ | ||
116 | + sizeof(uint32_t)) | ||
117 | + | ||
118 | +/** Highest register address used by DRAMPHY module */ | ||
119 | +#define AW_H3_DRAMPHY_REGS_MAXADDR (0x4) | ||
120 | + | ||
121 | +/** Total number of known DRAMPHY registers */ | ||
122 | +#define AW_H3_DRAMPHY_REGS_NUM (AW_H3_DRAMPHY_REGS_MAXADDR / \ | ||
123 | + sizeof(uint32_t)) | ||
124 | + | ||
125 | +/** @} */ | ||
126 | + | ||
127 | +/** | ||
128 | + * Object model | ||
129 | + * @{ | ||
130 | + */ | ||
131 | + | ||
132 | +#define TYPE_AW_H3_DRAMC "allwinner-h3-dramc" | ||
133 | +#define AW_H3_DRAMC(obj) \ | ||
134 | + OBJECT_CHECK(AwH3DramCtlState, (obj), TYPE_AW_H3_DRAMC) | ||
135 | + | ||
136 | +/** @} */ | ||
137 | + | ||
138 | +/** | ||
139 | + * Allwinner H3 SDRAM Controller object instance state. | ||
140 | + */ | ||
141 | +typedef struct AwH3DramCtlState { | ||
142 | + /*< private >*/ | ||
143 | + SysBusDevice parent_obj; | ||
144 | + /*< public >*/ | ||
145 | + | ||
146 | + /** Physical base address for start of RAM */ | ||
147 | + hwaddr ram_addr; | ||
148 | + | ||
149 | + /** Total RAM size in megabytes */ | ||
150 | + uint32_t ram_size; | ||
151 | + | ||
152 | + /** | ||
153 | + * @name Memory Regions | ||
154 | + * @{ | ||
155 | + */ | ||
156 | + | ||
157 | + MemoryRegion row_mirror; /**< Simulates rows for RAM size detection */ | ||
158 | + MemoryRegion row_mirror_alias; /**< Alias of the row which is mirrored */ | ||
159 | + MemoryRegion dramcom_iomem; /**< DRAMCOM module I/O registers */ | ||
160 | + MemoryRegion dramctl_iomem; /**< DRAMCTL module I/O registers */ | ||
161 | + MemoryRegion dramphy_iomem; /**< DRAMPHY module I/O registers */ | ||
162 | + | ||
163 | + /** @} */ | ||
164 | + | ||
165 | + /** | ||
166 | + * @name Hardware Registers | ||
167 | + * @{ | ||
168 | + */ | ||
169 | + | ||
170 | + uint32_t dramcom[AW_H3_DRAMCOM_REGS_NUM]; /**< Array of DRAMCOM registers */ | ||
171 | + uint32_t dramctl[AW_H3_DRAMCTL_REGS_NUM]; /**< Array of DRAMCTL registers */ | ||
172 | + uint32_t dramphy[AW_H3_DRAMPHY_REGS_NUM] ;/**< Array of DRAMPHY registers */ | ||
173 | + | ||
174 | + /** @} */ | ||
175 | + | ||
176 | +} AwH3DramCtlState; | ||
177 | + | ||
178 | +#endif /* HW_MISC_ALLWINNER_H3_DRAMC_H */ | ||
179 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
180 | index XXXXXXX..XXXXXXX 100644 | 61 | index XXXXXXX..XXXXXXX 100644 |
181 | --- a/hw/arm/allwinner-h3.c | 62 | --- a/target/arm/translate-vfp.c.inc |
182 | +++ b/hw/arm/allwinner-h3.c | 63 | +++ b/target/arm/translate-vfp.c.inc |
183 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | 64 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMAXNM_dp(DisasContext *s, arg_VMAXNM_dp *a) |
184 | [AW_H3_UART2] = 0x01c28800, | 65 | a->vd, a->vn, a->vm, false); |
185 | [AW_H3_UART3] = 0x01c28c00, | ||
186 | [AW_H3_EMAC] = 0x01c30000, | ||
187 | + [AW_H3_DRAMCOM] = 0x01c62000, | ||
188 | + [AW_H3_DRAMCTL] = 0x01c63000, | ||
189 | + [AW_H3_DRAMPHY] = 0x01c65000, | ||
190 | [AW_H3_GIC_DIST] = 0x01c81000, | ||
191 | [AW_H3_GIC_CPU] = 0x01c82000, | ||
192 | [AW_H3_GIC_HYP] = 0x01c84000, | ||
193 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
194 | { "scr", 0x01c2c400, 1 * KiB }, | ||
195 | { "gpu", 0x01c40000, 64 * KiB }, | ||
196 | { "hstmr", 0x01c60000, 4 * KiB }, | ||
197 | - { "dramcom", 0x01c62000, 4 * KiB }, | ||
198 | - { "dramctl0", 0x01c63000, 4 * KiB }, | ||
199 | - { "dramphy0", 0x01c65000, 4 * KiB }, | ||
200 | { "spi0", 0x01c68000, 4 * KiB }, | ||
201 | { "spi1", 0x01c69000, 4 * KiB }, | ||
202 | { "csi", 0x01cb0000, 320 * KiB }, | ||
203 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
204 | |||
205 | sysbus_init_child_obj(obj, "emac", &s->emac, sizeof(s->emac), | ||
206 | TYPE_AW_SUN8I_EMAC); | ||
207 | + | ||
208 | + sysbus_init_child_obj(obj, "dramc", &s->dramc, sizeof(s->dramc), | ||
209 | + TYPE_AW_H3_DRAMC); | ||
210 | + object_property_add_alias(obj, "ram-addr", OBJECT(&s->dramc), | ||
211 | + "ram-addr", &error_abort); | ||
212 | + object_property_add_alias(obj, "ram-size", OBJECT(&s->dramc), | ||
213 | + "ram-size", &error_abort); | ||
214 | } | 66 | } |
215 | 67 | ||
216 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | 68 | +static bool do_vfm_hp(DisasContext *s, arg_VFMA_sp *a, bool neg_n, bool neg_d) |
217 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
218 | qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART3), | ||
219 | 115200, serial_hd(3), DEVICE_NATIVE_ENDIAN); | ||
220 | |||
221 | + /* DRAMC */ | ||
222 | + qdev_init_nofail(DEVICE(&s->dramc)); | ||
223 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 0, s->memmap[AW_H3_DRAMCOM]); | ||
224 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 1, s->memmap[AW_H3_DRAMCTL]); | ||
225 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 2, s->memmap[AW_H3_DRAMPHY]); | ||
226 | + | ||
227 | /* Unimplemented devices */ | ||
228 | for (i = 0; i < ARRAY_SIZE(unimplemented); i++) { | ||
229 | create_unimplemented_device(unimplemented[i].device_name, | ||
230 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | ||
231 | index XXXXXXX..XXXXXXX 100644 | ||
232 | --- a/hw/arm/orangepi.c | ||
233 | +++ b/hw/arm/orangepi.c | ||
234 | @@ -XXX,XX +XXX,XX @@ static void orangepi_init(MachineState *machine) | ||
235 | /* Setup EMAC properties */ | ||
236 | object_property_set_int(OBJECT(&h3->emac), 1, "phy-addr", &error_abort); | ||
237 | |||
238 | + /* DRAMC */ | ||
239 | + object_property_set_uint(OBJECT(h3), h3->memmap[AW_H3_SDRAM], | ||
240 | + "ram-addr", &error_abort); | ||
241 | + object_property_set_int(OBJECT(h3), machine->ram_size / MiB, "ram-size", | ||
242 | + &error_abort); | ||
243 | + | ||
244 | /* Mark H3 object realized */ | ||
245 | object_property_set_bool(OBJECT(h3), true, "realized", &error_abort); | ||
246 | |||
247 | diff --git a/hw/misc/allwinner-h3-dramc.c b/hw/misc/allwinner-h3-dramc.c | ||
248 | new file mode 100644 | ||
249 | index XXXXXXX..XXXXXXX | ||
250 | --- /dev/null | ||
251 | +++ b/hw/misc/allwinner-h3-dramc.c | ||
252 | @@ -XXX,XX +XXX,XX @@ | ||
253 | +/* | ||
254 | + * Allwinner H3 SDRAM Controller emulation | ||
255 | + * | ||
256 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
257 | + * | ||
258 | + * This program is free software: you can redistribute it and/or modify | ||
259 | + * it under the terms of the GNU General Public License as published by | ||
260 | + * the Free Software Foundation, either version 2 of the License, or | ||
261 | + * (at your option) any later version. | ||
262 | + * | ||
263 | + * This program is distributed in the hope that it will be useful, | ||
264 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
265 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
266 | + * GNU General Public License for more details. | ||
267 | + * | ||
268 | + * You should have received a copy of the GNU General Public License | ||
269 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
270 | + */ | ||
271 | + | ||
272 | +#include "qemu/osdep.h" | ||
273 | +#include "qemu/units.h" | ||
274 | +#include "qemu/error-report.h" | ||
275 | +#include "hw/sysbus.h" | ||
276 | +#include "migration/vmstate.h" | ||
277 | +#include "qemu/log.h" | ||
278 | +#include "qemu/module.h" | ||
279 | +#include "exec/address-spaces.h" | ||
280 | +#include "hw/qdev-properties.h" | ||
281 | +#include "qapi/error.h" | ||
282 | +#include "hw/misc/allwinner-h3-dramc.h" | ||
283 | +#include "trace.h" | ||
284 | + | ||
285 | +#define REG_INDEX(offset) (offset / sizeof(uint32_t)) | ||
286 | + | ||
287 | +/* DRAMCOM register offsets */ | ||
288 | +enum { | ||
289 | + REG_DRAMCOM_CR = 0x0000, /* Control Register */ | ||
290 | +}; | ||
291 | + | ||
292 | +/* DRAMCTL register offsets */ | ||
293 | +enum { | ||
294 | + REG_DRAMCTL_PIR = 0x0000, /* PHY Initialization Register */ | ||
295 | + REG_DRAMCTL_PGSR = 0x0010, /* PHY General Status Register */ | ||
296 | + REG_DRAMCTL_STATR = 0x0018, /* Status Register */ | ||
297 | +}; | ||
298 | + | ||
299 | +/* DRAMCTL register flags */ | ||
300 | +enum { | ||
301 | + REG_DRAMCTL_PGSR_INITDONE = (1 << 0), | ||
302 | +}; | ||
303 | + | ||
304 | +enum { | ||
305 | + REG_DRAMCTL_STATR_ACTIVE = (1 << 0), | ||
306 | +}; | ||
307 | + | ||
308 | +static void allwinner_h3_dramc_map_rows(AwH3DramCtlState *s, uint8_t row_bits, | ||
309 | + uint8_t bank_bits, uint16_t page_size) | ||
310 | +{ | 69 | +{ |
311 | + /* | 70 | + /* |
312 | + * This function simulates row addressing behavior when bootloader | 71 | + * VFNMA : fd = muladd(-fd, fn, fm) |
313 | + * software attempts to detect the amount of available SDRAM. In U-Boot | 72 | + * VFNMS : fd = muladd(-fd, -fn, fm) |
314 | + * the controller is configured with the widest row addressing available. | 73 | + * VFMA : fd = muladd( fd, fn, fm) |
315 | + * Then a pattern is written to RAM at an offset on the row boundary size. | 74 | + * VFMS : fd = muladd( fd, -fn, fm) |
316 | + * If the value read back equals the value read back from the | ||
317 | + * start of RAM, the bootloader knows the amount of row bits. | ||
318 | + * | 75 | + * |
319 | + * This function inserts a mirrored memory region when the configured row | 76 | + * These are fused multiply-add, and must be done as one floating |
320 | + * bits are not matching the actual emulated memory, to simulate the | 77 | + * point operation with no rounding between the multiplication and |
321 | + * same behavior on hardware as expected by the bootloader. | 78 | + * addition steps. NB that doing the negations here as separate |
79 | + * steps is correct : an input NaN should come out with its sign | ||
80 | + * bit flipped if it is a negated-input. | ||
322 | + */ | 81 | + */ |
323 | + uint8_t row_bits_actual = 0; | 82 | + TCGv_ptr fpst; |
83 | + TCGv_i32 vn, vm, vd; | ||
324 | + | 84 | + |
325 | + /* Calculate the actual row bits using the ram_size property */ | 85 | + /* |
326 | + for (uint8_t i = 8; i < 12; i++) { | 86 | + * Present in VFPv4 only, and only with the FP16 extension. |
327 | + if (1 << i == s->ram_size) { | 87 | + * Note that we can't rely on the SIMDFMAC check alone, because |
328 | + row_bits_actual = i + 3; | 88 | + * in a Neon-no-VFP core that ID register field will be non-zero. |
329 | + break; | 89 | + */ |
330 | + } | 90 | + if (!dc_isar_feature(aa32_fp16_arith, s) || |
91 | + !dc_isar_feature(aa32_simdfmac, s) || | ||
92 | + !dc_isar_feature(aa32_fpsp_v2, s)) { | ||
93 | + return false; | ||
331 | + } | 94 | + } |
332 | + | 95 | + |
333 | + if (s->ram_size == (1 << (row_bits - 3))) { | 96 | + if (s->vec_len != 0 || s->vec_stride != 0) { |
334 | + /* When row bits is the expected value, remove the mirror */ | 97 | + return false; |
335 | + memory_region_set_enabled(&s->row_mirror_alias, false); | 98 | + } |
336 | + trace_allwinner_h3_dramc_rowmirror_disable(); | ||
337 | + | 99 | + |
338 | + } else if (row_bits_actual) { | 100 | + if (!vfp_access_check(s)) { |
339 | + /* Row bits not matching ram_size, install the rows mirror */ | 101 | + return true; |
340 | + hwaddr row_mirror = s->ram_addr + ((1 << (row_bits_actual + | 102 | + } |
341 | + bank_bits)) * page_size); | ||
342 | + | 103 | + |
343 | + memory_region_set_enabled(&s->row_mirror_alias, true); | 104 | + vn = tcg_temp_new_i32(); |
344 | + memory_region_set_address(&s->row_mirror_alias, row_mirror); | 105 | + vm = tcg_temp_new_i32(); |
106 | + vd = tcg_temp_new_i32(); | ||
345 | + | 107 | + |
346 | + trace_allwinner_h3_dramc_rowmirror_enable(row_mirror); | 108 | + neon_load_reg32(vn, a->vn); |
109 | + neon_load_reg32(vm, a->vm); | ||
110 | + if (neg_n) { | ||
111 | + /* VFNMS, VFMS */ | ||
112 | + gen_helper_vfp_negh(vn, vn); | ||
347 | + } | 113 | + } |
114 | + neon_load_reg32(vd, a->vd); | ||
115 | + if (neg_d) { | ||
116 | + /* VFNMA, VFNMS */ | ||
117 | + gen_helper_vfp_negh(vd, vd); | ||
118 | + } | ||
119 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
120 | + gen_helper_vfp_muladdh(vd, vn, vm, vd, fpst); | ||
121 | + neon_store_reg32(vd, a->vd); | ||
122 | + | ||
123 | + tcg_temp_free_ptr(fpst); | ||
124 | + tcg_temp_free_i32(vn); | ||
125 | + tcg_temp_free_i32(vm); | ||
126 | + tcg_temp_free_i32(vd); | ||
127 | + | ||
128 | + return true; | ||
348 | +} | 129 | +} |
349 | + | 130 | + |
350 | +static uint64_t allwinner_h3_dramcom_read(void *opaque, hwaddr offset, | 131 | static bool do_vfm_sp(DisasContext *s, arg_VFMA_sp *a, bool neg_n, bool neg_d) |
351 | + unsigned size) | 132 | { |
352 | +{ | 133 | /* |
353 | + const AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | 134 | @@ -XXX,XX +XXX,XX @@ static bool do_vfm_dp(DisasContext *s, arg_VFMA_dp *a, bool neg_n, bool neg_d) |
354 | + const uint32_t idx = REG_INDEX(offset); | 135 | MAKE_ONE_VFM_TRANS_FN(VFNMA, PREC, false, true) \ |
355 | + | 136 | MAKE_ONE_VFM_TRANS_FN(VFNMS, PREC, true, true) |
356 | + if (idx >= AW_H3_DRAMCOM_REGS_NUM) { | 137 | |
357 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | 138 | +MAKE_VFM_TRANS_FNS(hp) |
358 | + __func__, (uint32_t)offset); | 139 | MAKE_VFM_TRANS_FNS(sp) |
359 | + return 0; | 140 | MAKE_VFM_TRANS_FNS(dp) |
360 | + } | 141 | |
361 | + | ||
362 | + trace_allwinner_h3_dramcom_read(offset, s->dramcom[idx], size); | ||
363 | + | ||
364 | + return s->dramcom[idx]; | ||
365 | +} | ||
366 | + | ||
367 | +static void allwinner_h3_dramcom_write(void *opaque, hwaddr offset, | ||
368 | + uint64_t val, unsigned size) | ||
369 | +{ | ||
370 | + AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | ||
371 | + const uint32_t idx = REG_INDEX(offset); | ||
372 | + | ||
373 | + trace_allwinner_h3_dramcom_write(offset, val, size); | ||
374 | + | ||
375 | + if (idx >= AW_H3_DRAMCOM_REGS_NUM) { | ||
376 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
377 | + __func__, (uint32_t)offset); | ||
378 | + return; | ||
379 | + } | ||
380 | + | ||
381 | + switch (offset) { | ||
382 | + case REG_DRAMCOM_CR: /* Control Register */ | ||
383 | + allwinner_h3_dramc_map_rows(s, ((val >> 4) & 0xf) + 1, | ||
384 | + ((val >> 2) & 0x1) + 2, | ||
385 | + 1 << (((val >> 8) & 0xf) + 3)); | ||
386 | + break; | ||
387 | + default: | ||
388 | + break; | ||
389 | + }; | ||
390 | + | ||
391 | + s->dramcom[idx] = (uint32_t) val; | ||
392 | +} | ||
393 | + | ||
394 | +static uint64_t allwinner_h3_dramctl_read(void *opaque, hwaddr offset, | ||
395 | + unsigned size) | ||
396 | +{ | ||
397 | + const AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | ||
398 | + const uint32_t idx = REG_INDEX(offset); | ||
399 | + | ||
400 | + if (idx >= AW_H3_DRAMCTL_REGS_NUM) { | ||
401 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
402 | + __func__, (uint32_t)offset); | ||
403 | + return 0; | ||
404 | + } | ||
405 | + | ||
406 | + trace_allwinner_h3_dramctl_read(offset, s->dramctl[idx], size); | ||
407 | + | ||
408 | + return s->dramctl[idx]; | ||
409 | +} | ||
410 | + | ||
411 | +static void allwinner_h3_dramctl_write(void *opaque, hwaddr offset, | ||
412 | + uint64_t val, unsigned size) | ||
413 | +{ | ||
414 | + AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | ||
415 | + const uint32_t idx = REG_INDEX(offset); | ||
416 | + | ||
417 | + trace_allwinner_h3_dramctl_write(offset, val, size); | ||
418 | + | ||
419 | + if (idx >= AW_H3_DRAMCTL_REGS_NUM) { | ||
420 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
421 | + __func__, (uint32_t)offset); | ||
422 | + return; | ||
423 | + } | ||
424 | + | ||
425 | + switch (offset) { | ||
426 | + case REG_DRAMCTL_PIR: /* PHY Initialization Register */ | ||
427 | + s->dramctl[REG_INDEX(REG_DRAMCTL_PGSR)] |= REG_DRAMCTL_PGSR_INITDONE; | ||
428 | + s->dramctl[REG_INDEX(REG_DRAMCTL_STATR)] |= REG_DRAMCTL_STATR_ACTIVE; | ||
429 | + break; | ||
430 | + default: | ||
431 | + break; | ||
432 | + } | ||
433 | + | ||
434 | + s->dramctl[idx] = (uint32_t) val; | ||
435 | +} | ||
436 | + | ||
437 | +static uint64_t allwinner_h3_dramphy_read(void *opaque, hwaddr offset, | ||
438 | + unsigned size) | ||
439 | +{ | ||
440 | + const AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | ||
441 | + const uint32_t idx = REG_INDEX(offset); | ||
442 | + | ||
443 | + if (idx >= AW_H3_DRAMPHY_REGS_NUM) { | ||
444 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
445 | + __func__, (uint32_t)offset); | ||
446 | + return 0; | ||
447 | + } | ||
448 | + | ||
449 | + trace_allwinner_h3_dramphy_read(offset, s->dramphy[idx], size); | ||
450 | + | ||
451 | + return s->dramphy[idx]; | ||
452 | +} | ||
453 | + | ||
454 | +static void allwinner_h3_dramphy_write(void *opaque, hwaddr offset, | ||
455 | + uint64_t val, unsigned size) | ||
456 | +{ | ||
457 | + AwH3DramCtlState *s = AW_H3_DRAMC(opaque); | ||
458 | + const uint32_t idx = REG_INDEX(offset); | ||
459 | + | ||
460 | + trace_allwinner_h3_dramphy_write(offset, val, size); | ||
461 | + | ||
462 | + if (idx >= AW_H3_DRAMPHY_REGS_NUM) { | ||
463 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
464 | + __func__, (uint32_t)offset); | ||
465 | + return; | ||
466 | + } | ||
467 | + | ||
468 | + s->dramphy[idx] = (uint32_t) val; | ||
469 | +} | ||
470 | + | ||
471 | +static const MemoryRegionOps allwinner_h3_dramcom_ops = { | ||
472 | + .read = allwinner_h3_dramcom_read, | ||
473 | + .write = allwinner_h3_dramcom_write, | ||
474 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
475 | + .valid = { | ||
476 | + .min_access_size = 4, | ||
477 | + .max_access_size = 4, | ||
478 | + }, | ||
479 | + .impl.min_access_size = 4, | ||
480 | +}; | ||
481 | + | ||
482 | +static const MemoryRegionOps allwinner_h3_dramctl_ops = { | ||
483 | + .read = allwinner_h3_dramctl_read, | ||
484 | + .write = allwinner_h3_dramctl_write, | ||
485 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
486 | + .valid = { | ||
487 | + .min_access_size = 4, | ||
488 | + .max_access_size = 4, | ||
489 | + }, | ||
490 | + .impl.min_access_size = 4, | ||
491 | +}; | ||
492 | + | ||
493 | +static const MemoryRegionOps allwinner_h3_dramphy_ops = { | ||
494 | + .read = allwinner_h3_dramphy_read, | ||
495 | + .write = allwinner_h3_dramphy_write, | ||
496 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
497 | + .valid = { | ||
498 | + .min_access_size = 4, | ||
499 | + .max_access_size = 4, | ||
500 | + }, | ||
501 | + .impl.min_access_size = 4, | ||
502 | +}; | ||
503 | + | ||
504 | +static void allwinner_h3_dramc_reset(DeviceState *dev) | ||
505 | +{ | ||
506 | + AwH3DramCtlState *s = AW_H3_DRAMC(dev); | ||
507 | + | ||
508 | + /* Set default values for registers */ | ||
509 | + memset(&s->dramcom, 0, sizeof(s->dramcom)); | ||
510 | + memset(&s->dramctl, 0, sizeof(s->dramctl)); | ||
511 | + memset(&s->dramphy, 0, sizeof(s->dramphy)); | ||
512 | +} | ||
513 | + | ||
514 | +static void allwinner_h3_dramc_realize(DeviceState *dev, Error **errp) | ||
515 | +{ | ||
516 | + AwH3DramCtlState *s = AW_H3_DRAMC(dev); | ||
517 | + | ||
518 | + /* Only power of 2 RAM sizes from 256MiB up to 2048MiB are supported */ | ||
519 | + for (uint8_t i = 8; i < 13; i++) { | ||
520 | + if (1 << i == s->ram_size) { | ||
521 | + break; | ||
522 | + } else if (i == 12) { | ||
523 | + error_report("%s: ram-size %u MiB is not supported", | ||
524 | + __func__, s->ram_size); | ||
525 | + exit(1); | ||
526 | + } | ||
527 | + } | ||
528 | + | ||
529 | + /* Setup row mirror mappings */ | ||
530 | + memory_region_init_ram(&s->row_mirror, OBJECT(s), | ||
531 | + "allwinner-h3-dramc.row-mirror", | ||
532 | + 4 * KiB, &error_abort); | ||
533 | + memory_region_add_subregion_overlap(get_system_memory(), s->ram_addr, | ||
534 | + &s->row_mirror, 10); | ||
535 | + | ||
536 | + memory_region_init_alias(&s->row_mirror_alias, OBJECT(s), | ||
537 | + "allwinner-h3-dramc.row-mirror-alias", | ||
538 | + &s->row_mirror, 0, 4 * KiB); | ||
539 | + memory_region_add_subregion_overlap(get_system_memory(), | ||
540 | + s->ram_addr + 1 * MiB, | ||
541 | + &s->row_mirror_alias, 10); | ||
542 | + memory_region_set_enabled(&s->row_mirror_alias, false); | ||
543 | +} | ||
544 | + | ||
545 | +static void allwinner_h3_dramc_init(Object *obj) | ||
546 | +{ | ||
547 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
548 | + AwH3DramCtlState *s = AW_H3_DRAMC(obj); | ||
549 | + | ||
550 | + /* DRAMCOM registers */ | ||
551 | + memory_region_init_io(&s->dramcom_iomem, OBJECT(s), | ||
552 | + &allwinner_h3_dramcom_ops, s, | ||
553 | + TYPE_AW_H3_DRAMC, 4 * KiB); | ||
554 | + sysbus_init_mmio(sbd, &s->dramcom_iomem); | ||
555 | + | ||
556 | + /* DRAMCTL registers */ | ||
557 | + memory_region_init_io(&s->dramctl_iomem, OBJECT(s), | ||
558 | + &allwinner_h3_dramctl_ops, s, | ||
559 | + TYPE_AW_H3_DRAMC, 4 * KiB); | ||
560 | + sysbus_init_mmio(sbd, &s->dramctl_iomem); | ||
561 | + | ||
562 | + /* DRAMPHY registers */ | ||
563 | + memory_region_init_io(&s->dramphy_iomem, OBJECT(s), | ||
564 | + &allwinner_h3_dramphy_ops, s, | ||
565 | + TYPE_AW_H3_DRAMC, 4 * KiB); | ||
566 | + sysbus_init_mmio(sbd, &s->dramphy_iomem); | ||
567 | +} | ||
568 | + | ||
569 | +static Property allwinner_h3_dramc_properties[] = { | ||
570 | + DEFINE_PROP_UINT64("ram-addr", AwH3DramCtlState, ram_addr, 0x0), | ||
571 | + DEFINE_PROP_UINT32("ram-size", AwH3DramCtlState, ram_size, 256 * MiB), | ||
572 | + DEFINE_PROP_END_OF_LIST() | ||
573 | +}; | ||
574 | + | ||
575 | +static const VMStateDescription allwinner_h3_dramc_vmstate = { | ||
576 | + .name = "allwinner-h3-dramc", | ||
577 | + .version_id = 1, | ||
578 | + .minimum_version_id = 1, | ||
579 | + .fields = (VMStateField[]) { | ||
580 | + VMSTATE_UINT32_ARRAY(dramcom, AwH3DramCtlState, AW_H3_DRAMCOM_REGS_NUM), | ||
581 | + VMSTATE_UINT32_ARRAY(dramctl, AwH3DramCtlState, AW_H3_DRAMCTL_REGS_NUM), | ||
582 | + VMSTATE_UINT32_ARRAY(dramphy, AwH3DramCtlState, AW_H3_DRAMPHY_REGS_NUM), | ||
583 | + VMSTATE_END_OF_LIST() | ||
584 | + } | ||
585 | +}; | ||
586 | + | ||
587 | +static void allwinner_h3_dramc_class_init(ObjectClass *klass, void *data) | ||
588 | +{ | ||
589 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
590 | + | ||
591 | + dc->reset = allwinner_h3_dramc_reset; | ||
592 | + dc->vmsd = &allwinner_h3_dramc_vmstate; | ||
593 | + dc->realize = allwinner_h3_dramc_realize; | ||
594 | + device_class_set_props(dc, allwinner_h3_dramc_properties); | ||
595 | +} | ||
596 | + | ||
597 | +static const TypeInfo allwinner_h3_dramc_info = { | ||
598 | + .name = TYPE_AW_H3_DRAMC, | ||
599 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
600 | + .instance_init = allwinner_h3_dramc_init, | ||
601 | + .instance_size = sizeof(AwH3DramCtlState), | ||
602 | + .class_init = allwinner_h3_dramc_class_init, | ||
603 | +}; | ||
604 | + | ||
605 | +static void allwinner_h3_dramc_register(void) | ||
606 | +{ | ||
607 | + type_register_static(&allwinner_h3_dramc_info); | ||
608 | +} | ||
609 | + | ||
610 | +type_init(allwinner_h3_dramc_register) | ||
611 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events | ||
612 | index XXXXXXX..XXXXXXX 100644 | ||
613 | --- a/hw/misc/trace-events | ||
614 | +++ b/hw/misc/trace-events | ||
615 | @@ -XXX,XX +XXX,XX @@ allwinner_cpucfg_cpu_reset(uint8_t cpu_id, uint32_t reset_addr) "id %u, reset_ad | ||
616 | allwinner_cpucfg_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
617 | allwinner_cpucfg_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
618 | |||
619 | +# allwinner-h3-dramc.c | ||
620 | +allwinner_h3_dramc_rowmirror_disable(void) "Disable row mirror" | ||
621 | +allwinner_h3_dramc_rowmirror_enable(uint64_t addr) "Enable row mirror: addr 0x%" PRIx64 | ||
622 | +allwinner_h3_dramcom_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
623 | +allwinner_h3_dramcom_write(uint64_t offset, uint64_t data, unsigned size) "Write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
624 | +allwinner_h3_dramctl_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
625 | +allwinner_h3_dramctl_write(uint64_t offset, uint64_t data, unsigned size) "Write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
626 | +allwinner_h3_dramphy_read(uint64_t offset, uint64_t data, unsigned size) "Read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
627 | +allwinner_h3_dramphy_write(uint64_t offset, uint64_t data, unsigned size) "write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
628 | + | ||
629 | # allwinner-sid.c | ||
630 | allwinner_sid_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
631 | allwinner_sid_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
632 | -- | 142 | -- |
633 | 2.20.1 | 143 | 2.20.1 |
634 | 144 | ||
635 | 145 | diff view generated by jsdifflib |
1 | From: Cédric Le Goater <clg@kaod.org> | 1 | Macroify the uses of do_vfp_2op_sp() and do_vfp_2op_dp(); this will |
---|---|---|---|
2 | make it easier to add the halfprec support. | ||
2 | 3 | ||
3 | The Aspeed SMC Controller can operate in different modes : Read, Fast | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Read, Write and User modes. When the User mode is configured, it | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | selects automatically the SPI slave device until the CE_STOP_ACTIVE | 6 | Message-id: 20200828183354.27913-8-peter.maydell@linaro.org |
6 | bit is set to 1. When any other modes are configured the device is | 7 | --- |
7 | unselected. The HW logic handles the chip select automatically when | 8 | target/arm/translate-vfp.c.inc | 49 ++++++++++------------------------ |
8 | the flash is accessed through its AHB window. | 9 | 1 file changed, 14 insertions(+), 35 deletions(-) |
9 | 10 | ||
10 | When configuring the CEx Control Register, the User mode logic to | 11 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
11 | select and unselect the slave is incorrect and data corruption can be | ||
12 | seen on machines using two chips, witherspoon and romulus. | ||
13 | |||
14 | Rework the handler setting the CEx Control Register to fix this issue. | ||
15 | |||
16 | Fixes: 7c1c69bca43c ("ast2400: add SMC controllers (FMC and SPI)") | ||
17 | Signed-off-by: Cédric Le Goater <clg@kaod.org> | ||
18 | Reviewed-by: Andrew Jeffery <andrew@aj.id.au> | ||
19 | Message-id: 20200206112645.21275-3-clg@kaod.org | ||
20 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
21 | --- | ||
22 | hw/ssi/aspeed_smc.c | 39 +++++++++++++++++++++++---------------- | ||
23 | hw/ssi/trace-events | 1 + | ||
24 | 2 files changed, 24 insertions(+), 16 deletions(-) | ||
25 | |||
26 | diff --git a/hw/ssi/aspeed_smc.c b/hw/ssi/aspeed_smc.c | ||
27 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
28 | --- a/hw/ssi/aspeed_smc.c | 13 | --- a/target/arm/translate-vfp.c.inc |
29 | +++ b/hw/ssi/aspeed_smc.c | 14 | +++ b/target/arm/translate-vfp.c.inc |
30 | @@ -XXX,XX +XXX,XX @@ static inline int aspeed_smc_flash_is_4byte(const AspeedSMCFlash *fl) | 15 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMOV_imm_dp(DisasContext *s, arg_VMOV_imm_dp *a) |
31 | } | 16 | return true; |
32 | } | 17 | } |
33 | 18 | ||
34 | -static inline bool aspeed_smc_is_ce_stop_active(const AspeedSMCFlash *fl) | 19 | -static bool trans_VMOV_reg_sp(DisasContext *s, arg_VMOV_reg_sp *a) |
35 | +static void aspeed_smc_flash_do_select(AspeedSMCFlash *fl, bool unselect) | 20 | -{ |
21 | - return do_vfp_2op_sp(s, tcg_gen_mov_i32, a->vd, a->vm); | ||
22 | -} | ||
23 | +#define DO_VFP_2OP(INSN, PREC, FN) \ | ||
24 | + static bool trans_##INSN##_##PREC(DisasContext *s, \ | ||
25 | + arg_##INSN##_##PREC *a) \ | ||
26 | + { \ | ||
27 | + return do_vfp_2op_##PREC(s, FN, a->vd, a->vm); \ | ||
28 | + } | ||
29 | |||
30 | -static bool trans_VMOV_reg_dp(DisasContext *s, arg_VMOV_reg_dp *a) | ||
31 | -{ | ||
32 | - return do_vfp_2op_dp(s, tcg_gen_mov_i64, a->vd, a->vm); | ||
33 | -} | ||
34 | +DO_VFP_2OP(VMOV_reg, sp, tcg_gen_mov_i32) | ||
35 | +DO_VFP_2OP(VMOV_reg, dp, tcg_gen_mov_i64) | ||
36 | |||
37 | -static bool trans_VABS_sp(DisasContext *s, arg_VABS_sp *a) | ||
38 | -{ | ||
39 | - return do_vfp_2op_sp(s, gen_helper_vfp_abss, a->vd, a->vm); | ||
40 | -} | ||
41 | +DO_VFP_2OP(VABS, sp, gen_helper_vfp_abss) | ||
42 | +DO_VFP_2OP(VABS, dp, gen_helper_vfp_absd) | ||
43 | |||
44 | -static bool trans_VABS_dp(DisasContext *s, arg_VABS_dp *a) | ||
45 | -{ | ||
46 | - return do_vfp_2op_dp(s, gen_helper_vfp_absd, a->vd, a->vm); | ||
47 | -} | ||
48 | - | ||
49 | -static bool trans_VNEG_sp(DisasContext *s, arg_VNEG_sp *a) | ||
50 | -{ | ||
51 | - return do_vfp_2op_sp(s, gen_helper_vfp_negs, a->vd, a->vm); | ||
52 | -} | ||
53 | - | ||
54 | -static bool trans_VNEG_dp(DisasContext *s, arg_VNEG_dp *a) | ||
55 | -{ | ||
56 | - return do_vfp_2op_dp(s, gen_helper_vfp_negd, a->vd, a->vm); | ||
57 | -} | ||
58 | +DO_VFP_2OP(VNEG, sp, gen_helper_vfp_negs) | ||
59 | +DO_VFP_2OP(VNEG, dp, gen_helper_vfp_negd) | ||
60 | |||
61 | static void gen_VSQRT_sp(TCGv_i32 vd, TCGv_i32 vm) | ||
36 | { | 62 | { |
37 | - const AspeedSMCState *s = fl->controller; | 63 | gen_helper_vfp_sqrts(vd, vm, cpu_env); |
38 | + AspeedSMCState *s = fl->controller; | ||
39 | |||
40 | - return s->regs[s->r_ctrl0 + fl->id] & CTRL_CE_STOP_ACTIVE; | ||
41 | + trace_aspeed_smc_flash_select(fl->id, unselect ? "un" : ""); | ||
42 | + | ||
43 | + qemu_set_irq(s->cs_lines[fl->id], unselect); | ||
44 | } | 64 | } |
45 | 65 | ||
46 | static void aspeed_smc_flash_select(AspeedSMCFlash *fl) | 66 | -static bool trans_VSQRT_sp(DisasContext *s, arg_VSQRT_sp *a) |
67 | -{ | ||
68 | - return do_vfp_2op_sp(s, gen_VSQRT_sp, a->vd, a->vm); | ||
69 | -} | ||
70 | - | ||
71 | static void gen_VSQRT_dp(TCGv_i64 vd, TCGv_i64 vm) | ||
47 | { | 72 | { |
48 | - AspeedSMCState *s = fl->controller; | 73 | gen_helper_vfp_sqrtd(vd, vm, cpu_env); |
49 | - | ||
50 | - s->regs[s->r_ctrl0 + fl->id] &= ~CTRL_CE_STOP_ACTIVE; | ||
51 | - qemu_set_irq(s->cs_lines[fl->id], aspeed_smc_is_ce_stop_active(fl)); | ||
52 | + aspeed_smc_flash_do_select(fl, false); | ||
53 | } | 74 | } |
54 | 75 | ||
55 | static void aspeed_smc_flash_unselect(AspeedSMCFlash *fl) | 76 | -static bool trans_VSQRT_dp(DisasContext *s, arg_VSQRT_dp *a) |
77 | -{ | ||
78 | - return do_vfp_2op_dp(s, gen_VSQRT_dp, a->vd, a->vm); | ||
79 | -} | ||
80 | +DO_VFP_2OP(VSQRT, sp, gen_VSQRT_sp) | ||
81 | +DO_VFP_2OP(VSQRT, dp, gen_VSQRT_dp) | ||
82 | |||
83 | static bool trans_VCMP_sp(DisasContext *s, arg_VCMP_sp *a) | ||
56 | { | 84 | { |
57 | - AspeedSMCState *s = fl->controller; | ||
58 | - | ||
59 | - s->regs[s->r_ctrl0 + fl->id] |= CTRL_CE_STOP_ACTIVE; | ||
60 | - qemu_set_irq(s->cs_lines[fl->id], aspeed_smc_is_ce_stop_active(fl)); | ||
61 | + aspeed_smc_flash_do_select(fl, true); | ||
62 | } | ||
63 | |||
64 | static uint32_t aspeed_smc_check_segment_addr(const AspeedSMCFlash *fl, | ||
65 | @@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps aspeed_smc_flash_ops = { | ||
66 | }, | ||
67 | }; | ||
68 | |||
69 | -static void aspeed_smc_flash_update_cs(AspeedSMCFlash *fl) | ||
70 | +static void aspeed_smc_flash_update_ctrl(AspeedSMCFlash *fl, uint32_t value) | ||
71 | { | ||
72 | AspeedSMCState *s = fl->controller; | ||
73 | + bool unselect; | ||
74 | |||
75 | - s->snoop_index = aspeed_smc_is_ce_stop_active(fl) ? SNOOP_OFF : SNOOP_START; | ||
76 | + /* User mode selects the CS, other modes unselect */ | ||
77 | + unselect = (value & CTRL_CMD_MODE_MASK) != CTRL_USERMODE; | ||
78 | |||
79 | - qemu_set_irq(s->cs_lines[fl->id], aspeed_smc_is_ce_stop_active(fl)); | ||
80 | + /* A change of CTRL_CE_STOP_ACTIVE from 0 to 1, unselects the CS */ | ||
81 | + if (!(s->regs[s->r_ctrl0 + fl->id] & CTRL_CE_STOP_ACTIVE) && | ||
82 | + value & CTRL_CE_STOP_ACTIVE) { | ||
83 | + unselect = true; | ||
84 | + } | ||
85 | + | ||
86 | + s->regs[s->r_ctrl0 + fl->id] = value; | ||
87 | + | ||
88 | + s->snoop_index = unselect ? SNOOP_OFF : SNOOP_START; | ||
89 | + | ||
90 | + aspeed_smc_flash_do_select(fl, unselect); | ||
91 | } | ||
92 | |||
93 | static void aspeed_smc_reset(DeviceState *d) | ||
94 | @@ -XXX,XX +XXX,XX @@ static void aspeed_smc_write(void *opaque, hwaddr addr, uint64_t data, | ||
95 | s->regs[addr] = value; | ||
96 | } else if (addr >= s->r_ctrl0 && addr < s->r_ctrl0 + s->num_cs) { | ||
97 | int cs = addr - s->r_ctrl0; | ||
98 | - s->regs[addr] = value; | ||
99 | - aspeed_smc_flash_update_cs(&s->flashes[cs]); | ||
100 | + aspeed_smc_flash_update_ctrl(&s->flashes[cs], value); | ||
101 | } else if (addr >= R_SEG_ADDR0 && | ||
102 | addr < R_SEG_ADDR0 + s->ctrl->max_slaves) { | ||
103 | int cs = addr - R_SEG_ADDR0; | ||
104 | diff --git a/hw/ssi/trace-events b/hw/ssi/trace-events | ||
105 | index XXXXXXX..XXXXXXX 100644 | ||
106 | --- a/hw/ssi/trace-events | ||
107 | +++ b/hw/ssi/trace-events | ||
108 | @@ -XXX,XX +XXX,XX @@ aspeed_smc_flash_write(int cs, uint64_t addr, uint32_t size, uint64_t data, int | ||
109 | aspeed_smc_read(uint64_t addr, uint32_t size, uint64_t data) "@0x%" PRIx64 " size %u: 0x%" PRIx64 | ||
110 | aspeed_smc_dma_checksum(uint32_t addr, uint32_t data) "0x%08x: 0x%08x" | ||
111 | aspeed_smc_write(uint64_t addr, uint32_t size, uint64_t data) "@0x%" PRIx64 " size %u: 0x%" PRIx64 | ||
112 | +aspeed_smc_flash_select(int cs, const char *prefix) "CS%d %sselect" | ||
113 | -- | 85 | -- |
114 | 2.20.1 | 86 | 2.20.1 |
115 | 87 | ||
116 | 88 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement VFP fp16 for VABS, VNEG and VSQRT. This is all |
---|---|---|---|
2 | the fp16 insns that use the DO_VFP_2OP macro, because there | ||
3 | is no fp16 version of VMOV_reg. | ||
2 | 4 | ||
3 | The Allwinner Sun8i System on Chip family includes an Ethernet MAC (EMAC) | 5 | Notes: |
4 | which provides 10M/100M/1000M Ethernet connectivity. This commit | 6 | * the gen_helper_vfp_negh already exists as we needed to create |
5 | adds support for the Allwinner EMAC from the Sun8i family (H2+, H3, A33, etc), | 7 | it for the fp16 multiply-add insns |
6 | including emulation for the following functionality: | 8 | * as usual we need to use the f16 version of the fp_status; |
9 | this is only relevant for VSQRT | ||
7 | 10 | ||
8 | * DMA transfers | 11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | * MII interface | 12 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
10 | * Transmit CRC calculation | 13 | Message-id: 20200828183354.27913-9-peter.maydell@linaro.org |
14 | --- | ||
15 | target/arm/helper.h | 2 ++ | ||
16 | target/arm/vfp.decode | 3 +++ | ||
17 | target/arm/vfp_helper.c | 10 +++++++++ | ||
18 | target/arm/translate-vfp.c.inc | 40 ++++++++++++++++++++++++++++++++++ | ||
19 | 4 files changed, 55 insertions(+) | ||
11 | 20 | ||
12 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 21 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
13 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
14 | Message-id: 20200311221854.30370-10-nieklinnenbank@gmail.com | ||
15 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
16 | --- | ||
17 | hw/net/Makefile.objs | 1 + | ||
18 | include/hw/arm/allwinner-h3.h | 3 + | ||
19 | include/hw/net/allwinner-sun8i-emac.h | 99 +++ | ||
20 | hw/arm/allwinner-h3.c | 16 +- | ||
21 | hw/arm/orangepi.c | 3 + | ||
22 | hw/net/allwinner-sun8i-emac.c | 871 ++++++++++++++++++++++++++ | ||
23 | hw/arm/Kconfig | 1 + | ||
24 | hw/net/Kconfig | 3 + | ||
25 | hw/net/trace-events | 10 + | ||
26 | 9 files changed, 1006 insertions(+), 1 deletion(-) | ||
27 | create mode 100644 include/hw/net/allwinner-sun8i-emac.h | ||
28 | create mode 100644 hw/net/allwinner-sun8i-emac.c | ||
29 | |||
30 | diff --git a/hw/net/Makefile.objs b/hw/net/Makefile.objs | ||
31 | index XXXXXXX..XXXXXXX 100644 | 22 | index XXXXXXX..XXXXXXX 100644 |
32 | --- a/hw/net/Makefile.objs | 23 | --- a/target/arm/helper.h |
33 | +++ b/hw/net/Makefile.objs | 24 | +++ b/target/arm/helper.h |
34 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_XGMAC) += xgmac.o | 25 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_minnumd, f64, f64, f64, ptr) |
35 | common-obj-$(CONFIG_MIPSNET) += mipsnet.o | 26 | DEF_HELPER_1(vfp_negh, f16, f16) |
36 | common-obj-$(CONFIG_XILINX_AXI) += xilinx_axienet.o | 27 | DEF_HELPER_1(vfp_negs, f32, f32) |
37 | common-obj-$(CONFIG_ALLWINNER_EMAC) += allwinner_emac.o | 28 | DEF_HELPER_1(vfp_negd, f64, f64) |
38 | +common-obj-$(CONFIG_ALLWINNER_SUN8I_EMAC) += allwinner-sun8i-emac.o | 29 | +DEF_HELPER_1(vfp_absh, f16, f16) |
39 | common-obj-$(CONFIG_IMX_FEC) += imx_fec.o | 30 | DEF_HELPER_1(vfp_abss, f32, f32) |
40 | 31 | DEF_HELPER_1(vfp_absd, f64, f64) | |
41 | common-obj-$(CONFIG_CADENCE) += cadence_gem.o | 32 | +DEF_HELPER_2(vfp_sqrth, f16, f16, env) |
42 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 33 | DEF_HELPER_2(vfp_sqrts, f32, f32, env) |
34 | DEF_HELPER_2(vfp_sqrtd, f64, f64, env) | ||
35 | DEF_HELPER_3(vfp_cmps, void, f32, f32, env) | ||
36 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
43 | index XXXXXXX..XXXXXXX 100644 | 37 | index XXXXXXX..XXXXXXX 100644 |
44 | --- a/include/hw/arm/allwinner-h3.h | 38 | --- a/target/arm/vfp.decode |
45 | +++ b/include/hw/arm/allwinner-h3.h | 39 | +++ b/target/arm/vfp.decode |
46 | @@ -XXX,XX +XXX,XX @@ | 40 | @@ -XXX,XX +XXX,XX @@ VMOV_imm_dp ---- 1110 1.11 .... .... 1011 0000 .... \ |
47 | #include "hw/misc/allwinner-h3-sysctrl.h" | 41 | VMOV_reg_sp ---- 1110 1.11 0000 .... 1010 01.0 .... @vfp_dm_ss |
48 | #include "hw/misc/allwinner-sid.h" | 42 | VMOV_reg_dp ---- 1110 1.11 0000 .... 1011 01.0 .... @vfp_dm_dd |
49 | #include "hw/sd/allwinner-sdhost.h" | 43 | |
50 | +#include "hw/net/allwinner-sun8i-emac.h" | 44 | +VABS_hp ---- 1110 1.11 0000 .... 1001 11.0 .... @vfp_dm_ss |
51 | #include "target/arm/cpu.h" | 45 | VABS_sp ---- 1110 1.11 0000 .... 1010 11.0 .... @vfp_dm_ss |
52 | 46 | VABS_dp ---- 1110 1.11 0000 .... 1011 11.0 .... @vfp_dm_dd | |
53 | /** | 47 | |
54 | @@ -XXX,XX +XXX,XX @@ enum { | 48 | +VNEG_hp ---- 1110 1.11 0001 .... 1001 01.0 .... @vfp_dm_ss |
55 | AW_H3_UART1, | 49 | VNEG_sp ---- 1110 1.11 0001 .... 1010 01.0 .... @vfp_dm_ss |
56 | AW_H3_UART2, | 50 | VNEG_dp ---- 1110 1.11 0001 .... 1011 01.0 .... @vfp_dm_dd |
57 | AW_H3_UART3, | 51 | |
58 | + AW_H3_EMAC, | 52 | +VSQRT_hp ---- 1110 1.11 0001 .... 1001 11.0 .... @vfp_dm_ss |
59 | AW_H3_GIC_DIST, | 53 | VSQRT_sp ---- 1110 1.11 0001 .... 1010 11.0 .... @vfp_dm_ss |
60 | AW_H3_GIC_CPU, | 54 | VSQRT_dp ---- 1110 1.11 0001 .... 1011 11.0 .... @vfp_dm_dd |
61 | AW_H3_GIC_HYP, | 55 | |
62 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | 56 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c |
63 | AwH3SysCtrlState sysctrl; | ||
64 | AwSidState sid; | ||
65 | AwSdHostState mmc0; | ||
66 | + AwSun8iEmacState emac; | ||
67 | GICState gic; | ||
68 | MemoryRegion sram_a1; | ||
69 | MemoryRegion sram_a2; | ||
70 | diff --git a/include/hw/net/allwinner-sun8i-emac.h b/include/hw/net/allwinner-sun8i-emac.h | ||
71 | new file mode 100644 | ||
72 | index XXXXXXX..XXXXXXX | ||
73 | --- /dev/null | ||
74 | +++ b/include/hw/net/allwinner-sun8i-emac.h | ||
75 | @@ -XXX,XX +XXX,XX @@ | ||
76 | +/* | ||
77 | + * Allwinner Sun8i Ethernet MAC emulation | ||
78 | + * | ||
79 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
80 | + * | ||
81 | + * This program is free software: you can redistribute it and/or modify | ||
82 | + * it under the terms of the GNU General Public License as published by | ||
83 | + * the Free Software Foundation, either version 2 of the License, or | ||
84 | + * (at your option) any later version. | ||
85 | + * | ||
86 | + * This program is distributed in the hope that it will be useful, | ||
87 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
88 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
89 | + * GNU General Public License for more details. | ||
90 | + * | ||
91 | + * You should have received a copy of the GNU General Public License | ||
92 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
93 | + */ | ||
94 | + | ||
95 | +#ifndef HW_NET_ALLWINNER_SUN8I_EMAC_H | ||
96 | +#define HW_NET_ALLWINNER_SUN8I_EMAC_H | ||
97 | + | ||
98 | +#include "qom/object.h" | ||
99 | +#include "net/net.h" | ||
100 | +#include "hw/sysbus.h" | ||
101 | + | ||
102 | +/** | ||
103 | + * Object model | ||
104 | + * @{ | ||
105 | + */ | ||
106 | + | ||
107 | +#define TYPE_AW_SUN8I_EMAC "allwinner-sun8i-emac" | ||
108 | +#define AW_SUN8I_EMAC(obj) \ | ||
109 | + OBJECT_CHECK(AwSun8iEmacState, (obj), TYPE_AW_SUN8I_EMAC) | ||
110 | + | ||
111 | +/** @} */ | ||
112 | + | ||
113 | +/** | ||
114 | + * Allwinner Sun8i EMAC object instance state | ||
115 | + */ | ||
116 | +typedef struct AwSun8iEmacState { | ||
117 | + /*< private >*/ | ||
118 | + SysBusDevice parent_obj; | ||
119 | + /*< public >*/ | ||
120 | + | ||
121 | + /** Maps I/O registers in physical memory */ | ||
122 | + MemoryRegion iomem; | ||
123 | + | ||
124 | + /** Interrupt output signal to notify CPU */ | ||
125 | + qemu_irq irq; | ||
126 | + | ||
127 | + /** Generic Network Interface Controller (NIC) for networking API */ | ||
128 | + NICState *nic; | ||
129 | + | ||
130 | + /** Generic Network Interface Controller (NIC) configuration */ | ||
131 | + NICConf conf; | ||
132 | + | ||
133 | + /** | ||
134 | + * @name Media Independent Interface (MII) | ||
135 | + * @{ | ||
136 | + */ | ||
137 | + | ||
138 | + uint8_t mii_phy_addr; /**< PHY address */ | ||
139 | + uint32_t mii_cr; /**< Control */ | ||
140 | + uint32_t mii_st; /**< Status */ | ||
141 | + uint32_t mii_adv; /**< Advertised Abilities */ | ||
142 | + | ||
143 | + /** @} */ | ||
144 | + | ||
145 | + /** | ||
146 | + * @name Hardware Registers | ||
147 | + * @{ | ||
148 | + */ | ||
149 | + | ||
150 | + uint32_t basic_ctl0; /**< Basic Control 0 */ | ||
151 | + uint32_t basic_ctl1; /**< Basic Control 1 */ | ||
152 | + uint32_t int_en; /**< Interrupt Enable */ | ||
153 | + uint32_t int_sta; /**< Interrupt Status */ | ||
154 | + uint32_t frm_flt; /**< Receive Frame Filter */ | ||
155 | + | ||
156 | + uint32_t rx_ctl0; /**< Receive Control 0 */ | ||
157 | + uint32_t rx_ctl1; /**< Receive Control 1 */ | ||
158 | + uint32_t rx_desc_head; /**< Receive Descriptor List Address */ | ||
159 | + uint32_t rx_desc_curr; /**< Current Receive Descriptor Address */ | ||
160 | + | ||
161 | + uint32_t tx_ctl0; /**< Transmit Control 0 */ | ||
162 | + uint32_t tx_ctl1; /**< Transmit Control 1 */ | ||
163 | + uint32_t tx_desc_head; /**< Transmit Descriptor List Address */ | ||
164 | + uint32_t tx_desc_curr; /**< Current Transmit Descriptor Address */ | ||
165 | + uint32_t tx_flowctl; /**< Transmit Flow Control */ | ||
166 | + | ||
167 | + uint32_t mii_cmd; /**< Management Interface Command */ | ||
168 | + uint32_t mii_data; /**< Management Interface Data */ | ||
169 | + | ||
170 | + /** @} */ | ||
171 | + | ||
172 | +} AwSun8iEmacState; | ||
173 | + | ||
174 | +#endif /* HW_NET_ALLWINNER_SUN8I_H */ | ||
175 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
176 | index XXXXXXX..XXXXXXX 100644 | 57 | index XXXXXXX..XXXXXXX 100644 |
177 | --- a/hw/arm/allwinner-h3.c | 58 | --- a/target/arm/vfp_helper.c |
178 | +++ b/hw/arm/allwinner-h3.c | 59 | +++ b/target/arm/vfp_helper.c |
179 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | 60 | @@ -XXX,XX +XXX,XX @@ float64 VFP_HELPER(neg, d)(float64 a) |
180 | [AW_H3_UART1] = 0x01c28400, | 61 | return float64_chs(a); |
181 | [AW_H3_UART2] = 0x01c28800, | ||
182 | [AW_H3_UART3] = 0x01c28c00, | ||
183 | + [AW_H3_EMAC] = 0x01c30000, | ||
184 | [AW_H3_GIC_DIST] = 0x01c81000, | ||
185 | [AW_H3_GIC_CPU] = 0x01c82000, | ||
186 | [AW_H3_GIC_HYP] = 0x01c84000, | ||
187 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
188 | { "twi1", 0x01c2b000, 1 * KiB }, | ||
189 | { "twi2", 0x01c2b400, 1 * KiB }, | ||
190 | { "scr", 0x01c2c400, 1 * KiB }, | ||
191 | - { "emac", 0x01c30000, 64 * KiB }, | ||
192 | { "gpu", 0x01c40000, 64 * KiB }, | ||
193 | { "hstmr", 0x01c60000, 4 * KiB }, | ||
194 | { "dramcom", 0x01c62000, 4 * KiB }, | ||
195 | @@ -XXX,XX +XXX,XX @@ enum { | ||
196 | AW_H3_GIC_SPI_OHCI2 = 77, | ||
197 | AW_H3_GIC_SPI_EHCI3 = 78, | ||
198 | AW_H3_GIC_SPI_OHCI3 = 79, | ||
199 | + AW_H3_GIC_SPI_EMAC = 82 | ||
200 | }; | ||
201 | |||
202 | /* Allwinner H3 general constants */ | ||
203 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
204 | |||
205 | sysbus_init_child_obj(obj, "mmc0", &s->mmc0, sizeof(s->mmc0), | ||
206 | TYPE_AW_SDHOST_SUN5I); | ||
207 | + | ||
208 | + sysbus_init_child_obj(obj, "emac", &s->emac, sizeof(s->emac), | ||
209 | + TYPE_AW_SUN8I_EMAC); | ||
210 | } | 62 | } |
211 | 63 | ||
212 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | 64 | +dh_ctype_f16 VFP_HELPER(abs, h)(dh_ctype_f16 a) |
213 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
214 | object_property_add_alias(OBJECT(s), "sd-bus", OBJECT(&s->mmc0), | ||
215 | "sd-bus", &error_abort); | ||
216 | |||
217 | + /* EMAC */ | ||
218 | + if (nd_table[0].used) { | ||
219 | + qemu_check_nic_model(&nd_table[0], TYPE_AW_SUN8I_EMAC); | ||
220 | + qdev_set_nic_properties(DEVICE(&s->emac), &nd_table[0]); | ||
221 | + } | ||
222 | + qdev_init_nofail(DEVICE(&s->emac)); | ||
223 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->emac), 0, s->memmap[AW_H3_EMAC]); | ||
224 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->emac), 0, | ||
225 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_EMAC)); | ||
226 | + | ||
227 | /* Universal Serial Bus */ | ||
228 | sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
229 | qdev_get_gpio_in(DEVICE(&s->gic), | ||
230 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | ||
231 | index XXXXXXX..XXXXXXX 100644 | ||
232 | --- a/hw/arm/orangepi.c | ||
233 | +++ b/hw/arm/orangepi.c | ||
234 | @@ -XXX,XX +XXX,XX @@ static void orangepi_init(MachineState *machine) | ||
235 | warn_report("Security Identifier value does not include H3 prefix"); | ||
236 | } | ||
237 | |||
238 | + /* Setup EMAC properties */ | ||
239 | + object_property_set_int(OBJECT(&h3->emac), 1, "phy-addr", &error_abort); | ||
240 | + | ||
241 | /* Mark H3 object realized */ | ||
242 | object_property_set_bool(OBJECT(h3), true, "realized", &error_abort); | ||
243 | |||
244 | diff --git a/hw/net/allwinner-sun8i-emac.c b/hw/net/allwinner-sun8i-emac.c | ||
245 | new file mode 100644 | ||
246 | index XXXXXXX..XXXXXXX | ||
247 | --- /dev/null | ||
248 | +++ b/hw/net/allwinner-sun8i-emac.c | ||
249 | @@ -XXX,XX +XXX,XX @@ | ||
250 | +/* | ||
251 | + * Allwinner Sun8i Ethernet MAC emulation | ||
252 | + * | ||
253 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
254 | + * | ||
255 | + * This program is free software: you can redistribute it and/or modify | ||
256 | + * it under the terms of the GNU General Public License as published by | ||
257 | + * the Free Software Foundation, either version 2 of the License, or | ||
258 | + * (at your option) any later version. | ||
259 | + * | ||
260 | + * This program is distributed in the hope that it will be useful, | ||
261 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
262 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
263 | + * GNU General Public License for more details. | ||
264 | + * | ||
265 | + * You should have received a copy of the GNU General Public License | ||
266 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
267 | + */ | ||
268 | + | ||
269 | +#include "qemu/osdep.h" | ||
270 | +#include "qemu/units.h" | ||
271 | +#include "hw/sysbus.h" | ||
272 | +#include "migration/vmstate.h" | ||
273 | +#include "net/net.h" | ||
274 | +#include "hw/irq.h" | ||
275 | +#include "hw/qdev-properties.h" | ||
276 | +#include "qemu/log.h" | ||
277 | +#include "trace.h" | ||
278 | +#include "net/checksum.h" | ||
279 | +#include "qemu/module.h" | ||
280 | +#include "exec/cpu-common.h" | ||
281 | +#include "hw/net/allwinner-sun8i-emac.h" | ||
282 | + | ||
283 | +/* EMAC register offsets */ | ||
284 | +enum { | ||
285 | + REG_BASIC_CTL_0 = 0x0000, /* Basic Control 0 */ | ||
286 | + REG_BASIC_CTL_1 = 0x0004, /* Basic Control 1 */ | ||
287 | + REG_INT_STA = 0x0008, /* Interrupt Status */ | ||
288 | + REG_INT_EN = 0x000C, /* Interrupt Enable */ | ||
289 | + REG_TX_CTL_0 = 0x0010, /* Transmit Control 0 */ | ||
290 | + REG_TX_CTL_1 = 0x0014, /* Transmit Control 1 */ | ||
291 | + REG_TX_FLOW_CTL = 0x001C, /* Transmit Flow Control */ | ||
292 | + REG_TX_DMA_DESC_LIST = 0x0020, /* Transmit Descriptor List Address */ | ||
293 | + REG_RX_CTL_0 = 0x0024, /* Receive Control 0 */ | ||
294 | + REG_RX_CTL_1 = 0x0028, /* Receive Control 1 */ | ||
295 | + REG_RX_DMA_DESC_LIST = 0x0034, /* Receive Descriptor List Address */ | ||
296 | + REG_FRM_FLT = 0x0038, /* Receive Frame Filter */ | ||
297 | + REG_RX_HASH_0 = 0x0040, /* Receive Hash Table 0 */ | ||
298 | + REG_RX_HASH_1 = 0x0044, /* Receive Hash Table 1 */ | ||
299 | + REG_MII_CMD = 0x0048, /* Management Interface Command */ | ||
300 | + REG_MII_DATA = 0x004C, /* Management Interface Data */ | ||
301 | + REG_ADDR_HIGH = 0x0050, /* MAC Address High */ | ||
302 | + REG_ADDR_LOW = 0x0054, /* MAC Address Low */ | ||
303 | + REG_TX_DMA_STA = 0x00B0, /* Transmit DMA Status */ | ||
304 | + REG_TX_CUR_DESC = 0x00B4, /* Transmit Current Descriptor */ | ||
305 | + REG_TX_CUR_BUF = 0x00B8, /* Transmit Current Buffer */ | ||
306 | + REG_RX_DMA_STA = 0x00C0, /* Receive DMA Status */ | ||
307 | + REG_RX_CUR_DESC = 0x00C4, /* Receive Current Descriptor */ | ||
308 | + REG_RX_CUR_BUF = 0x00C8, /* Receive Current Buffer */ | ||
309 | + REG_RGMII_STA = 0x00D0, /* RGMII Status */ | ||
310 | +}; | ||
311 | + | ||
312 | +/* EMAC register flags */ | ||
313 | +enum { | ||
314 | + BASIC_CTL0_100Mbps = (0b11 << 2), | ||
315 | + BASIC_CTL0_FD = (1 << 0), | ||
316 | + BASIC_CTL1_SOFTRST = (1 << 0), | ||
317 | +}; | ||
318 | + | ||
319 | +enum { | ||
320 | + INT_STA_RGMII_LINK = (1 << 16), | ||
321 | + INT_STA_RX_EARLY = (1 << 13), | ||
322 | + INT_STA_RX_OVERFLOW = (1 << 12), | ||
323 | + INT_STA_RX_TIMEOUT = (1 << 11), | ||
324 | + INT_STA_RX_DMA_STOP = (1 << 10), | ||
325 | + INT_STA_RX_BUF_UA = (1 << 9), | ||
326 | + INT_STA_RX = (1 << 8), | ||
327 | + INT_STA_TX_EARLY = (1 << 5), | ||
328 | + INT_STA_TX_UNDERFLOW = (1 << 4), | ||
329 | + INT_STA_TX_TIMEOUT = (1 << 3), | ||
330 | + INT_STA_TX_BUF_UA = (1 << 2), | ||
331 | + INT_STA_TX_DMA_STOP = (1 << 1), | ||
332 | + INT_STA_TX = (1 << 0), | ||
333 | +}; | ||
334 | + | ||
335 | +enum { | ||
336 | + INT_EN_RX_EARLY = (1 << 13), | ||
337 | + INT_EN_RX_OVERFLOW = (1 << 12), | ||
338 | + INT_EN_RX_TIMEOUT = (1 << 11), | ||
339 | + INT_EN_RX_DMA_STOP = (1 << 10), | ||
340 | + INT_EN_RX_BUF_UA = (1 << 9), | ||
341 | + INT_EN_RX = (1 << 8), | ||
342 | + INT_EN_TX_EARLY = (1 << 5), | ||
343 | + INT_EN_TX_UNDERFLOW = (1 << 4), | ||
344 | + INT_EN_TX_TIMEOUT = (1 << 3), | ||
345 | + INT_EN_TX_BUF_UA = (1 << 2), | ||
346 | + INT_EN_TX_DMA_STOP = (1 << 1), | ||
347 | + INT_EN_TX = (1 << 0), | ||
348 | +}; | ||
349 | + | ||
350 | +enum { | ||
351 | + TX_CTL0_TX_EN = (1 << 31), | ||
352 | + TX_CTL1_TX_DMA_START = (1 << 31), | ||
353 | + TX_CTL1_TX_DMA_EN = (1 << 30), | ||
354 | + TX_CTL1_TX_FLUSH = (1 << 0), | ||
355 | +}; | ||
356 | + | ||
357 | +enum { | ||
358 | + RX_CTL0_RX_EN = (1 << 31), | ||
359 | + RX_CTL0_STRIP_FCS = (1 << 28), | ||
360 | + RX_CTL0_CRC_IPV4 = (1 << 27), | ||
361 | +}; | ||
362 | + | ||
363 | +enum { | ||
364 | + RX_CTL1_RX_DMA_START = (1 << 31), | ||
365 | + RX_CTL1_RX_DMA_EN = (1 << 30), | ||
366 | + RX_CTL1_RX_MD = (1 << 1), | ||
367 | +}; | ||
368 | + | ||
369 | +enum { | ||
370 | + RX_FRM_FLT_DIS_ADDR = (1 << 31), | ||
371 | +}; | ||
372 | + | ||
373 | +enum { | ||
374 | + MII_CMD_PHY_ADDR_SHIFT = (12), | ||
375 | + MII_CMD_PHY_ADDR_MASK = (0xf000), | ||
376 | + MII_CMD_PHY_REG_SHIFT = (4), | ||
377 | + MII_CMD_PHY_REG_MASK = (0xf0), | ||
378 | + MII_CMD_PHY_RW = (1 << 1), | ||
379 | + MII_CMD_PHY_BUSY = (1 << 0), | ||
380 | +}; | ||
381 | + | ||
382 | +enum { | ||
383 | + TX_DMA_STA_STOP = (0b000), | ||
384 | + TX_DMA_STA_RUN_FETCH = (0b001), | ||
385 | + TX_DMA_STA_WAIT_STA = (0b010), | ||
386 | +}; | ||
387 | + | ||
388 | +enum { | ||
389 | + RX_DMA_STA_STOP = (0b000), | ||
390 | + RX_DMA_STA_RUN_FETCH = (0b001), | ||
391 | + RX_DMA_STA_WAIT_FRM = (0b011), | ||
392 | +}; | ||
393 | + | ||
394 | +/* EMAC register reset values */ | ||
395 | +enum { | ||
396 | + REG_BASIC_CTL_1_RST = 0x08000000, | ||
397 | +}; | ||
398 | + | ||
399 | +/* EMAC constants */ | ||
400 | +enum { | ||
401 | + AW_SUN8I_EMAC_MIN_PKT_SZ = 64 | ||
402 | +}; | ||
403 | + | ||
404 | +/* Transmit/receive frame descriptor */ | ||
405 | +typedef struct FrameDescriptor { | ||
406 | + uint32_t status; | ||
407 | + uint32_t status2; | ||
408 | + uint32_t addr; | ||
409 | + uint32_t next; | ||
410 | +} FrameDescriptor; | ||
411 | + | ||
412 | +/* Frame descriptor flags */ | ||
413 | +enum { | ||
414 | + DESC_STATUS_CTL = (1 << 31), | ||
415 | + DESC_STATUS2_BUF_SIZE_MASK = (0x7ff), | ||
416 | +}; | ||
417 | + | ||
418 | +/* Transmit frame descriptor flags */ | ||
419 | +enum { | ||
420 | + TX_DESC_STATUS_LENGTH_ERR = (1 << 14), | ||
421 | + TX_DESC_STATUS2_FIRST_DESC = (1 << 29), | ||
422 | + TX_DESC_STATUS2_LAST_DESC = (1 << 30), | ||
423 | + TX_DESC_STATUS2_CHECKSUM_MASK = (0x3 << 27), | ||
424 | +}; | ||
425 | + | ||
426 | +/* Receive frame descriptor flags */ | ||
427 | +enum { | ||
428 | + RX_DESC_STATUS_FIRST_DESC = (1 << 9), | ||
429 | + RX_DESC_STATUS_LAST_DESC = (1 << 8), | ||
430 | + RX_DESC_STATUS_FRM_LEN_MASK = (0x3fff0000), | ||
431 | + RX_DESC_STATUS_FRM_LEN_SHIFT = (16), | ||
432 | + RX_DESC_STATUS_NO_BUF = (1 << 14), | ||
433 | + RX_DESC_STATUS_HEADER_ERR = (1 << 7), | ||
434 | + RX_DESC_STATUS_LENGTH_ERR = (1 << 4), | ||
435 | + RX_DESC_STATUS_CRC_ERR = (1 << 1), | ||
436 | + RX_DESC_STATUS_PAYLOAD_ERR = (1 << 0), | ||
437 | + RX_DESC_STATUS2_RX_INT_CTL = (1 << 31), | ||
438 | +}; | ||
439 | + | ||
440 | +/* MII register offsets */ | ||
441 | +enum { | ||
442 | + MII_REG_CR = (0x0), /* Control */ | ||
443 | + MII_REG_ST = (0x1), /* Status */ | ||
444 | + MII_REG_ID_HIGH = (0x2), /* Identifier High */ | ||
445 | + MII_REG_ID_LOW = (0x3), /* Identifier Low */ | ||
446 | + MII_REG_ADV = (0x4), /* Advertised abilities */ | ||
447 | + MII_REG_LPA = (0x5), /* Link partner abilities */ | ||
448 | +}; | ||
449 | + | ||
450 | +/* MII register flags */ | ||
451 | +enum { | ||
452 | + MII_REG_CR_RESET = (1 << 15), | ||
453 | + MII_REG_CR_POWERDOWN = (1 << 11), | ||
454 | + MII_REG_CR_10Mbit = (0), | ||
455 | + MII_REG_CR_100Mbit = (1 << 13), | ||
456 | + MII_REG_CR_1000Mbit = (1 << 6), | ||
457 | + MII_REG_CR_AUTO_NEG = (1 << 12), | ||
458 | + MII_REG_CR_AUTO_NEG_RESTART = (1 << 9), | ||
459 | + MII_REG_CR_FULLDUPLEX = (1 << 8), | ||
460 | +}; | ||
461 | + | ||
462 | +enum { | ||
463 | + MII_REG_ST_100BASE_T4 = (1 << 15), | ||
464 | + MII_REG_ST_100BASE_X_FD = (1 << 14), | ||
465 | + MII_REG_ST_100BASE_X_HD = (1 << 13), | ||
466 | + MII_REG_ST_10_FD = (1 << 12), | ||
467 | + MII_REG_ST_10_HD = (1 << 11), | ||
468 | + MII_REG_ST_100BASE_T2_FD = (1 << 10), | ||
469 | + MII_REG_ST_100BASE_T2_HD = (1 << 9), | ||
470 | + MII_REG_ST_AUTONEG_COMPLETE = (1 << 5), | ||
471 | + MII_REG_ST_AUTONEG_AVAIL = (1 << 3), | ||
472 | + MII_REG_ST_LINK_UP = (1 << 2), | ||
473 | +}; | ||
474 | + | ||
475 | +enum { | ||
476 | + MII_REG_LPA_10_HD = (1 << 5), | ||
477 | + MII_REG_LPA_10_FD = (1 << 6), | ||
478 | + MII_REG_LPA_100_HD = (1 << 7), | ||
479 | + MII_REG_LPA_100_FD = (1 << 8), | ||
480 | + MII_REG_LPA_PAUSE = (1 << 10), | ||
481 | + MII_REG_LPA_ASYMPAUSE = (1 << 11), | ||
482 | +}; | ||
483 | + | ||
484 | +/* MII constants */ | ||
485 | +enum { | ||
486 | + MII_PHY_ID_HIGH = 0x0044, | ||
487 | + MII_PHY_ID_LOW = 0x1400, | ||
488 | +}; | ||
489 | + | ||
490 | +static void allwinner_sun8i_emac_mii_set_link(AwSun8iEmacState *s, | ||
491 | + bool link_active) | ||
492 | +{ | 65 | +{ |
493 | + if (link_active) { | 66 | + return float16_abs(a); |
494 | + s->mii_st |= MII_REG_ST_LINK_UP; | ||
495 | + } else { | ||
496 | + s->mii_st &= ~MII_REG_ST_LINK_UP; | ||
497 | + } | ||
498 | +} | 67 | +} |
499 | + | 68 | + |
500 | +static void allwinner_sun8i_emac_mii_reset(AwSun8iEmacState *s, | 69 | float32 VFP_HELPER(abs, s)(float32 a) |
501 | + bool link_active) | 70 | { |
71 | return float32_abs(a); | ||
72 | @@ -XXX,XX +XXX,XX @@ float64 VFP_HELPER(abs, d)(float64 a) | ||
73 | return float64_abs(a); | ||
74 | } | ||
75 | |||
76 | +dh_ctype_f16 VFP_HELPER(sqrt, h)(dh_ctype_f16 a, CPUARMState *env) | ||
502 | +{ | 77 | +{ |
503 | + s->mii_cr = MII_REG_CR_100Mbit | MII_REG_CR_AUTO_NEG | | 78 | + return float16_sqrt(a, &env->vfp.fp_status_f16); |
504 | + MII_REG_CR_FULLDUPLEX; | ||
505 | + s->mii_st = MII_REG_ST_100BASE_T4 | MII_REG_ST_100BASE_X_FD | | ||
506 | + MII_REG_ST_100BASE_X_HD | MII_REG_ST_10_FD | MII_REG_ST_10_HD | | ||
507 | + MII_REG_ST_100BASE_T2_FD | MII_REG_ST_100BASE_T2_HD | | ||
508 | + MII_REG_ST_AUTONEG_COMPLETE | MII_REG_ST_AUTONEG_AVAIL; | ||
509 | + s->mii_adv = 0; | ||
510 | + | ||
511 | + allwinner_sun8i_emac_mii_set_link(s, link_active); | ||
512 | +} | 79 | +} |
513 | + | 80 | + |
514 | +static void allwinner_sun8i_emac_mii_cmd(AwSun8iEmacState *s) | 81 | float32 VFP_HELPER(sqrt, s)(float32 a, CPUARMState *env) |
82 | { | ||
83 | return float32_sqrt(a, &env->vfp.fp_status); | ||
84 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
85 | index XXXXXXX..XXXXXXX 100644 | ||
86 | --- a/target/arm/translate-vfp.c.inc | ||
87 | +++ b/target/arm/translate-vfp.c.inc | ||
88 | @@ -XXX,XX +XXX,XX @@ static bool do_vfp_2op_sp(DisasContext *s, VFPGen2OpSPFn *fn, int vd, int vm) | ||
89 | return true; | ||
90 | } | ||
91 | |||
92 | +static bool do_vfp_2op_hp(DisasContext *s, VFPGen2OpSPFn *fn, int vd, int vm) | ||
515 | +{ | 93 | +{ |
516 | + uint8_t addr, reg; | 94 | + /* |
95 | + * Do a half-precision operation. Functionally this is | ||
96 | + * the same as do_vfp_2op_sp(), except: | ||
97 | + * - it doesn't need the VFP vector handling (fp16 is a | ||
98 | + * v8 feature, and in v8 VFP vectors don't exist) | ||
99 | + * - it does the aa32_fp16_arith feature test | ||
100 | + */ | ||
101 | + TCGv_i32 f0; | ||
517 | + | 102 | + |
518 | + addr = (s->mii_cmd & MII_CMD_PHY_ADDR_MASK) >> MII_CMD_PHY_ADDR_SHIFT; | 103 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
519 | + reg = (s->mii_cmd & MII_CMD_PHY_REG_MASK) >> MII_CMD_PHY_REG_SHIFT; | 104 | + return false; |
520 | + | ||
521 | + if (addr != s->mii_phy_addr) { | ||
522 | + return; | ||
523 | + } | 105 | + } |
524 | + | 106 | + |
525 | + /* Read or write a PHY register? */ | 107 | + if (s->vec_len != 0 || s->vec_stride != 0) { |
526 | + if (s->mii_cmd & MII_CMD_PHY_RW) { | 108 | + return false; |
527 | + trace_allwinner_sun8i_emac_mii_write_reg(reg, s->mii_data); | 109 | + } |
528 | + | 110 | + |
529 | + switch (reg) { | 111 | + if (!vfp_access_check(s)) { |
530 | + case MII_REG_CR: | 112 | + return true; |
531 | + if (s->mii_data & MII_REG_CR_RESET) { | 113 | + } |
532 | + allwinner_sun8i_emac_mii_reset(s, s->mii_st & | ||
533 | + MII_REG_ST_LINK_UP); | ||
534 | + } else { | ||
535 | + s->mii_cr = s->mii_data & ~(MII_REG_CR_RESET | | ||
536 | + MII_REG_CR_AUTO_NEG_RESTART); | ||
537 | + } | ||
538 | + break; | ||
539 | + case MII_REG_ADV: | ||
540 | + s->mii_adv = s->mii_data; | ||
541 | + break; | ||
542 | + case MII_REG_ID_HIGH: | ||
543 | + case MII_REG_ID_LOW: | ||
544 | + case MII_REG_LPA: | ||
545 | + break; | ||
546 | + default: | ||
547 | + qemu_log_mask(LOG_UNIMP, "allwinner-h3-emac: write access to " | ||
548 | + "unknown MII register 0x%x\n", reg); | ||
549 | + break; | ||
550 | + } | ||
551 | + } else { | ||
552 | + switch (reg) { | ||
553 | + case MII_REG_CR: | ||
554 | + s->mii_data = s->mii_cr; | ||
555 | + break; | ||
556 | + case MII_REG_ST: | ||
557 | + s->mii_data = s->mii_st; | ||
558 | + break; | ||
559 | + case MII_REG_ID_HIGH: | ||
560 | + s->mii_data = MII_PHY_ID_HIGH; | ||
561 | + break; | ||
562 | + case MII_REG_ID_LOW: | ||
563 | + s->mii_data = MII_PHY_ID_LOW; | ||
564 | + break; | ||
565 | + case MII_REG_ADV: | ||
566 | + s->mii_data = s->mii_adv; | ||
567 | + break; | ||
568 | + case MII_REG_LPA: | ||
569 | + s->mii_data = MII_REG_LPA_10_HD | MII_REG_LPA_10_FD | | ||
570 | + MII_REG_LPA_100_HD | MII_REG_LPA_100_FD | | ||
571 | + MII_REG_LPA_PAUSE | MII_REG_LPA_ASYMPAUSE; | ||
572 | + break; | ||
573 | + default: | ||
574 | + qemu_log_mask(LOG_UNIMP, "allwinner-h3-emac: read access to " | ||
575 | + "unknown MII register 0x%x\n", reg); | ||
576 | + s->mii_data = 0; | ||
577 | + break; | ||
578 | + } | ||
579 | + | 114 | + |
580 | + trace_allwinner_sun8i_emac_mii_read_reg(reg, s->mii_data); | 115 | + f0 = tcg_temp_new_i32(); |
581 | + } | 116 | + neon_load_reg32(f0, vm); |
117 | + fn(f0, f0); | ||
118 | + neon_store_reg32(f0, vd); | ||
119 | + tcg_temp_free_i32(f0); | ||
120 | + | ||
121 | + return true; | ||
582 | +} | 122 | +} |
583 | + | 123 | + |
584 | +static void allwinner_sun8i_emac_update_irq(AwSun8iEmacState *s) | 124 | static bool do_vfp_2op_dp(DisasContext *s, VFPGen2OpDPFn *fn, int vd, int vm) |
125 | { | ||
126 | uint32_t delta_m = 0; | ||
127 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMOV_imm_dp(DisasContext *s, arg_VMOV_imm_dp *a) | ||
128 | DO_VFP_2OP(VMOV_reg, sp, tcg_gen_mov_i32) | ||
129 | DO_VFP_2OP(VMOV_reg, dp, tcg_gen_mov_i64) | ||
130 | |||
131 | +DO_VFP_2OP(VABS, hp, gen_helper_vfp_absh) | ||
132 | DO_VFP_2OP(VABS, sp, gen_helper_vfp_abss) | ||
133 | DO_VFP_2OP(VABS, dp, gen_helper_vfp_absd) | ||
134 | |||
135 | +DO_VFP_2OP(VNEG, hp, gen_helper_vfp_negh) | ||
136 | DO_VFP_2OP(VNEG, sp, gen_helper_vfp_negs) | ||
137 | DO_VFP_2OP(VNEG, dp, gen_helper_vfp_negd) | ||
138 | |||
139 | +static void gen_VSQRT_hp(TCGv_i32 vd, TCGv_i32 vm) | ||
585 | +{ | 140 | +{ |
586 | + qemu_set_irq(s->irq, (s->int_sta & s->int_en) != 0); | 141 | + gen_helper_vfp_sqrth(vd, vm, cpu_env); |
587 | +} | 142 | +} |
588 | + | 143 | + |
589 | +static uint32_t allwinner_sun8i_emac_next_desc(FrameDescriptor *desc, | 144 | static void gen_VSQRT_sp(TCGv_i32 vd, TCGv_i32 vm) |
590 | + size_t min_size) | 145 | { |
591 | +{ | 146 | gen_helper_vfp_sqrts(vd, vm, cpu_env); |
592 | + uint32_t paddr = desc->next; | 147 | @@ -XXX,XX +XXX,XX @@ static void gen_VSQRT_dp(TCGv_i64 vd, TCGv_i64 vm) |
593 | + | 148 | gen_helper_vfp_sqrtd(vd, vm, cpu_env); |
594 | + cpu_physical_memory_read(paddr, desc, sizeof(*desc)); | 149 | } |
595 | + | 150 | |
596 | + if ((desc->status & DESC_STATUS_CTL) && | 151 | +DO_VFP_2OP(VSQRT, hp, gen_VSQRT_hp) |
597 | + (desc->status2 & DESC_STATUS2_BUF_SIZE_MASK) >= min_size) { | 152 | DO_VFP_2OP(VSQRT, sp, gen_VSQRT_sp) |
598 | + return paddr; | 153 | DO_VFP_2OP(VSQRT, dp, gen_VSQRT_dp) |
599 | + } else { | 154 | |
600 | + return 0; | ||
601 | + } | ||
602 | +} | ||
603 | + | ||
604 | +static uint32_t allwinner_sun8i_emac_get_desc(FrameDescriptor *desc, | ||
605 | + uint32_t start_addr, | ||
606 | + size_t min_size) | ||
607 | +{ | ||
608 | + uint32_t desc_addr = start_addr; | ||
609 | + | ||
610 | + /* Note that the list is a cycle. Last entry points back to the head. */ | ||
611 | + while (desc_addr != 0) { | ||
612 | + cpu_physical_memory_read(desc_addr, desc, sizeof(*desc)); | ||
613 | + | ||
614 | + if ((desc->status & DESC_STATUS_CTL) && | ||
615 | + (desc->status2 & DESC_STATUS2_BUF_SIZE_MASK) >= min_size) { | ||
616 | + return desc_addr; | ||
617 | + } else if (desc->next == start_addr) { | ||
618 | + break; | ||
619 | + } else { | ||
620 | + desc_addr = desc->next; | ||
621 | + } | ||
622 | + } | ||
623 | + | ||
624 | + return 0; | ||
625 | +} | ||
626 | + | ||
627 | +static uint32_t allwinner_sun8i_emac_rx_desc(AwSun8iEmacState *s, | ||
628 | + FrameDescriptor *desc, | ||
629 | + size_t min_size) | ||
630 | +{ | ||
631 | + return allwinner_sun8i_emac_get_desc(desc, s->rx_desc_curr, min_size); | ||
632 | +} | ||
633 | + | ||
634 | +static uint32_t allwinner_sun8i_emac_tx_desc(AwSun8iEmacState *s, | ||
635 | + FrameDescriptor *desc, | ||
636 | + size_t min_size) | ||
637 | +{ | ||
638 | + return allwinner_sun8i_emac_get_desc(desc, s->tx_desc_head, min_size); | ||
639 | +} | ||
640 | + | ||
641 | +static void allwinner_sun8i_emac_flush_desc(FrameDescriptor *desc, | ||
642 | + uint32_t phys_addr) | ||
643 | +{ | ||
644 | + cpu_physical_memory_write(phys_addr, desc, sizeof(*desc)); | ||
645 | +} | ||
646 | + | ||
647 | +static int allwinner_sun8i_emac_can_receive(NetClientState *nc) | ||
648 | +{ | ||
649 | + AwSun8iEmacState *s = qemu_get_nic_opaque(nc); | ||
650 | + FrameDescriptor desc; | ||
651 | + | ||
652 | + return (s->rx_ctl0 & RX_CTL0_RX_EN) && | ||
653 | + (allwinner_sun8i_emac_rx_desc(s, &desc, 0) != 0); | ||
654 | +} | ||
655 | + | ||
656 | +static ssize_t allwinner_sun8i_emac_receive(NetClientState *nc, | ||
657 | + const uint8_t *buf, | ||
658 | + size_t size) | ||
659 | +{ | ||
660 | + AwSun8iEmacState *s = qemu_get_nic_opaque(nc); | ||
661 | + FrameDescriptor desc; | ||
662 | + size_t bytes_left = size; | ||
663 | + size_t desc_bytes = 0; | ||
664 | + size_t pad_fcs_size = 4; | ||
665 | + size_t padding = 0; | ||
666 | + | ||
667 | + if (!(s->rx_ctl0 & RX_CTL0_RX_EN)) { | ||
668 | + return -1; | ||
669 | + } | ||
670 | + | ||
671 | + s->rx_desc_curr = allwinner_sun8i_emac_rx_desc(s, &desc, | ||
672 | + AW_SUN8I_EMAC_MIN_PKT_SZ); | ||
673 | + if (!s->rx_desc_curr) { | ||
674 | + s->int_sta |= INT_STA_RX_BUF_UA; | ||
675 | + } | ||
676 | + | ||
677 | + /* Keep filling RX descriptors until the whole frame is written */ | ||
678 | + while (s->rx_desc_curr && bytes_left > 0) { | ||
679 | + desc.status &= ~DESC_STATUS_CTL; | ||
680 | + desc.status &= ~RX_DESC_STATUS_FRM_LEN_MASK; | ||
681 | + | ||
682 | + if (bytes_left == size) { | ||
683 | + desc.status |= RX_DESC_STATUS_FIRST_DESC; | ||
684 | + } | ||
685 | + | ||
686 | + if ((desc.status2 & DESC_STATUS2_BUF_SIZE_MASK) < | ||
687 | + (bytes_left + pad_fcs_size)) { | ||
688 | + desc_bytes = desc.status2 & DESC_STATUS2_BUF_SIZE_MASK; | ||
689 | + desc.status |= desc_bytes << RX_DESC_STATUS_FRM_LEN_SHIFT; | ||
690 | + } else { | ||
691 | + padding = pad_fcs_size; | ||
692 | + if (bytes_left < AW_SUN8I_EMAC_MIN_PKT_SZ) { | ||
693 | + padding += (AW_SUN8I_EMAC_MIN_PKT_SZ - bytes_left); | ||
694 | + } | ||
695 | + | ||
696 | + desc_bytes = (bytes_left); | ||
697 | + desc.status |= RX_DESC_STATUS_LAST_DESC; | ||
698 | + desc.status |= (bytes_left + padding) | ||
699 | + << RX_DESC_STATUS_FRM_LEN_SHIFT; | ||
700 | + } | ||
701 | + | ||
702 | + cpu_physical_memory_write(desc.addr, buf, desc_bytes); | ||
703 | + allwinner_sun8i_emac_flush_desc(&desc, s->rx_desc_curr); | ||
704 | + trace_allwinner_sun8i_emac_receive(s->rx_desc_curr, desc.addr, | ||
705 | + desc_bytes); | ||
706 | + | ||
707 | + /* Check if frame needs to raise the receive interrupt */ | ||
708 | + if (!(desc.status2 & RX_DESC_STATUS2_RX_INT_CTL)) { | ||
709 | + s->int_sta |= INT_STA_RX; | ||
710 | + } | ||
711 | + | ||
712 | + /* Increment variables */ | ||
713 | + buf += desc_bytes; | ||
714 | + bytes_left -= desc_bytes; | ||
715 | + | ||
716 | + /* Move to the next descriptor */ | ||
717 | + s->rx_desc_curr = allwinner_sun8i_emac_next_desc(&desc, 64); | ||
718 | + if (!s->rx_desc_curr) { | ||
719 | + /* Not enough buffer space available */ | ||
720 | + s->int_sta |= INT_STA_RX_BUF_UA; | ||
721 | + s->rx_desc_curr = s->rx_desc_head; | ||
722 | + break; | ||
723 | + } | ||
724 | + } | ||
725 | + | ||
726 | + /* Report receive DMA is finished */ | ||
727 | + s->rx_ctl1 &= ~RX_CTL1_RX_DMA_START; | ||
728 | + allwinner_sun8i_emac_update_irq(s); | ||
729 | + | ||
730 | + return size; | ||
731 | +} | ||
732 | + | ||
733 | +static void allwinner_sun8i_emac_transmit(AwSun8iEmacState *s) | ||
734 | +{ | ||
735 | + NetClientState *nc = qemu_get_queue(s->nic); | ||
736 | + FrameDescriptor desc; | ||
737 | + size_t bytes = 0; | ||
738 | + size_t packet_bytes = 0; | ||
739 | + size_t transmitted = 0; | ||
740 | + static uint8_t packet_buf[2048]; | ||
741 | + | ||
742 | + s->tx_desc_curr = allwinner_sun8i_emac_tx_desc(s, &desc, 0); | ||
743 | + | ||
744 | + /* Read all transmit descriptors */ | ||
745 | + while (s->tx_desc_curr != 0) { | ||
746 | + | ||
747 | + /* Read from physical memory into packet buffer */ | ||
748 | + bytes = desc.status2 & DESC_STATUS2_BUF_SIZE_MASK; | ||
749 | + if (bytes + packet_bytes > sizeof(packet_buf)) { | ||
750 | + desc.status |= TX_DESC_STATUS_LENGTH_ERR; | ||
751 | + break; | ||
752 | + } | ||
753 | + cpu_physical_memory_read(desc.addr, packet_buf + packet_bytes, bytes); | ||
754 | + packet_bytes += bytes; | ||
755 | + desc.status &= ~DESC_STATUS_CTL; | ||
756 | + allwinner_sun8i_emac_flush_desc(&desc, s->tx_desc_curr); | ||
757 | + | ||
758 | + /* After the last descriptor, send the packet */ | ||
759 | + if (desc.status2 & TX_DESC_STATUS2_LAST_DESC) { | ||
760 | + if (desc.status2 & TX_DESC_STATUS2_CHECKSUM_MASK) { | ||
761 | + net_checksum_calculate(packet_buf, packet_bytes); | ||
762 | + } | ||
763 | + | ||
764 | + qemu_send_packet(nc, packet_buf, packet_bytes); | ||
765 | + trace_allwinner_sun8i_emac_transmit(s->tx_desc_curr, desc.addr, | ||
766 | + bytes); | ||
767 | + | ||
768 | + packet_bytes = 0; | ||
769 | + transmitted++; | ||
770 | + } | ||
771 | + s->tx_desc_curr = allwinner_sun8i_emac_next_desc(&desc, 0); | ||
772 | + } | ||
773 | + | ||
774 | + /* Raise transmit completed interrupt */ | ||
775 | + if (transmitted > 0) { | ||
776 | + s->int_sta |= INT_STA_TX; | ||
777 | + s->tx_ctl1 &= ~TX_CTL1_TX_DMA_START; | ||
778 | + allwinner_sun8i_emac_update_irq(s); | ||
779 | + } | ||
780 | +} | ||
781 | + | ||
782 | +static void allwinner_sun8i_emac_reset(DeviceState *dev) | ||
783 | +{ | ||
784 | + AwSun8iEmacState *s = AW_SUN8I_EMAC(dev); | ||
785 | + NetClientState *nc = qemu_get_queue(s->nic); | ||
786 | + | ||
787 | + trace_allwinner_sun8i_emac_reset(); | ||
788 | + | ||
789 | + s->mii_cmd = 0; | ||
790 | + s->mii_data = 0; | ||
791 | + s->basic_ctl0 = 0; | ||
792 | + s->basic_ctl1 = REG_BASIC_CTL_1_RST; | ||
793 | + s->int_en = 0; | ||
794 | + s->int_sta = 0; | ||
795 | + s->frm_flt = 0; | ||
796 | + s->rx_ctl0 = 0; | ||
797 | + s->rx_ctl1 = RX_CTL1_RX_MD; | ||
798 | + s->rx_desc_head = 0; | ||
799 | + s->rx_desc_curr = 0; | ||
800 | + s->tx_ctl0 = 0; | ||
801 | + s->tx_ctl1 = 0; | ||
802 | + s->tx_desc_head = 0; | ||
803 | + s->tx_desc_curr = 0; | ||
804 | + s->tx_flowctl = 0; | ||
805 | + | ||
806 | + allwinner_sun8i_emac_mii_reset(s, !nc->link_down); | ||
807 | +} | ||
808 | + | ||
809 | +static uint64_t allwinner_sun8i_emac_read(void *opaque, hwaddr offset, | ||
810 | + unsigned size) | ||
811 | +{ | ||
812 | + AwSun8iEmacState *s = AW_SUN8I_EMAC(opaque); | ||
813 | + uint64_t value = 0; | ||
814 | + FrameDescriptor desc; | ||
815 | + | ||
816 | + switch (offset) { | ||
817 | + case REG_BASIC_CTL_0: /* Basic Control 0 */ | ||
818 | + value = s->basic_ctl0; | ||
819 | + break; | ||
820 | + case REG_BASIC_CTL_1: /* Basic Control 1 */ | ||
821 | + value = s->basic_ctl1; | ||
822 | + break; | ||
823 | + case REG_INT_STA: /* Interrupt Status */ | ||
824 | + value = s->int_sta; | ||
825 | + break; | ||
826 | + case REG_INT_EN: /* Interupt Enable */ | ||
827 | + value = s->int_en; | ||
828 | + break; | ||
829 | + case REG_TX_CTL_0: /* Transmit Control 0 */ | ||
830 | + value = s->tx_ctl0; | ||
831 | + break; | ||
832 | + case REG_TX_CTL_1: /* Transmit Control 1 */ | ||
833 | + value = s->tx_ctl1; | ||
834 | + break; | ||
835 | + case REG_TX_FLOW_CTL: /* Transmit Flow Control */ | ||
836 | + value = s->tx_flowctl; | ||
837 | + break; | ||
838 | + case REG_TX_DMA_DESC_LIST: /* Transmit Descriptor List Address */ | ||
839 | + value = s->tx_desc_head; | ||
840 | + break; | ||
841 | + case REG_RX_CTL_0: /* Receive Control 0 */ | ||
842 | + value = s->rx_ctl0; | ||
843 | + break; | ||
844 | + case REG_RX_CTL_1: /* Receive Control 1 */ | ||
845 | + value = s->rx_ctl1; | ||
846 | + break; | ||
847 | + case REG_RX_DMA_DESC_LIST: /* Receive Descriptor List Address */ | ||
848 | + value = s->rx_desc_head; | ||
849 | + break; | ||
850 | + case REG_FRM_FLT: /* Receive Frame Filter */ | ||
851 | + value = s->frm_flt; | ||
852 | + break; | ||
853 | + case REG_RX_HASH_0: /* Receive Hash Table 0 */ | ||
854 | + case REG_RX_HASH_1: /* Receive Hash Table 1 */ | ||
855 | + break; | ||
856 | + case REG_MII_CMD: /* Management Interface Command */ | ||
857 | + value = s->mii_cmd; | ||
858 | + break; | ||
859 | + case REG_MII_DATA: /* Management Interface Data */ | ||
860 | + value = s->mii_data; | ||
861 | + break; | ||
862 | + case REG_ADDR_HIGH: /* MAC Address High */ | ||
863 | + value = *(((uint32_t *) (s->conf.macaddr.a)) + 1); | ||
864 | + break; | ||
865 | + case REG_ADDR_LOW: /* MAC Address Low */ | ||
866 | + value = *(uint32_t *) (s->conf.macaddr.a); | ||
867 | + break; | ||
868 | + case REG_TX_DMA_STA: /* Transmit DMA Status */ | ||
869 | + break; | ||
870 | + case REG_TX_CUR_DESC: /* Transmit Current Descriptor */ | ||
871 | + value = s->tx_desc_curr; | ||
872 | + break; | ||
873 | + case REG_TX_CUR_BUF: /* Transmit Current Buffer */ | ||
874 | + if (s->tx_desc_curr != 0) { | ||
875 | + cpu_physical_memory_read(s->tx_desc_curr, &desc, sizeof(desc)); | ||
876 | + value = desc.addr; | ||
877 | + } else { | ||
878 | + value = 0; | ||
879 | + } | ||
880 | + break; | ||
881 | + case REG_RX_DMA_STA: /* Receive DMA Status */ | ||
882 | + break; | ||
883 | + case REG_RX_CUR_DESC: /* Receive Current Descriptor */ | ||
884 | + value = s->rx_desc_curr; | ||
885 | + break; | ||
886 | + case REG_RX_CUR_BUF: /* Receive Current Buffer */ | ||
887 | + if (s->rx_desc_curr != 0) { | ||
888 | + cpu_physical_memory_read(s->rx_desc_curr, &desc, sizeof(desc)); | ||
889 | + value = desc.addr; | ||
890 | + } else { | ||
891 | + value = 0; | ||
892 | + } | ||
893 | + break; | ||
894 | + case REG_RGMII_STA: /* RGMII Status */ | ||
895 | + break; | ||
896 | + default: | ||
897 | + qemu_log_mask(LOG_UNIMP, "allwinner-h3-emac: read access to unknown " | ||
898 | + "EMAC register 0x" TARGET_FMT_plx "\n", | ||
899 | + offset); | ||
900 | + } | ||
901 | + | ||
902 | + trace_allwinner_sun8i_emac_read(offset, value); | ||
903 | + return value; | ||
904 | +} | ||
905 | + | ||
906 | +static void allwinner_sun8i_emac_write(void *opaque, hwaddr offset, | ||
907 | + uint64_t value, unsigned size) | ||
908 | +{ | ||
909 | + AwSun8iEmacState *s = AW_SUN8I_EMAC(opaque); | ||
910 | + NetClientState *nc = qemu_get_queue(s->nic); | ||
911 | + | ||
912 | + trace_allwinner_sun8i_emac_write(offset, value); | ||
913 | + | ||
914 | + switch (offset) { | ||
915 | + case REG_BASIC_CTL_0: /* Basic Control 0 */ | ||
916 | + s->basic_ctl0 = value; | ||
917 | + break; | ||
918 | + case REG_BASIC_CTL_1: /* Basic Control 1 */ | ||
919 | + if (value & BASIC_CTL1_SOFTRST) { | ||
920 | + allwinner_sun8i_emac_reset(DEVICE(s)); | ||
921 | + value &= ~BASIC_CTL1_SOFTRST; | ||
922 | + } | ||
923 | + s->basic_ctl1 = value; | ||
924 | + if (allwinner_sun8i_emac_can_receive(nc)) { | ||
925 | + qemu_flush_queued_packets(nc); | ||
926 | + } | ||
927 | + break; | ||
928 | + case REG_INT_STA: /* Interrupt Status */ | ||
929 | + s->int_sta &= ~value; | ||
930 | + allwinner_sun8i_emac_update_irq(s); | ||
931 | + break; | ||
932 | + case REG_INT_EN: /* Interrupt Enable */ | ||
933 | + s->int_en = value; | ||
934 | + allwinner_sun8i_emac_update_irq(s); | ||
935 | + break; | ||
936 | + case REG_TX_CTL_0: /* Transmit Control 0 */ | ||
937 | + s->tx_ctl0 = value; | ||
938 | + break; | ||
939 | + case REG_TX_CTL_1: /* Transmit Control 1 */ | ||
940 | + s->tx_ctl1 = value; | ||
941 | + if (value & TX_CTL1_TX_DMA_EN) { | ||
942 | + allwinner_sun8i_emac_transmit(s); | ||
943 | + } | ||
944 | + break; | ||
945 | + case REG_TX_FLOW_CTL: /* Transmit Flow Control */ | ||
946 | + s->tx_flowctl = value; | ||
947 | + break; | ||
948 | + case REG_TX_DMA_DESC_LIST: /* Transmit Descriptor List Address */ | ||
949 | + s->tx_desc_head = value; | ||
950 | + s->tx_desc_curr = value; | ||
951 | + break; | ||
952 | + case REG_RX_CTL_0: /* Receive Control 0 */ | ||
953 | + s->rx_ctl0 = value; | ||
954 | + break; | ||
955 | + case REG_RX_CTL_1: /* Receive Control 1 */ | ||
956 | + s->rx_ctl1 = value | RX_CTL1_RX_MD; | ||
957 | + if ((value & RX_CTL1_RX_DMA_EN) && | ||
958 | + allwinner_sun8i_emac_can_receive(nc)) { | ||
959 | + qemu_flush_queued_packets(nc); | ||
960 | + } | ||
961 | + break; | ||
962 | + case REG_RX_DMA_DESC_LIST: /* Receive Descriptor List Address */ | ||
963 | + s->rx_desc_head = value; | ||
964 | + s->rx_desc_curr = value; | ||
965 | + break; | ||
966 | + case REG_FRM_FLT: /* Receive Frame Filter */ | ||
967 | + s->frm_flt = value; | ||
968 | + break; | ||
969 | + case REG_RX_HASH_0: /* Receive Hash Table 0 */ | ||
970 | + case REG_RX_HASH_1: /* Receive Hash Table 1 */ | ||
971 | + break; | ||
972 | + case REG_MII_CMD: /* Management Interface Command */ | ||
973 | + s->mii_cmd = value & ~MII_CMD_PHY_BUSY; | ||
974 | + allwinner_sun8i_emac_mii_cmd(s); | ||
975 | + break; | ||
976 | + case REG_MII_DATA: /* Management Interface Data */ | ||
977 | + s->mii_data = value; | ||
978 | + break; | ||
979 | + case REG_ADDR_HIGH: /* MAC Address High */ | ||
980 | + s->conf.macaddr.a[4] = (value & 0xff); | ||
981 | + s->conf.macaddr.a[5] = (value & 0xff00) >> 8; | ||
982 | + break; | ||
983 | + case REG_ADDR_LOW: /* MAC Address Low */ | ||
984 | + s->conf.macaddr.a[0] = (value & 0xff); | ||
985 | + s->conf.macaddr.a[1] = (value & 0xff00) >> 8; | ||
986 | + s->conf.macaddr.a[2] = (value & 0xff0000) >> 16; | ||
987 | + s->conf.macaddr.a[3] = (value & 0xff000000) >> 24; | ||
988 | + break; | ||
989 | + case REG_TX_DMA_STA: /* Transmit DMA Status */ | ||
990 | + case REG_TX_CUR_DESC: /* Transmit Current Descriptor */ | ||
991 | + case REG_TX_CUR_BUF: /* Transmit Current Buffer */ | ||
992 | + case REG_RX_DMA_STA: /* Receive DMA Status */ | ||
993 | + case REG_RX_CUR_DESC: /* Receive Current Descriptor */ | ||
994 | + case REG_RX_CUR_BUF: /* Receive Current Buffer */ | ||
995 | + case REG_RGMII_STA: /* RGMII Status */ | ||
996 | + break; | ||
997 | + default: | ||
998 | + qemu_log_mask(LOG_UNIMP, "allwinner-h3-emac: write access to unknown " | ||
999 | + "EMAC register 0x" TARGET_FMT_plx "\n", | ||
1000 | + offset); | ||
1001 | + } | ||
1002 | +} | ||
1003 | + | ||
1004 | +static void allwinner_sun8i_emac_set_link(NetClientState *nc) | ||
1005 | +{ | ||
1006 | + AwSun8iEmacState *s = qemu_get_nic_opaque(nc); | ||
1007 | + | ||
1008 | + trace_allwinner_sun8i_emac_set_link(!nc->link_down); | ||
1009 | + allwinner_sun8i_emac_mii_set_link(s, !nc->link_down); | ||
1010 | +} | ||
1011 | + | ||
1012 | +static const MemoryRegionOps allwinner_sun8i_emac_mem_ops = { | ||
1013 | + .read = allwinner_sun8i_emac_read, | ||
1014 | + .write = allwinner_sun8i_emac_write, | ||
1015 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
1016 | + .valid = { | ||
1017 | + .min_access_size = 4, | ||
1018 | + .max_access_size = 4, | ||
1019 | + }, | ||
1020 | + .impl.min_access_size = 4, | ||
1021 | +}; | ||
1022 | + | ||
1023 | +static NetClientInfo net_allwinner_sun8i_emac_info = { | ||
1024 | + .type = NET_CLIENT_DRIVER_NIC, | ||
1025 | + .size = sizeof(NICState), | ||
1026 | + .can_receive = allwinner_sun8i_emac_can_receive, | ||
1027 | + .receive = allwinner_sun8i_emac_receive, | ||
1028 | + .link_status_changed = allwinner_sun8i_emac_set_link, | ||
1029 | +}; | ||
1030 | + | ||
1031 | +static void allwinner_sun8i_emac_init(Object *obj) | ||
1032 | +{ | ||
1033 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
1034 | + AwSun8iEmacState *s = AW_SUN8I_EMAC(obj); | ||
1035 | + | ||
1036 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_sun8i_emac_mem_ops, | ||
1037 | + s, TYPE_AW_SUN8I_EMAC, 64 * KiB); | ||
1038 | + sysbus_init_mmio(sbd, &s->iomem); | ||
1039 | + sysbus_init_irq(sbd, &s->irq); | ||
1040 | +} | ||
1041 | + | ||
1042 | +static void allwinner_sun8i_emac_realize(DeviceState *dev, Error **errp) | ||
1043 | +{ | ||
1044 | + AwSun8iEmacState *s = AW_SUN8I_EMAC(dev); | ||
1045 | + | ||
1046 | + qemu_macaddr_default_if_unset(&s->conf.macaddr); | ||
1047 | + s->nic = qemu_new_nic(&net_allwinner_sun8i_emac_info, &s->conf, | ||
1048 | + object_get_typename(OBJECT(dev)), dev->id, s); | ||
1049 | + qemu_format_nic_info_str(qemu_get_queue(s->nic), s->conf.macaddr.a); | ||
1050 | +} | ||
1051 | + | ||
1052 | +static Property allwinner_sun8i_emac_properties[] = { | ||
1053 | + DEFINE_NIC_PROPERTIES(AwSun8iEmacState, conf), | ||
1054 | + DEFINE_PROP_UINT8("phy-addr", AwSun8iEmacState, mii_phy_addr, 0), | ||
1055 | + DEFINE_PROP_END_OF_LIST(), | ||
1056 | +}; | ||
1057 | + | ||
1058 | +static int allwinner_sun8i_emac_post_load(void *opaque, int version_id) | ||
1059 | +{ | ||
1060 | + AwSun8iEmacState *s = opaque; | ||
1061 | + | ||
1062 | + allwinner_sun8i_emac_set_link(qemu_get_queue(s->nic)); | ||
1063 | + | ||
1064 | + return 0; | ||
1065 | +} | ||
1066 | + | ||
1067 | +static const VMStateDescription vmstate_aw_emac = { | ||
1068 | + .name = "allwinner-sun8i-emac", | ||
1069 | + .version_id = 1, | ||
1070 | + .minimum_version_id = 1, | ||
1071 | + .post_load = allwinner_sun8i_emac_post_load, | ||
1072 | + .fields = (VMStateField[]) { | ||
1073 | + VMSTATE_UINT8(mii_phy_addr, AwSun8iEmacState), | ||
1074 | + VMSTATE_UINT32(mii_cmd, AwSun8iEmacState), | ||
1075 | + VMSTATE_UINT32(mii_data, AwSun8iEmacState), | ||
1076 | + VMSTATE_UINT32(mii_cr, AwSun8iEmacState), | ||
1077 | + VMSTATE_UINT32(mii_st, AwSun8iEmacState), | ||
1078 | + VMSTATE_UINT32(mii_adv, AwSun8iEmacState), | ||
1079 | + VMSTATE_UINT32(basic_ctl0, AwSun8iEmacState), | ||
1080 | + VMSTATE_UINT32(basic_ctl1, AwSun8iEmacState), | ||
1081 | + VMSTATE_UINT32(int_en, AwSun8iEmacState), | ||
1082 | + VMSTATE_UINT32(int_sta, AwSun8iEmacState), | ||
1083 | + VMSTATE_UINT32(frm_flt, AwSun8iEmacState), | ||
1084 | + VMSTATE_UINT32(rx_ctl0, AwSun8iEmacState), | ||
1085 | + VMSTATE_UINT32(rx_ctl1, AwSun8iEmacState), | ||
1086 | + VMSTATE_UINT32(rx_desc_head, AwSun8iEmacState), | ||
1087 | + VMSTATE_UINT32(rx_desc_curr, AwSun8iEmacState), | ||
1088 | + VMSTATE_UINT32(tx_ctl0, AwSun8iEmacState), | ||
1089 | + VMSTATE_UINT32(tx_ctl1, AwSun8iEmacState), | ||
1090 | + VMSTATE_UINT32(tx_desc_head, AwSun8iEmacState), | ||
1091 | + VMSTATE_UINT32(tx_desc_curr, AwSun8iEmacState), | ||
1092 | + VMSTATE_UINT32(tx_flowctl, AwSun8iEmacState), | ||
1093 | + VMSTATE_END_OF_LIST() | ||
1094 | + } | ||
1095 | +}; | ||
1096 | + | ||
1097 | +static void allwinner_sun8i_emac_class_init(ObjectClass *klass, void *data) | ||
1098 | +{ | ||
1099 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
1100 | + | ||
1101 | + dc->realize = allwinner_sun8i_emac_realize; | ||
1102 | + dc->reset = allwinner_sun8i_emac_reset; | ||
1103 | + dc->vmsd = &vmstate_aw_emac; | ||
1104 | + device_class_set_props(dc, allwinner_sun8i_emac_properties); | ||
1105 | +} | ||
1106 | + | ||
1107 | +static const TypeInfo allwinner_sun8i_emac_info = { | ||
1108 | + .name = TYPE_AW_SUN8I_EMAC, | ||
1109 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
1110 | + .instance_size = sizeof(AwSun8iEmacState), | ||
1111 | + .instance_init = allwinner_sun8i_emac_init, | ||
1112 | + .class_init = allwinner_sun8i_emac_class_init, | ||
1113 | +}; | ||
1114 | + | ||
1115 | +static void allwinner_sun8i_emac_register_types(void) | ||
1116 | +{ | ||
1117 | + type_register_static(&allwinner_sun8i_emac_info); | ||
1118 | +} | ||
1119 | + | ||
1120 | +type_init(allwinner_sun8i_emac_register_types) | ||
1121 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
1122 | index XXXXXXX..XXXXXXX 100644 | ||
1123 | --- a/hw/arm/Kconfig | ||
1124 | +++ b/hw/arm/Kconfig | ||
1125 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_A10 | ||
1126 | config ALLWINNER_H3 | ||
1127 | bool | ||
1128 | select ALLWINNER_A10_PIT | ||
1129 | + select ALLWINNER_SUN8I_EMAC | ||
1130 | select SERIAL | ||
1131 | select ARM_TIMER | ||
1132 | select ARM_GIC | ||
1133 | diff --git a/hw/net/Kconfig b/hw/net/Kconfig | ||
1134 | index XXXXXXX..XXXXXXX 100644 | ||
1135 | --- a/hw/net/Kconfig | ||
1136 | +++ b/hw/net/Kconfig | ||
1137 | @@ -XXX,XX +XXX,XX @@ config MIPSNET | ||
1138 | config ALLWINNER_EMAC | ||
1139 | bool | ||
1140 | |||
1141 | +config ALLWINNER_SUN8I_EMAC | ||
1142 | + bool | ||
1143 | + | ||
1144 | config IMX_FEC | ||
1145 | bool | ||
1146 | |||
1147 | diff --git a/hw/net/trace-events b/hw/net/trace-events | ||
1148 | index XXXXXXX..XXXXXXX 100644 | ||
1149 | --- a/hw/net/trace-events | ||
1150 | +++ b/hw/net/trace-events | ||
1151 | @@ -XXX,XX +XXX,XX @@ | ||
1152 | # See docs/devel/tracing.txt for syntax documentation. | ||
1153 | |||
1154 | +# allwinner-sun8i-emac.c | ||
1155 | +allwinner_sun8i_emac_mii_write_reg(uint32_t reg, uint32_t value) "MII write: reg=0x%" PRIx32 " value=0x%" PRIx32 | ||
1156 | +allwinner_sun8i_emac_mii_read_reg(uint32_t reg, uint32_t value) "MII read: reg=0x%" PRIx32 " value=0x%" PRIx32 | ||
1157 | +allwinner_sun8i_emac_receive(uint32_t desc, uint32_t paddr, uint32_t bytes) "RX packet: desc=0x%" PRIx32 " paddr=0x%" PRIx32 " bytes=%" PRIu32 | ||
1158 | +allwinner_sun8i_emac_transmit(uint32_t desc, uint32_t paddr, uint32_t bytes) "TX packet: desc=0x%" PRIx32 " paddr=0x%" PRIx32 " bytes=%" PRIu32 | ||
1159 | +allwinner_sun8i_emac_reset(void) "HW reset" | ||
1160 | +allwinner_sun8i_emac_set_link(bool active) "Set link: active=%u" | ||
1161 | +allwinner_sun8i_emac_read(uint64_t offset, uint64_t val) "MMIO read: offset=0x%" PRIx64 " value=0x%" PRIx64 | ||
1162 | +allwinner_sun8i_emac_write(uint64_t offset, uint64_t val) "MMIO write: offset=0x%" PRIx64 " value=0x%" PRIx64 | ||
1163 | + | ||
1164 | # etraxfs_eth.c | ||
1165 | mdio_phy_read(int regnum, uint16_t value) "read phy_reg:%d value:0x%04x" | ||
1166 | mdio_phy_write(int regnum, uint16_t value) "write phy_reg:%d value:0x%04x" | ||
1167 | -- | 155 | -- |
1168 | 2.20.1 | 156 | 2.20.1 |
1169 | 157 | ||
1170 | 158 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Implement VFP fp16 support for the VMOV immediate insn. | ||
1 | 2 | ||
3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20200828183354.27913-10-peter.maydell@linaro.org | ||
6 | --- | ||
7 | target/arm/vfp.decode | 2 ++ | ||
8 | target/arm/translate-vfp.c.inc | 22 ++++++++++++++++++++++ | ||
9 | 2 files changed, 24 insertions(+) | ||
10 | |||
11 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
12 | index XXXXXXX..XXXXXXX 100644 | ||
13 | --- a/target/arm/vfp.decode | ||
14 | +++ b/target/arm/vfp.decode | ||
15 | @@ -XXX,XX +XXX,XX @@ VFMS_dp ---- 1110 1.10 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
16 | VFNMA_dp ---- 1110 1.01 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
17 | VFNMS_dp ---- 1110 1.01 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
18 | |||
19 | +VMOV_imm_hp ---- 1110 1.11 .... .... 1001 0000 .... \ | ||
20 | + vd=%vd_sp imm=%vmov_imm | ||
21 | VMOV_imm_sp ---- 1110 1.11 .... .... 1010 0000 .... \ | ||
22 | vd=%vd_sp imm=%vmov_imm | ||
23 | VMOV_imm_dp ---- 1110 1.11 .... .... 1011 0000 .... \ | ||
24 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/target/arm/translate-vfp.c.inc | ||
27 | +++ b/target/arm/translate-vfp.c.inc | ||
28 | @@ -XXX,XX +XXX,XX @@ MAKE_VFM_TRANS_FNS(hp) | ||
29 | MAKE_VFM_TRANS_FNS(sp) | ||
30 | MAKE_VFM_TRANS_FNS(dp) | ||
31 | |||
32 | +static bool trans_VMOV_imm_hp(DisasContext *s, arg_VMOV_imm_sp *a) | ||
33 | +{ | ||
34 | + TCGv_i32 fd; | ||
35 | + | ||
36 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
37 | + return false; | ||
38 | + } | ||
39 | + | ||
40 | + if (s->vec_len != 0 || s->vec_stride != 0) { | ||
41 | + return false; | ||
42 | + } | ||
43 | + | ||
44 | + if (!vfp_access_check(s)) { | ||
45 | + return true; | ||
46 | + } | ||
47 | + | ||
48 | + fd = tcg_const_i32(vfp_expand_imm(MO_16, a->imm)); | ||
49 | + neon_store_reg32(fd, a->vd); | ||
50 | + tcg_temp_free_i32(fd); | ||
51 | + return true; | ||
52 | +} | ||
53 | + | ||
54 | static bool trans_VMOV_imm_sp(DisasContext *s, arg_VMOV_imm_sp *a) | ||
55 | { | ||
56 | uint32_t delta_d = 0; | ||
57 | -- | ||
58 | 2.20.1 | ||
59 | |||
60 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Implement fp16 version of VCMP. | ||
1 | 2 | ||
3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20200828183354.27913-11-peter.maydell@linaro.org | ||
6 | --- | ||
7 | target/arm/helper.h | 2 ++ | ||
8 | target/arm/vfp.decode | 2 ++ | ||
9 | target/arm/vfp_helper.c | 15 +++++++------ | ||
10 | target/arm/translate-vfp.c.inc | 39 ++++++++++++++++++++++++++++++++++ | ||
11 | 4 files changed, 51 insertions(+), 7 deletions(-) | ||
12 | |||
13 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
14 | index XXXXXXX..XXXXXXX 100644 | ||
15 | --- a/target/arm/helper.h | ||
16 | +++ b/target/arm/helper.h | ||
17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_1(vfp_absd, f64, f64) | ||
18 | DEF_HELPER_2(vfp_sqrth, f16, f16, env) | ||
19 | DEF_HELPER_2(vfp_sqrts, f32, f32, env) | ||
20 | DEF_HELPER_2(vfp_sqrtd, f64, f64, env) | ||
21 | +DEF_HELPER_3(vfp_cmph, void, f16, f16, env) | ||
22 | DEF_HELPER_3(vfp_cmps, void, f32, f32, env) | ||
23 | DEF_HELPER_3(vfp_cmpd, void, f64, f64, env) | ||
24 | +DEF_HELPER_3(vfp_cmpeh, void, f16, f16, env) | ||
25 | DEF_HELPER_3(vfp_cmpes, void, f32, f32, env) | ||
26 | DEF_HELPER_3(vfp_cmped, void, f64, f64, env) | ||
27 | |||
28 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
29 | index XXXXXXX..XXXXXXX 100644 | ||
30 | --- a/target/arm/vfp.decode | ||
31 | +++ b/target/arm/vfp.decode | ||
32 | @@ -XXX,XX +XXX,XX @@ VSQRT_hp ---- 1110 1.11 0001 .... 1001 11.0 .... @vfp_dm_ss | ||
33 | VSQRT_sp ---- 1110 1.11 0001 .... 1010 11.0 .... @vfp_dm_ss | ||
34 | VSQRT_dp ---- 1110 1.11 0001 .... 1011 11.0 .... @vfp_dm_dd | ||
35 | |||
36 | +VCMP_hp ---- 1110 1.11 010 z:1 .... 1001 e:1 1.0 .... \ | ||
37 | + vd=%vd_sp vm=%vm_sp | ||
38 | VCMP_sp ---- 1110 1.11 010 z:1 .... 1010 e:1 1.0 .... \ | ||
39 | vd=%vd_sp vm=%vm_sp | ||
40 | VCMP_dp ---- 1110 1.11 010 z:1 .... 1011 e:1 1.0 .... \ | ||
41 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
42 | index XXXXXXX..XXXXXXX 100644 | ||
43 | --- a/target/arm/vfp_helper.c | ||
44 | +++ b/target/arm/vfp_helper.c | ||
45 | @@ -XXX,XX +XXX,XX @@ static void softfloat_to_vfp_compare(CPUARMState *env, FloatRelation cmp) | ||
46 | } | ||
47 | |||
48 | /* XXX: check quiet/signaling case */ | ||
49 | -#define DO_VFP_cmp(p, type) \ | ||
50 | -void VFP_HELPER(cmp, p)(type a, type b, CPUARMState *env) \ | ||
51 | +#define DO_VFP_cmp(P, FLOATTYPE, ARGTYPE, FPST) \ | ||
52 | +void VFP_HELPER(cmp, P)(ARGTYPE a, ARGTYPE b, CPUARMState *env) \ | ||
53 | { \ | ||
54 | softfloat_to_vfp_compare(env, \ | ||
55 | - type ## _compare_quiet(a, b, &env->vfp.fp_status)); \ | ||
56 | + FLOATTYPE ## _compare_quiet(a, b, &env->vfp.FPST)); \ | ||
57 | } \ | ||
58 | -void VFP_HELPER(cmpe, p)(type a, type b, CPUARMState *env) \ | ||
59 | +void VFP_HELPER(cmpe, P)(ARGTYPE a, ARGTYPE b, CPUARMState *env) \ | ||
60 | { \ | ||
61 | softfloat_to_vfp_compare(env, \ | ||
62 | - type ## _compare(a, b, &env->vfp.fp_status)); \ | ||
63 | + FLOATTYPE ## _compare(a, b, &env->vfp.FPST)); \ | ||
64 | } | ||
65 | -DO_VFP_cmp(s, float32) | ||
66 | -DO_VFP_cmp(d, float64) | ||
67 | +DO_VFP_cmp(h, float16, dh_ctype_f16, fp_status_f16) | ||
68 | +DO_VFP_cmp(s, float32, float32, fp_status) | ||
69 | +DO_VFP_cmp(d, float64, float64, fp_status) | ||
70 | #undef DO_VFP_cmp | ||
71 | |||
72 | /* Integer to float and float to integer conversions */ | ||
73 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
74 | index XXXXXXX..XXXXXXX 100644 | ||
75 | --- a/target/arm/translate-vfp.c.inc | ||
76 | +++ b/target/arm/translate-vfp.c.inc | ||
77 | @@ -XXX,XX +XXX,XX @@ DO_VFP_2OP(VSQRT, hp, gen_VSQRT_hp) | ||
78 | DO_VFP_2OP(VSQRT, sp, gen_VSQRT_sp) | ||
79 | DO_VFP_2OP(VSQRT, dp, gen_VSQRT_dp) | ||
80 | |||
81 | +static bool trans_VCMP_hp(DisasContext *s, arg_VCMP_sp *a) | ||
82 | +{ | ||
83 | + TCGv_i32 vd, vm; | ||
84 | + | ||
85 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
86 | + return false; | ||
87 | + } | ||
88 | + | ||
89 | + /* Vm/M bits must be zero for the Z variant */ | ||
90 | + if (a->z && a->vm != 0) { | ||
91 | + return false; | ||
92 | + } | ||
93 | + | ||
94 | + if (!vfp_access_check(s)) { | ||
95 | + return true; | ||
96 | + } | ||
97 | + | ||
98 | + vd = tcg_temp_new_i32(); | ||
99 | + vm = tcg_temp_new_i32(); | ||
100 | + | ||
101 | + neon_load_reg32(vd, a->vd); | ||
102 | + if (a->z) { | ||
103 | + tcg_gen_movi_i32(vm, 0); | ||
104 | + } else { | ||
105 | + neon_load_reg32(vm, a->vm); | ||
106 | + } | ||
107 | + | ||
108 | + if (a->e) { | ||
109 | + gen_helper_vfp_cmpeh(vd, vm, cpu_env); | ||
110 | + } else { | ||
111 | + gen_helper_vfp_cmph(vd, vm, cpu_env); | ||
112 | + } | ||
113 | + | ||
114 | + tcg_temp_free_i32(vd); | ||
115 | + tcg_temp_free_i32(vm); | ||
116 | + | ||
117 | + return true; | ||
118 | +} | ||
119 | + | ||
120 | static bool trans_VCMP_sp(DisasContext *s, arg_VCMP_sp *a) | ||
121 | { | ||
122 | TCGv_i32 vd, vm; | ||
123 | -- | ||
124 | 2.20.1 | ||
125 | |||
126 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement the fp16 versions of the VFP VLDR/VSTR (immediate). |
---|---|---|---|
2 | 2 | ||
3 | A real Allwinner H3 SoC contains a Boot ROM which is the | 3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | first code that runs right after the SoC is powered on. | 4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | The Boot ROM is responsible for loading user code (e.g. a bootloader) | 5 | Message-id: 20200828183354.27913-12-peter.maydell@linaro.org |
6 | from any of the supported external devices and writing the downloaded | 6 | --- |
7 | code to internal SRAM. After loading the SoC begins executing the code | 7 | target/arm/vfp.decode | 3 +-- |
8 | written to SRAM. | 8 | target/arm/translate-vfp.c.inc | 35 ++++++++++++++++++++++++++++++++++ |
9 | 2 files changed, 36 insertions(+), 2 deletions(-) | ||
9 | 10 | ||
10 | This commits adds emulation of the Boot ROM firmware setup functionality | 11 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode |
11 | by loading user code from SD card in the A1 SRAM. While the A1 SRAM is | ||
12 | 64KiB, we limit the size to 32KiB because the real H3 Boot ROM also rejects | ||
13 | sizes larger than 32KiB. For reference, this behaviour is documented | ||
14 | by the Linux Sunxi project wiki at: | ||
15 | |||
16 | https://linux-sunxi.org/BROM#U-Boot_SPL_limitations | ||
17 | |||
18 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
19 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
20 | Message-id: 20200311221854.30370-11-nieklinnenbank@gmail.com | ||
21 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
22 | --- | ||
23 | include/hw/arm/allwinner-h3.h | 21 +++++++++++++++++++++ | ||
24 | hw/arm/allwinner-h3.c | 17 +++++++++++++++++ | ||
25 | hw/arm/orangepi.c | 5 +++++ | ||
26 | 3 files changed, 43 insertions(+) | ||
27 | |||
28 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | ||
29 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
30 | --- a/include/hw/arm/allwinner-h3.h | 13 | --- a/target/arm/vfp.decode |
31 | +++ b/include/hw/arm/allwinner-h3.h | 14 | +++ b/target/arm/vfp.decode |
32 | @@ -XXX,XX +XXX,XX @@ | 15 | @@ -XXX,XX +XXX,XX @@ VMOV_single ---- 1110 000 l:1 .... rt:4 1010 . 001 0000 vn=%vn_sp |
33 | #include "hw/sd/allwinner-sdhost.h" | 16 | VMOV_64_sp ---- 1100 010 op:1 rt2:4 rt:4 1010 00.1 .... vm=%vm_sp |
34 | #include "hw/net/allwinner-sun8i-emac.h" | 17 | VMOV_64_dp ---- 1100 010 op:1 rt2:4 rt:4 1011 00.1 .... vm=%vm_dp |
35 | #include "target/arm/cpu.h" | 18 | |
36 | +#include "sysemu/block-backend.h" | 19 | -# Note that the half-precision variants of VLDR and VSTR are |
37 | 20 | -# not part of this decodetree at all because they have bits [9:8] == 0b01 | |
38 | /** | 21 | +VLDR_VSTR_hp ---- 1101 u:1 .0 l:1 rn:4 .... 1001 imm:8 vd=%vd_sp |
39 | * Allwinner H3 device list | 22 | VLDR_VSTR_sp ---- 1101 u:1 .0 l:1 rn:4 .... 1010 imm:8 vd=%vd_sp |
40 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | 23 | VLDR_VSTR_dp ---- 1101 u:1 .0 l:1 rn:4 .... 1011 imm:8 vd=%vd_dp |
41 | MemoryRegion sram_c; | 24 | |
42 | } AwH3State; | 25 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
43 | 26 | index XXXXXXX..XXXXXXX 100644 | |
44 | +/** | 27 | --- a/target/arm/translate-vfp.c.inc |
45 | + * Emulate Boot ROM firmware setup functionality. | 28 | +++ b/target/arm/translate-vfp.c.inc |
46 | + * | 29 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMOV_64_dp(DisasContext *s, arg_VMOV_64_dp *a) |
47 | + * A real Allwinner H3 SoC contains a Boot ROM | 30 | return true; |
48 | + * which is the first code that runs right after | 31 | } |
49 | + * the SoC is powered on. The Boot ROM is responsible | 32 | |
50 | + * for loading user code (e.g. a bootloader) from any | 33 | +static bool trans_VLDR_VSTR_hp(DisasContext *s, arg_VLDR_VSTR_sp *a) |
51 | + * of the supported external devices and writing the | 34 | +{ |
52 | + * downloaded code to internal SRAM. After loading the SoC | 35 | + uint32_t offset; |
53 | + * begins executing the code written to SRAM. | 36 | + TCGv_i32 addr, tmp; |
54 | + * | ||
55 | + * This function emulates the Boot ROM by copying 32 KiB | ||
56 | + * of data from the given block device and writes it to | ||
57 | + * the start of the first internal SRAM memory. | ||
58 | + * | ||
59 | + * @s: Allwinner H3 state object pointer | ||
60 | + * @blk: Block backend device object pointer | ||
61 | + */ | ||
62 | +void allwinner_h3_bootrom_setup(AwH3State *s, BlockBackend *blk); | ||
63 | + | 37 | + |
64 | #endif /* HW_ARM_ALLWINNER_H3_H */ | 38 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
65 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | 39 | + return false; |
66 | index XXXXXXX..XXXXXXX 100644 | ||
67 | --- a/hw/arm/allwinner-h3.c | ||
68 | +++ b/hw/arm/allwinner-h3.c | ||
69 | @@ -XXX,XX +XXX,XX @@ | ||
70 | #include "hw/char/serial.h" | ||
71 | #include "hw/misc/unimp.h" | ||
72 | #include "hw/usb/hcd-ehci.h" | ||
73 | +#include "hw/loader.h" | ||
74 | #include "sysemu/sysemu.h" | ||
75 | #include "hw/arm/allwinner-h3.h" | ||
76 | |||
77 | @@ -XXX,XX +XXX,XX @@ enum { | ||
78 | AW_H3_GIC_NUM_SPI = 128 | ||
79 | }; | ||
80 | |||
81 | +void allwinner_h3_bootrom_setup(AwH3State *s, BlockBackend *blk) | ||
82 | +{ | ||
83 | + const int64_t rom_size = 32 * KiB; | ||
84 | + g_autofree uint8_t *buffer = g_new0(uint8_t, rom_size); | ||
85 | + | ||
86 | + if (blk_pread(blk, 8 * KiB, buffer, rom_size) < 0) { | ||
87 | + error_setg(&error_fatal, "%s: failed to read BlockBackend data", | ||
88 | + __func__); | ||
89 | + return; | ||
90 | + } | 40 | + } |
91 | + | 41 | + |
92 | + rom_add_blob("allwinner-h3.bootrom", buffer, rom_size, | 42 | + if (!vfp_access_check(s)) { |
93 | + rom_size, s->memmap[AW_H3_SRAM_A1], | 43 | + return true; |
94 | + NULL, NULL, NULL, NULL, false); | 44 | + } |
45 | + | ||
46 | + /* imm8 field is offset/2 for fp16, unlike fp32 and fp64 */ | ||
47 | + offset = a->imm << 1; | ||
48 | + if (!a->u) { | ||
49 | + offset = -offset; | ||
50 | + } | ||
51 | + | ||
52 | + /* For thumb, use of PC is UNPREDICTABLE. */ | ||
53 | + addr = add_reg_for_lit(s, a->rn, offset); | ||
54 | + tmp = tcg_temp_new_i32(); | ||
55 | + if (a->l) { | ||
56 | + gen_aa32_ld16u(s, tmp, addr, get_mem_index(s)); | ||
57 | + neon_store_reg32(tmp, a->vd); | ||
58 | + } else { | ||
59 | + neon_load_reg32(tmp, a->vd); | ||
60 | + gen_aa32_st16(s, tmp, addr, get_mem_index(s)); | ||
61 | + } | ||
62 | + tcg_temp_free_i32(tmp); | ||
63 | + tcg_temp_free_i32(addr); | ||
64 | + | ||
65 | + return true; | ||
95 | +} | 66 | +} |
96 | + | 67 | + |
97 | static void allwinner_h3_init(Object *obj) | 68 | static bool trans_VLDR_VSTR_sp(DisasContext *s, arg_VLDR_VSTR_sp *a) |
98 | { | 69 | { |
99 | AwH3State *s = AW_H3(obj); | 70 | uint32_t offset; |
100 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | ||
101 | index XXXXXXX..XXXXXXX 100644 | ||
102 | --- a/hw/arm/orangepi.c | ||
103 | +++ b/hw/arm/orangepi.c | ||
104 | @@ -XXX,XX +XXX,XX @@ static void orangepi_init(MachineState *machine) | ||
105 | memory_region_add_subregion(get_system_memory(), h3->memmap[AW_H3_SDRAM], | ||
106 | machine->ram); | ||
107 | |||
108 | + /* Load target kernel or start using BootROM */ | ||
109 | + if (!machine->kernel_filename && blk_is_available(blk)) { | ||
110 | + /* Use Boot ROM to copy data from SD card to SRAM */ | ||
111 | + allwinner_h3_bootrom_setup(h3, blk); | ||
112 | + } | ||
113 | orangepi_binfo.loader_start = h3->memmap[AW_H3_SDRAM]; | ||
114 | orangepi_binfo.ram_size = machine->ram_size; | ||
115 | arm_load_kernel(ARM_CPU(first_cpu), machine, &orangepi_binfo); | ||
116 | -- | 71 | -- |
117 | 2.20.1 | 72 | 2.20.1 |
118 | 73 | ||
119 | 74 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement the fp16 versions of the VFP VCVT instruction forms which |
---|---|---|---|
2 | convert between floating point and integer. | ||
2 | 3 | ||
3 | The Allwinner H3 is a System on Chip containing four ARM Cortex A7 | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | processor cores. Features and specifications include DDR2/DDR3 memory, | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | SD/MMC storage cards, 10/100/1000Mbit Ethernet, USB 2.0, HDMI and | 6 | Message-id: 20200828183354.27913-13-peter.maydell@linaro.org |
6 | various I/O modules. This commit adds support for the Allwinner H3 | 7 | --- |
7 | System on Chip. | 8 | target/arm/vfp.decode | 4 +++ |
9 | target/arm/translate-vfp.c.inc | 65 ++++++++++++++++++++++++++++++++++ | ||
10 | 2 files changed, 69 insertions(+) | ||
8 | 11 | ||
9 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 12 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode |
10 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
11 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
12 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
13 | Message-id: 20200311221854.30370-2-nieklinnenbank@gmail.com | ||
14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
15 | --- | ||
16 | hw/arm/Makefile.objs | 1 + | ||
17 | include/hw/arm/allwinner-h3.h | 106 +++++++++++ | ||
18 | hw/arm/allwinner-h3.c | 327 ++++++++++++++++++++++++++++++++ | ||
19 | MAINTAINERS | 7 + | ||
20 | default-configs/arm-softmmu.mak | 1 + | ||
21 | hw/arm/Kconfig | 8 + | ||
22 | 6 files changed, 450 insertions(+) | ||
23 | create mode 100644 include/hw/arm/allwinner-h3.h | ||
24 | create mode 100644 hw/arm/allwinner-h3.c | ||
25 | |||
26 | diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs | ||
27 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
28 | --- a/hw/arm/Makefile.objs | 14 | --- a/target/arm/vfp.decode |
29 | +++ b/hw/arm/Makefile.objs | 15 | +++ b/target/arm/vfp.decode |
30 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_DIGIC) += digic.o | 16 | @@ -XXX,XX +XXX,XX @@ VCVT_sp ---- 1110 1.11 0111 .... 1010 11.0 .... @vfp_dm_ds |
31 | obj-$(CONFIG_OMAP) += omap1.o omap2.o | 17 | VCVT_dp ---- 1110 1.11 0111 .... 1011 11.0 .... @vfp_dm_sd |
32 | obj-$(CONFIG_STRONGARM) += strongarm.o | 18 | |
33 | obj-$(CONFIG_ALLWINNER_A10) += allwinner-a10.o cubieboard.o | 19 | # VCVT from integer to floating point: Vm always single; Vd depends on size |
34 | +obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3.o | 20 | +VCVT_int_hp ---- 1110 1.11 1000 .... 1001 s:1 1.0 .... \ |
35 | obj-$(CONFIG_RASPI) += bcm2835_peripherals.o bcm2836.o raspi.o | 21 | + vd=%vd_sp vm=%vm_sp |
36 | obj-$(CONFIG_STM32F205_SOC) += stm32f205_soc.o | 22 | VCVT_int_sp ---- 1110 1.11 1000 .... 1010 s:1 1.0 .... \ |
37 | obj-$(CONFIG_STM32F405_SOC) += stm32f405_soc.o | 23 | vd=%vd_sp vm=%vm_sp |
38 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 24 | VCVT_int_dp ---- 1110 1.11 1000 .... 1011 s:1 1.0 .... \ |
39 | new file mode 100644 | 25 | @@ -XXX,XX +XXX,XX @@ VCVT_fix_dp ---- 1110 1.11 1.1. .... 1011 .1.0 .... \ |
40 | index XXXXXXX..XXXXXXX | 26 | vd=%vd_dp imm=%vm_sp opc=%vcvt_fix_op |
41 | --- /dev/null | 27 | |
42 | +++ b/include/hw/arm/allwinner-h3.h | 28 | # VCVT float to integer (VCVT and VCVTR): Vd always single; Vd depends on size |
43 | @@ -XXX,XX +XXX,XX @@ | 29 | +VCVT_hp_int ---- 1110 1.11 110 s:1 .... 1001 rz:1 1.0 .... \ |
44 | +/* | 30 | + vd=%vd_sp vm=%vm_sp |
45 | + * Allwinner H3 System on Chip emulation | 31 | VCVT_sp_int ---- 1110 1.11 110 s:1 .... 1010 rz:1 1.0 .... \ |
46 | + * | 32 | vd=%vd_sp vm=%vm_sp |
47 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | 33 | VCVT_dp_int ---- 1110 1.11 110 s:1 .... 1011 rz:1 1.0 .... \ |
48 | + * | 34 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
49 | + * This program is free software: you can redistribute it and/or modify | 35 | index XXXXXXX..XXXXXXX 100644 |
50 | + * it under the terms of the GNU General Public License as published by | 36 | --- a/target/arm/translate-vfp.c.inc |
51 | + * the Free Software Foundation, either version 2 of the License, or | 37 | +++ b/target/arm/translate-vfp.c.inc |
52 | + * (at your option) any later version. | 38 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_dp(DisasContext *s, arg_VCVT_dp *a) |
53 | + * | 39 | return true; |
54 | + * This program is distributed in the hope that it will be useful, | 40 | } |
55 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | 41 | |
56 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | 42 | +static bool trans_VCVT_int_hp(DisasContext *s, arg_VCVT_int_sp *a) |
57 | + * GNU General Public License for more details. | 43 | +{ |
58 | + * | 44 | + TCGv_i32 vm; |
59 | + * You should have received a copy of the GNU General Public License | 45 | + TCGv_ptr fpst; |
60 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
61 | + */ | ||
62 | + | 46 | + |
63 | +/* | 47 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
64 | + * The Allwinner H3 is a System on Chip containing four ARM Cortex A7 | 48 | + return false; |
65 | + * processor cores. Features and specifications include DDR2/DDR3 memory, | ||
66 | + * SD/MMC storage cards, 10/100/1000Mbit Ethernet, USB 2.0, HDMI and | ||
67 | + * various I/O modules. | ||
68 | + * | ||
69 | + * This implementation is based on the following datasheet: | ||
70 | + * | ||
71 | + * https://linux-sunxi.org/File:Allwinner_H3_Datasheet_V1.2.pdf | ||
72 | + * | ||
73 | + * The latest datasheet and more info can be found on the Linux Sunxi wiki: | ||
74 | + * | ||
75 | + * https://linux-sunxi.org/H3 | ||
76 | + */ | ||
77 | + | ||
78 | +#ifndef HW_ARM_ALLWINNER_H3_H | ||
79 | +#define HW_ARM_ALLWINNER_H3_H | ||
80 | + | ||
81 | +#include "qom/object.h" | ||
82 | +#include "hw/arm/boot.h" | ||
83 | +#include "hw/timer/allwinner-a10-pit.h" | ||
84 | +#include "hw/intc/arm_gic.h" | ||
85 | +#include "target/arm/cpu.h" | ||
86 | + | ||
87 | +/** | ||
88 | + * Allwinner H3 device list | ||
89 | + * | ||
90 | + * This enumeration is can be used refer to a particular device in the | ||
91 | + * Allwinner H3 SoC. For example, the physical memory base address for | ||
92 | + * each device can be found in the AwH3State object in the memmap member | ||
93 | + * using the device enum value as index. | ||
94 | + * | ||
95 | + * @see AwH3State | ||
96 | + */ | ||
97 | +enum { | ||
98 | + AW_H3_SRAM_A1, | ||
99 | + AW_H3_SRAM_A2, | ||
100 | + AW_H3_SRAM_C, | ||
101 | + AW_H3_PIT, | ||
102 | + AW_H3_UART0, | ||
103 | + AW_H3_UART1, | ||
104 | + AW_H3_UART2, | ||
105 | + AW_H3_UART3, | ||
106 | + AW_H3_GIC_DIST, | ||
107 | + AW_H3_GIC_CPU, | ||
108 | + AW_H3_GIC_HYP, | ||
109 | + AW_H3_GIC_VCPU, | ||
110 | + AW_H3_SDRAM | ||
111 | +}; | ||
112 | + | ||
113 | +/** Total number of CPU cores in the H3 SoC */ | ||
114 | +#define AW_H3_NUM_CPUS (4) | ||
115 | + | ||
116 | +/** | ||
117 | + * Allwinner H3 object model | ||
118 | + * @{ | ||
119 | + */ | ||
120 | + | ||
121 | +/** Object type for the Allwinner H3 SoC */ | ||
122 | +#define TYPE_AW_H3 "allwinner-h3" | ||
123 | + | ||
124 | +/** Convert input object to Allwinner H3 state object */ | ||
125 | +#define AW_H3(obj) OBJECT_CHECK(AwH3State, (obj), TYPE_AW_H3) | ||
126 | + | ||
127 | +/** @} */ | ||
128 | + | ||
129 | +/** | ||
130 | + * Allwinner H3 object | ||
131 | + * | ||
132 | + * This struct contains the state of all the devices | ||
133 | + * which are currently emulated by the H3 SoC code. | ||
134 | + */ | ||
135 | +typedef struct AwH3State { | ||
136 | + /*< private >*/ | ||
137 | + DeviceState parent_obj; | ||
138 | + /*< public >*/ | ||
139 | + | ||
140 | + ARMCPU cpus[AW_H3_NUM_CPUS]; | ||
141 | + const hwaddr *memmap; | ||
142 | + AwA10PITState timer; | ||
143 | + GICState gic; | ||
144 | + MemoryRegion sram_a1; | ||
145 | + MemoryRegion sram_a2; | ||
146 | + MemoryRegion sram_c; | ||
147 | +} AwH3State; | ||
148 | + | ||
149 | +#endif /* HW_ARM_ALLWINNER_H3_H */ | ||
150 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
151 | new file mode 100644 | ||
152 | index XXXXXXX..XXXXXXX | ||
153 | --- /dev/null | ||
154 | +++ b/hw/arm/allwinner-h3.c | ||
155 | @@ -XXX,XX +XXX,XX @@ | ||
156 | +/* | ||
157 | + * Allwinner H3 System on Chip emulation | ||
158 | + * | ||
159 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
160 | + * | ||
161 | + * This program is free software: you can redistribute it and/or modify | ||
162 | + * it under the terms of the GNU General Public License as published by | ||
163 | + * the Free Software Foundation, either version 2 of the License, or | ||
164 | + * (at your option) any later version. | ||
165 | + * | ||
166 | + * This program is distributed in the hope that it will be useful, | ||
167 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
168 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
169 | + * GNU General Public License for more details. | ||
170 | + * | ||
171 | + * You should have received a copy of the GNU General Public License | ||
172 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
173 | + */ | ||
174 | + | ||
175 | +#include "qemu/osdep.h" | ||
176 | +#include "exec/address-spaces.h" | ||
177 | +#include "qapi/error.h" | ||
178 | +#include "qemu/error-report.h" | ||
179 | +#include "qemu/module.h" | ||
180 | +#include "qemu/units.h" | ||
181 | +#include "hw/qdev-core.h" | ||
182 | +#include "cpu.h" | ||
183 | +#include "hw/sysbus.h" | ||
184 | +#include "hw/char/serial.h" | ||
185 | +#include "hw/misc/unimp.h" | ||
186 | +#include "sysemu/sysemu.h" | ||
187 | +#include "hw/arm/allwinner-h3.h" | ||
188 | + | ||
189 | +/* Memory map */ | ||
190 | +const hwaddr allwinner_h3_memmap[] = { | ||
191 | + [AW_H3_SRAM_A1] = 0x00000000, | ||
192 | + [AW_H3_SRAM_A2] = 0x00044000, | ||
193 | + [AW_H3_SRAM_C] = 0x00010000, | ||
194 | + [AW_H3_PIT] = 0x01c20c00, | ||
195 | + [AW_H3_UART0] = 0x01c28000, | ||
196 | + [AW_H3_UART1] = 0x01c28400, | ||
197 | + [AW_H3_UART2] = 0x01c28800, | ||
198 | + [AW_H3_UART3] = 0x01c28c00, | ||
199 | + [AW_H3_GIC_DIST] = 0x01c81000, | ||
200 | + [AW_H3_GIC_CPU] = 0x01c82000, | ||
201 | + [AW_H3_GIC_HYP] = 0x01c84000, | ||
202 | + [AW_H3_GIC_VCPU] = 0x01c86000, | ||
203 | + [AW_H3_SDRAM] = 0x40000000 | ||
204 | +}; | ||
205 | + | ||
206 | +/* List of unimplemented devices */ | ||
207 | +struct AwH3Unimplemented { | ||
208 | + const char *device_name; | ||
209 | + hwaddr base; | ||
210 | + hwaddr size; | ||
211 | +} unimplemented[] = { | ||
212 | + { "d-engine", 0x01000000, 4 * MiB }, | ||
213 | + { "d-inter", 0x01400000, 128 * KiB }, | ||
214 | + { "syscon", 0x01c00000, 4 * KiB }, | ||
215 | + { "dma", 0x01c02000, 4 * KiB }, | ||
216 | + { "nfdc", 0x01c03000, 4 * KiB }, | ||
217 | + { "ts", 0x01c06000, 4 * KiB }, | ||
218 | + { "keymem", 0x01c0b000, 4 * KiB }, | ||
219 | + { "lcd0", 0x01c0c000, 4 * KiB }, | ||
220 | + { "lcd1", 0x01c0d000, 4 * KiB }, | ||
221 | + { "ve", 0x01c0e000, 4 * KiB }, | ||
222 | + { "mmc0", 0x01c0f000, 4 * KiB }, | ||
223 | + { "mmc1", 0x01c10000, 4 * KiB }, | ||
224 | + { "mmc2", 0x01c11000, 4 * KiB }, | ||
225 | + { "sid", 0x01c14000, 1 * KiB }, | ||
226 | + { "crypto", 0x01c15000, 4 * KiB }, | ||
227 | + { "msgbox", 0x01c17000, 4 * KiB }, | ||
228 | + { "spinlock", 0x01c18000, 4 * KiB }, | ||
229 | + { "usb0-otg", 0x01c19000, 4 * KiB }, | ||
230 | + { "usb0-phy", 0x01c1a000, 4 * KiB }, | ||
231 | + { "usb1-phy", 0x01c1b000, 4 * KiB }, | ||
232 | + { "usb2-phy", 0x01c1c000, 4 * KiB }, | ||
233 | + { "usb3-phy", 0x01c1d000, 4 * KiB }, | ||
234 | + { "smc", 0x01c1e000, 4 * KiB }, | ||
235 | + { "ccu", 0x01c20000, 1 * KiB }, | ||
236 | + { "pio", 0x01c20800, 1 * KiB }, | ||
237 | + { "owa", 0x01c21000, 1 * KiB }, | ||
238 | + { "pwm", 0x01c21400, 1 * KiB }, | ||
239 | + { "keyadc", 0x01c21800, 1 * KiB }, | ||
240 | + { "pcm0", 0x01c22000, 1 * KiB }, | ||
241 | + { "pcm1", 0x01c22400, 1 * KiB }, | ||
242 | + { "pcm2", 0x01c22800, 1 * KiB }, | ||
243 | + { "audio", 0x01c22c00, 2 * KiB }, | ||
244 | + { "smta", 0x01c23400, 1 * KiB }, | ||
245 | + { "ths", 0x01c25000, 1 * KiB }, | ||
246 | + { "uart0", 0x01c28000, 1 * KiB }, | ||
247 | + { "uart1", 0x01c28400, 1 * KiB }, | ||
248 | + { "uart2", 0x01c28800, 1 * KiB }, | ||
249 | + { "uart3", 0x01c28c00, 1 * KiB }, | ||
250 | + { "twi0", 0x01c2ac00, 1 * KiB }, | ||
251 | + { "twi1", 0x01c2b000, 1 * KiB }, | ||
252 | + { "twi2", 0x01c2b400, 1 * KiB }, | ||
253 | + { "scr", 0x01c2c400, 1 * KiB }, | ||
254 | + { "emac", 0x01c30000, 64 * KiB }, | ||
255 | + { "gpu", 0x01c40000, 64 * KiB }, | ||
256 | + { "hstmr", 0x01c60000, 4 * KiB }, | ||
257 | + { "dramcom", 0x01c62000, 4 * KiB }, | ||
258 | + { "dramctl0", 0x01c63000, 4 * KiB }, | ||
259 | + { "dramphy0", 0x01c65000, 4 * KiB }, | ||
260 | + { "spi0", 0x01c68000, 4 * KiB }, | ||
261 | + { "spi1", 0x01c69000, 4 * KiB }, | ||
262 | + { "csi", 0x01cb0000, 320 * KiB }, | ||
263 | + { "tve", 0x01e00000, 64 * KiB }, | ||
264 | + { "hdmi", 0x01ee0000, 128 * KiB }, | ||
265 | + { "rtc", 0x01f00000, 1 * KiB }, | ||
266 | + { "r_timer", 0x01f00800, 1 * KiB }, | ||
267 | + { "r_intc", 0x01f00c00, 1 * KiB }, | ||
268 | + { "r_wdog", 0x01f01000, 1 * KiB }, | ||
269 | + { "r_prcm", 0x01f01400, 1 * KiB }, | ||
270 | + { "r_twd", 0x01f01800, 1 * KiB }, | ||
271 | + { "r_cpucfg", 0x01f01c00, 1 * KiB }, | ||
272 | + { "r_cir-rx", 0x01f02000, 1 * KiB }, | ||
273 | + { "r_twi", 0x01f02400, 1 * KiB }, | ||
274 | + { "r_uart", 0x01f02800, 1 * KiB }, | ||
275 | + { "r_pio", 0x01f02c00, 1 * KiB }, | ||
276 | + { "r_pwm", 0x01f03800, 1 * KiB }, | ||
277 | + { "core-dbg", 0x3f500000, 128 * KiB }, | ||
278 | + { "tsgen-ro", 0x3f506000, 4 * KiB }, | ||
279 | + { "tsgen-ctl", 0x3f507000, 4 * KiB }, | ||
280 | + { "ddr-mem", 0x40000000, 2 * GiB }, | ||
281 | + { "n-brom", 0xffff0000, 32 * KiB }, | ||
282 | + { "s-brom", 0xffff0000, 64 * KiB } | ||
283 | +}; | ||
284 | + | ||
285 | +/* Per Processor Interrupts */ | ||
286 | +enum { | ||
287 | + AW_H3_GIC_PPI_MAINT = 9, | ||
288 | + AW_H3_GIC_PPI_HYPTIMER = 10, | ||
289 | + AW_H3_GIC_PPI_VIRTTIMER = 11, | ||
290 | + AW_H3_GIC_PPI_SECTIMER = 13, | ||
291 | + AW_H3_GIC_PPI_PHYSTIMER = 14 | ||
292 | +}; | ||
293 | + | ||
294 | +/* Shared Processor Interrupts */ | ||
295 | +enum { | ||
296 | + AW_H3_GIC_SPI_UART0 = 0, | ||
297 | + AW_H3_GIC_SPI_UART1 = 1, | ||
298 | + AW_H3_GIC_SPI_UART2 = 2, | ||
299 | + AW_H3_GIC_SPI_UART3 = 3, | ||
300 | + AW_H3_GIC_SPI_TIMER0 = 18, | ||
301 | + AW_H3_GIC_SPI_TIMER1 = 19, | ||
302 | +}; | ||
303 | + | ||
304 | +/* Allwinner H3 general constants */ | ||
305 | +enum { | ||
306 | + AW_H3_GIC_NUM_SPI = 128 | ||
307 | +}; | ||
308 | + | ||
309 | +static void allwinner_h3_init(Object *obj) | ||
310 | +{ | ||
311 | + AwH3State *s = AW_H3(obj); | ||
312 | + | ||
313 | + s->memmap = allwinner_h3_memmap; | ||
314 | + | ||
315 | + for (int i = 0; i < AW_H3_NUM_CPUS; i++) { | ||
316 | + object_initialize_child(obj, "cpu[*]", &s->cpus[i], sizeof(s->cpus[i]), | ||
317 | + ARM_CPU_TYPE_NAME("cortex-a7"), | ||
318 | + &error_abort, NULL); | ||
319 | + } | 49 | + } |
320 | + | 50 | + |
321 | + sysbus_init_child_obj(obj, "gic", &s->gic, sizeof(s->gic), | 51 | + if (!vfp_access_check(s)) { |
322 | + TYPE_ARM_GIC); | 52 | + return true; |
53 | + } | ||
323 | + | 54 | + |
324 | + sysbus_init_child_obj(obj, "timer", &s->timer, sizeof(s->timer), | 55 | + vm = tcg_temp_new_i32(); |
325 | + TYPE_AW_A10_PIT); | 56 | + neon_load_reg32(vm, a->vm); |
326 | + object_property_add_alias(obj, "clk0-freq", OBJECT(&s->timer), | 57 | + fpst = fpstatus_ptr(FPST_FPCR_F16); |
327 | + "clk0-freq", &error_abort); | 58 | + if (a->s) { |
328 | + object_property_add_alias(obj, "clk1-freq", OBJECT(&s->timer), | 59 | + /* i32 -> f16 */ |
329 | + "clk1-freq", &error_abort); | 60 | + gen_helper_vfp_sitoh(vm, vm, fpst); |
61 | + } else { | ||
62 | + /* u32 -> f16 */ | ||
63 | + gen_helper_vfp_uitoh(vm, vm, fpst); | ||
64 | + } | ||
65 | + neon_store_reg32(vm, a->vd); | ||
66 | + tcg_temp_free_i32(vm); | ||
67 | + tcg_temp_free_ptr(fpst); | ||
68 | + return true; | ||
330 | +} | 69 | +} |
331 | + | 70 | + |
332 | +static void allwinner_h3_realize(DeviceState *dev, Error **errp) | 71 | static bool trans_VCVT_int_sp(DisasContext *s, arg_VCVT_int_sp *a) |
72 | { | ||
73 | TCGv_i32 vm; | ||
74 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_fix_dp(DisasContext *s, arg_VCVT_fix_dp *a) | ||
75 | return true; | ||
76 | } | ||
77 | |||
78 | +static bool trans_VCVT_hp_int(DisasContext *s, arg_VCVT_sp_int *a) | ||
333 | +{ | 79 | +{ |
334 | + AwH3State *s = AW_H3(dev); | 80 | + TCGv_i32 vm; |
335 | + unsigned i; | 81 | + TCGv_ptr fpst; |
336 | + | 82 | + |
337 | + /* CPUs */ | 83 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
338 | + for (i = 0; i < AW_H3_NUM_CPUS; i++) { | 84 | + return false; |
339 | + | ||
340 | + /* Provide Power State Coordination Interface */ | ||
341 | + qdev_prop_set_int32(DEVICE(&s->cpus[i]), "psci-conduit", | ||
342 | + QEMU_PSCI_CONDUIT_HVC); | ||
343 | + | ||
344 | + /* Disable secondary CPUs */ | ||
345 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "start-powered-off", | ||
346 | + i > 0); | ||
347 | + | ||
348 | + /* All exception levels required */ | ||
349 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "has_el3", true); | ||
350 | + qdev_prop_set_bit(DEVICE(&s->cpus[i]), "has_el2", true); | ||
351 | + | ||
352 | + /* Mark realized */ | ||
353 | + qdev_init_nofail(DEVICE(&s->cpus[i])); | ||
354 | + } | 85 | + } |
355 | + | 86 | + |
356 | + /* Generic Interrupt Controller */ | 87 | + if (!vfp_access_check(s)) { |
357 | + qdev_prop_set_uint32(DEVICE(&s->gic), "num-irq", AW_H3_GIC_NUM_SPI + | 88 | + return true; |
358 | + GIC_INTERNAL); | ||
359 | + qdev_prop_set_uint32(DEVICE(&s->gic), "revision", 2); | ||
360 | + qdev_prop_set_uint32(DEVICE(&s->gic), "num-cpu", AW_H3_NUM_CPUS); | ||
361 | + qdev_prop_set_bit(DEVICE(&s->gic), "has-security-extensions", false); | ||
362 | + qdev_prop_set_bit(DEVICE(&s->gic), "has-virtualization-extensions", true); | ||
363 | + qdev_init_nofail(DEVICE(&s->gic)); | ||
364 | + | ||
365 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 0, s->memmap[AW_H3_GIC_DIST]); | ||
366 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 1, s->memmap[AW_H3_GIC_CPU]); | ||
367 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 2, s->memmap[AW_H3_GIC_HYP]); | ||
368 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->gic), 3, s->memmap[AW_H3_GIC_VCPU]); | ||
369 | + | ||
370 | + /* | ||
371 | + * Wire the outputs from each CPU's generic timer and the GICv3 | ||
372 | + * maintenance interrupt signal to the appropriate GIC PPI inputs, | ||
373 | + * and the GIC's IRQ/FIQ/VIRQ/VFIQ interrupt outputs to the CPU's inputs. | ||
374 | + */ | ||
375 | + for (i = 0; i < AW_H3_NUM_CPUS; i++) { | ||
376 | + DeviceState *cpudev = DEVICE(&s->cpus[i]); | ||
377 | + int ppibase = AW_H3_GIC_NUM_SPI + i * GIC_INTERNAL + GIC_NR_SGIS; | ||
378 | + int irq; | ||
379 | + /* | ||
380 | + * Mapping from the output timer irq lines from the CPU to the | ||
381 | + * GIC PPI inputs used for this board. | ||
382 | + */ | ||
383 | + const int timer_irq[] = { | ||
384 | + [GTIMER_PHYS] = AW_H3_GIC_PPI_PHYSTIMER, | ||
385 | + [GTIMER_VIRT] = AW_H3_GIC_PPI_VIRTTIMER, | ||
386 | + [GTIMER_HYP] = AW_H3_GIC_PPI_HYPTIMER, | ||
387 | + [GTIMER_SEC] = AW_H3_GIC_PPI_SECTIMER, | ||
388 | + }; | ||
389 | + | ||
390 | + /* Connect CPU timer outputs to GIC PPI inputs */ | ||
391 | + for (irq = 0; irq < ARRAY_SIZE(timer_irq); irq++) { | ||
392 | + qdev_connect_gpio_out(cpudev, irq, | ||
393 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
394 | + ppibase + timer_irq[irq])); | ||
395 | + } | ||
396 | + | ||
397 | + /* Connect GIC outputs to CPU interrupt inputs */ | ||
398 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i, | ||
399 | + qdev_get_gpio_in(cpudev, ARM_CPU_IRQ)); | ||
400 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + AW_H3_NUM_CPUS, | ||
401 | + qdev_get_gpio_in(cpudev, ARM_CPU_FIQ)); | ||
402 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (2 * AW_H3_NUM_CPUS), | ||
403 | + qdev_get_gpio_in(cpudev, ARM_CPU_VIRQ)); | ||
404 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (3 * AW_H3_NUM_CPUS), | ||
405 | + qdev_get_gpio_in(cpudev, ARM_CPU_VFIQ)); | ||
406 | + | ||
407 | + /* GIC maintenance signal */ | ||
408 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->gic), i + (4 * AW_H3_NUM_CPUS), | ||
409 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
410 | + ppibase + AW_H3_GIC_PPI_MAINT)); | ||
411 | + } | 89 | + } |
412 | + | 90 | + |
413 | + /* Timer */ | 91 | + fpst = fpstatus_ptr(FPST_FPCR_F16); |
414 | + qdev_init_nofail(DEVICE(&s->timer)); | 92 | + vm = tcg_temp_new_i32(); |
415 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->timer), 0, s->memmap[AW_H3_PIT]); | 93 | + neon_load_reg32(vm, a->vm); |
416 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer), 0, | ||
417 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_TIMER0)); | ||
418 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer), 1, | ||
419 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_TIMER1)); | ||
420 | + | 94 | + |
421 | + /* SRAM */ | 95 | + if (a->s) { |
422 | + memory_region_init_ram(&s->sram_a1, OBJECT(dev), "sram A1", | 96 | + if (a->rz) { |
423 | + 64 * KiB, &error_abort); | 97 | + gen_helper_vfp_tosizh(vm, vm, fpst); |
424 | + memory_region_init_ram(&s->sram_a2, OBJECT(dev), "sram A2", | 98 | + } else { |
425 | + 32 * KiB, &error_abort); | 99 | + gen_helper_vfp_tosih(vm, vm, fpst); |
426 | + memory_region_init_ram(&s->sram_c, OBJECT(dev), "sram C", | 100 | + } |
427 | + 44 * KiB, &error_abort); | 101 | + } else { |
428 | + memory_region_add_subregion(get_system_memory(), s->memmap[AW_H3_SRAM_A1], | 102 | + if (a->rz) { |
429 | + &s->sram_a1); | 103 | + gen_helper_vfp_touizh(vm, vm, fpst); |
430 | + memory_region_add_subregion(get_system_memory(), s->memmap[AW_H3_SRAM_A2], | 104 | + } else { |
431 | + &s->sram_a2); | 105 | + gen_helper_vfp_touih(vm, vm, fpst); |
432 | + memory_region_add_subregion(get_system_memory(), s->memmap[AW_H3_SRAM_C], | 106 | + } |
433 | + &s->sram_c); | ||
434 | + | ||
435 | + /* UART0. For future clocktree API: All UARTS are connected to APB2_CLK. */ | ||
436 | + serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART0], 2, | ||
437 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART0), | ||
438 | + 115200, serial_hd(0), DEVICE_NATIVE_ENDIAN); | ||
439 | + /* UART1 */ | ||
440 | + serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART1], 2, | ||
441 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART1), | ||
442 | + 115200, serial_hd(1), DEVICE_NATIVE_ENDIAN); | ||
443 | + /* UART2 */ | ||
444 | + serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART2], 2, | ||
445 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART2), | ||
446 | + 115200, serial_hd(2), DEVICE_NATIVE_ENDIAN); | ||
447 | + /* UART3 */ | ||
448 | + serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART3], 2, | ||
449 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART3), | ||
450 | + 115200, serial_hd(3), DEVICE_NATIVE_ENDIAN); | ||
451 | + | ||
452 | + /* Unimplemented devices */ | ||
453 | + for (i = 0; i < ARRAY_SIZE(unimplemented); i++) { | ||
454 | + create_unimplemented_device(unimplemented[i].device_name, | ||
455 | + unimplemented[i].base, | ||
456 | + unimplemented[i].size); | ||
457 | + } | 107 | + } |
108 | + neon_store_reg32(vm, a->vd); | ||
109 | + tcg_temp_free_i32(vm); | ||
110 | + tcg_temp_free_ptr(fpst); | ||
111 | + return true; | ||
458 | +} | 112 | +} |
459 | + | 113 | + |
460 | +static void allwinner_h3_class_init(ObjectClass *oc, void *data) | 114 | static bool trans_VCVT_sp_int(DisasContext *s, arg_VCVT_sp_int *a) |
461 | +{ | 115 | { |
462 | + DeviceClass *dc = DEVICE_CLASS(oc); | 116 | TCGv_i32 vm; |
463 | + | ||
464 | + dc->realize = allwinner_h3_realize; | ||
465 | + /* Reason: uses serial_hd() in realize function */ | ||
466 | + dc->user_creatable = false; | ||
467 | +} | ||
468 | + | ||
469 | +static const TypeInfo allwinner_h3_type_info = { | ||
470 | + .name = TYPE_AW_H3, | ||
471 | + .parent = TYPE_DEVICE, | ||
472 | + .instance_size = sizeof(AwH3State), | ||
473 | + .instance_init = allwinner_h3_init, | ||
474 | + .class_init = allwinner_h3_class_init, | ||
475 | +}; | ||
476 | + | ||
477 | +static void allwinner_h3_register_types(void) | ||
478 | +{ | ||
479 | + type_register_static(&allwinner_h3_type_info); | ||
480 | +} | ||
481 | + | ||
482 | +type_init(allwinner_h3_register_types) | ||
483 | diff --git a/MAINTAINERS b/MAINTAINERS | ||
484 | index XXXXXXX..XXXXXXX 100644 | ||
485 | --- a/MAINTAINERS | ||
486 | +++ b/MAINTAINERS | ||
487 | @@ -XXX,XX +XXX,XX @@ F: hw/*/allwinner* | ||
488 | F: include/hw/*/allwinner* | ||
489 | F: hw/arm/cubieboard.c | ||
490 | |||
491 | +Allwinner-h3 | ||
492 | +M: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
493 | +L: qemu-arm@nongnu.org | ||
494 | +S: Maintained | ||
495 | +F: hw/*/allwinner-h3* | ||
496 | +F: include/hw/*/allwinner-h3* | ||
497 | + | ||
498 | ARM PrimeCell and CMSDK devices | ||
499 | M: Peter Maydell <peter.maydell@linaro.org> | ||
500 | L: qemu-arm@nongnu.org | ||
501 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak | ||
502 | index XXXXXXX..XXXXXXX 100644 | ||
503 | --- a/default-configs/arm-softmmu.mak | ||
504 | +++ b/default-configs/arm-softmmu.mak | ||
505 | @@ -XXX,XX +XXX,XX @@ CONFIG_FSL_IMX25=y | ||
506 | CONFIG_FSL_IMX7=y | ||
507 | CONFIG_FSL_IMX6UL=y | ||
508 | CONFIG_SEMIHOSTING=y | ||
509 | +CONFIG_ALLWINNER_H3=y | ||
510 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
511 | index XXXXXXX..XXXXXXX 100644 | ||
512 | --- a/hw/arm/Kconfig | ||
513 | +++ b/hw/arm/Kconfig | ||
514 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_A10 | ||
515 | select SERIAL | ||
516 | select UNIMP | ||
517 | |||
518 | +config ALLWINNER_H3 | ||
519 | + bool | ||
520 | + select ALLWINNER_A10_PIT | ||
521 | + select SERIAL | ||
522 | + select ARM_TIMER | ||
523 | + select ARM_GIC | ||
524 | + select UNIMP | ||
525 | + | ||
526 | config RASPI | ||
527 | bool | ||
528 | select FRAMEBUFFER | ||
529 | -- | 117 | -- |
530 | 2.20.1 | 118 | 2.20.1 |
531 | 119 | ||
532 | 120 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Currently the VFP_CONV_FIX macros take a single fsz argument for the | ||
2 | size of the float type, which is used both to select the name of | ||
3 | the functions to call (eg float32_is_any_nan()) and also for the | ||
4 | type to use for the float inputs and outputs (eg float32). | ||
1 | 5 | ||
6 | Separate these into fsz and ftype arguments, so that we can use them | ||
7 | for fp16, which uses 'float16' in the function names but is still | ||
8 | passing inputs and outputs in a 32-bit sized type. | ||
9 | |||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
12 | Message-id: 20200828183354.27913-14-peter.maydell@linaro.org | ||
13 | --- | ||
14 | target/arm/vfp_helper.c | 46 ++++++++++++++++++++--------------------- | ||
15 | 1 file changed, 23 insertions(+), 23 deletions(-) | ||
16 | |||
17 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
18 | index XXXXXXX..XXXXXXX 100644 | ||
19 | --- a/target/arm/vfp_helper.c | ||
20 | +++ b/target/arm/vfp_helper.c | ||
21 | @@ -XXX,XX +XXX,XX @@ float32 VFP_HELPER(fcvts, d)(float64 x, CPUARMState *env) | ||
22 | } | ||
23 | |||
24 | /* VFP3 fixed point conversion. */ | ||
25 | -#define VFP_CONV_FIX_FLOAT(name, p, fsz, isz, itype) \ | ||
26 | -float##fsz HELPER(vfp_##name##to##p)(uint##isz##_t x, uint32_t shift, \ | ||
27 | +#define VFP_CONV_FIX_FLOAT(name, p, fsz, ftype, isz, itype) \ | ||
28 | +ftype HELPER(vfp_##name##to##p)(uint##isz##_t x, uint32_t shift, \ | ||
29 | void *fpstp) \ | ||
30 | { return itype##_to_##float##fsz##_scalbn(x, -shift, fpstp); } | ||
31 | |||
32 | -#define VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, isz, itype, ROUND, suff) \ | ||
33 | -uint##isz##_t HELPER(vfp_to##name##p##suff)(float##fsz x, uint32_t shift, \ | ||
34 | +#define VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, ftype, isz, itype, ROUND, suff) \ | ||
35 | +uint##isz##_t HELPER(vfp_to##name##p##suff)(ftype x, uint32_t shift, \ | ||
36 | void *fpst) \ | ||
37 | { \ | ||
38 | if (unlikely(float##fsz##_is_any_nan(x))) { \ | ||
39 | @@ -XXX,XX +XXX,XX @@ uint##isz##_t HELPER(vfp_to##name##p##suff)(float##fsz x, uint32_t shift, \ | ||
40 | return float##fsz##_to_##itype##_scalbn(x, ROUND, shift, fpst); \ | ||
41 | } | ||
42 | |||
43 | -#define VFP_CONV_FIX(name, p, fsz, isz, itype) \ | ||
44 | -VFP_CONV_FIX_FLOAT(name, p, fsz, isz, itype) \ | ||
45 | -VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, isz, itype, \ | ||
46 | +#define VFP_CONV_FIX(name, p, fsz, ftype, isz, itype) \ | ||
47 | +VFP_CONV_FIX_FLOAT(name, p, fsz, ftype, isz, itype) \ | ||
48 | +VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, ftype, isz, itype, \ | ||
49 | float_round_to_zero, _round_to_zero) \ | ||
50 | -VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, isz, itype, \ | ||
51 | +VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, ftype, isz, itype, \ | ||
52 | get_float_rounding_mode(fpst), ) | ||
53 | |||
54 | -#define VFP_CONV_FIX_A64(name, p, fsz, isz, itype) \ | ||
55 | -VFP_CONV_FIX_FLOAT(name, p, fsz, isz, itype) \ | ||
56 | -VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, isz, itype, \ | ||
57 | +#define VFP_CONV_FIX_A64(name, p, fsz, ftype, isz, itype) \ | ||
58 | +VFP_CONV_FIX_FLOAT(name, p, fsz, ftype, isz, itype) \ | ||
59 | +VFP_CONV_FLOAT_FIX_ROUND(name, p, fsz, ftype, isz, itype, \ | ||
60 | get_float_rounding_mode(fpst), ) | ||
61 | |||
62 | -VFP_CONV_FIX(sh, d, 64, 64, int16) | ||
63 | -VFP_CONV_FIX(sl, d, 64, 64, int32) | ||
64 | -VFP_CONV_FIX_A64(sq, d, 64, 64, int64) | ||
65 | -VFP_CONV_FIX(uh, d, 64, 64, uint16) | ||
66 | -VFP_CONV_FIX(ul, d, 64, 64, uint32) | ||
67 | -VFP_CONV_FIX_A64(uq, d, 64, 64, uint64) | ||
68 | -VFP_CONV_FIX(sh, s, 32, 32, int16) | ||
69 | -VFP_CONV_FIX(sl, s, 32, 32, int32) | ||
70 | -VFP_CONV_FIX_A64(sq, s, 32, 64, int64) | ||
71 | -VFP_CONV_FIX(uh, s, 32, 32, uint16) | ||
72 | -VFP_CONV_FIX(ul, s, 32, 32, uint32) | ||
73 | -VFP_CONV_FIX_A64(uq, s, 32, 64, uint64) | ||
74 | +VFP_CONV_FIX(sh, d, 64, float64, 64, int16) | ||
75 | +VFP_CONV_FIX(sl, d, 64, float64, 64, int32) | ||
76 | +VFP_CONV_FIX_A64(sq, d, 64, float64, 64, int64) | ||
77 | +VFP_CONV_FIX(uh, d, 64, float64, 64, uint16) | ||
78 | +VFP_CONV_FIX(ul, d, 64, float64, 64, uint32) | ||
79 | +VFP_CONV_FIX_A64(uq, d, 64, float64, 64, uint64) | ||
80 | +VFP_CONV_FIX(sh, s, 32, float32, 32, int16) | ||
81 | +VFP_CONV_FIX(sl, s, 32, float32, 32, int32) | ||
82 | +VFP_CONV_FIX_A64(sq, s, 32, float32, 64, int64) | ||
83 | +VFP_CONV_FIX(uh, s, 32, float32, 32, uint16) | ||
84 | +VFP_CONV_FIX(ul, s, 32, float32, 32, uint32) | ||
85 | +VFP_CONV_FIX_A64(uq, s, 32, float32, 64, uint64) | ||
86 | |||
87 | #undef VFP_CONV_FIX | ||
88 | #undef VFP_CONV_FIX_FLOAT | ||
89 | -- | ||
90 | 2.20.1 | ||
91 | |||
92 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Now the VFP_CONV_FIX macros can handle fp16's distinction between the | ||
2 | width of the operation and the width of the type used to pass operands, | ||
3 | use the macros rather than the open-coded functions. | ||
1 | 4 | ||
5 | This creates an extra six helper functions, all of which we are going | ||
6 | to need for the AArch32 VFP fp16 instructions. | ||
7 | |||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | Message-id: 20200828183354.27913-15-peter.maydell@linaro.org | ||
11 | --- | ||
12 | target/arm/helper.h | 6 +++ | ||
13 | target/arm/vfp_helper.c | 86 +++-------------------------------------- | ||
14 | 2 files changed, 12 insertions(+), 80 deletions(-) | ||
15 | |||
16 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
17 | index XXXXXXX..XXXXXXX 100644 | ||
18 | --- a/target/arm/helper.h | ||
19 | +++ b/target/arm/helper.h | ||
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_2(vfp_tosizh, s32, f16, ptr) | ||
21 | DEF_HELPER_2(vfp_tosizs, s32, f32, ptr) | ||
22 | DEF_HELPER_2(vfp_tosizd, s32, f64, ptr) | ||
23 | |||
24 | +DEF_HELPER_3(vfp_toshh_round_to_zero, i32, f16, i32, ptr) | ||
25 | +DEF_HELPER_3(vfp_toslh_round_to_zero, i32, f16, i32, ptr) | ||
26 | +DEF_HELPER_3(vfp_touhh_round_to_zero, i32, f16, i32, ptr) | ||
27 | +DEF_HELPER_3(vfp_toulh_round_to_zero, i32, f16, i32, ptr) | ||
28 | DEF_HELPER_3(vfp_toshs_round_to_zero, i32, f32, i32, ptr) | ||
29 | DEF_HELPER_3(vfp_tosls_round_to_zero, i32, f32, i32, ptr) | ||
30 | DEF_HELPER_3(vfp_touhs_round_to_zero, i32, f32, i32, ptr) | ||
31 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_sqtod, f64, i64, i32, ptr) | ||
32 | DEF_HELPER_3(vfp_uhtod, f64, i64, i32, ptr) | ||
33 | DEF_HELPER_3(vfp_ultod, f64, i64, i32, ptr) | ||
34 | DEF_HELPER_3(vfp_uqtod, f64, i64, i32, ptr) | ||
35 | +DEF_HELPER_3(vfp_shtoh, f16, i32, i32, ptr) | ||
36 | +DEF_HELPER_3(vfp_uhtoh, f16, i32, i32, ptr) | ||
37 | DEF_HELPER_3(vfp_sltoh, f16, i32, i32, ptr) | ||
38 | DEF_HELPER_3(vfp_ultoh, f16, i32, i32, ptr) | ||
39 | DEF_HELPER_3(vfp_sqtoh, f16, i64, i32, ptr) | ||
40 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
41 | index XXXXXXX..XXXXXXX 100644 | ||
42 | --- a/target/arm/vfp_helper.c | ||
43 | +++ b/target/arm/vfp_helper.c | ||
44 | @@ -XXX,XX +XXX,XX @@ VFP_CONV_FIX_A64(sq, s, 32, float32, 64, int64) | ||
45 | VFP_CONV_FIX(uh, s, 32, float32, 32, uint16) | ||
46 | VFP_CONV_FIX(ul, s, 32, float32, 32, uint32) | ||
47 | VFP_CONV_FIX_A64(uq, s, 32, float32, 64, uint64) | ||
48 | +VFP_CONV_FIX(sh, h, 16, dh_ctype_f16, 32, int16) | ||
49 | +VFP_CONV_FIX(sl, h, 16, dh_ctype_f16, 32, int32) | ||
50 | +VFP_CONV_FIX_A64(sq, h, 16, dh_ctype_f16, 64, int64) | ||
51 | +VFP_CONV_FIX(uh, h, 16, dh_ctype_f16, 32, uint16) | ||
52 | +VFP_CONV_FIX(ul, h, 16, dh_ctype_f16, 32, uint32) | ||
53 | +VFP_CONV_FIX_A64(uq, h, 16, dh_ctype_f16, 64, uint64) | ||
54 | |||
55 | #undef VFP_CONV_FIX | ||
56 | #undef VFP_CONV_FIX_FLOAT | ||
57 | #undef VFP_CONV_FLOAT_FIX_ROUND | ||
58 | #undef VFP_CONV_FIX_A64 | ||
59 | |||
60 | -uint32_t HELPER(vfp_sltoh)(uint32_t x, uint32_t shift, void *fpst) | ||
61 | -{ | ||
62 | - return int32_to_float16_scalbn(x, -shift, fpst); | ||
63 | -} | ||
64 | - | ||
65 | -uint32_t HELPER(vfp_ultoh)(uint32_t x, uint32_t shift, void *fpst) | ||
66 | -{ | ||
67 | - return uint32_to_float16_scalbn(x, -shift, fpst); | ||
68 | -} | ||
69 | - | ||
70 | -uint32_t HELPER(vfp_sqtoh)(uint64_t x, uint32_t shift, void *fpst) | ||
71 | -{ | ||
72 | - return int64_to_float16_scalbn(x, -shift, fpst); | ||
73 | -} | ||
74 | - | ||
75 | -uint32_t HELPER(vfp_uqtoh)(uint64_t x, uint32_t shift, void *fpst) | ||
76 | -{ | ||
77 | - return uint64_to_float16_scalbn(x, -shift, fpst); | ||
78 | -} | ||
79 | - | ||
80 | -uint32_t HELPER(vfp_toshh)(uint32_t x, uint32_t shift, void *fpst) | ||
81 | -{ | ||
82 | - if (unlikely(float16_is_any_nan(x))) { | ||
83 | - float_raise(float_flag_invalid, fpst); | ||
84 | - return 0; | ||
85 | - } | ||
86 | - return float16_to_int16_scalbn(x, get_float_rounding_mode(fpst), | ||
87 | - shift, fpst); | ||
88 | -} | ||
89 | - | ||
90 | -uint32_t HELPER(vfp_touhh)(uint32_t x, uint32_t shift, void *fpst) | ||
91 | -{ | ||
92 | - if (unlikely(float16_is_any_nan(x))) { | ||
93 | - float_raise(float_flag_invalid, fpst); | ||
94 | - return 0; | ||
95 | - } | ||
96 | - return float16_to_uint16_scalbn(x, get_float_rounding_mode(fpst), | ||
97 | - shift, fpst); | ||
98 | -} | ||
99 | - | ||
100 | -uint32_t HELPER(vfp_toslh)(uint32_t x, uint32_t shift, void *fpst) | ||
101 | -{ | ||
102 | - if (unlikely(float16_is_any_nan(x))) { | ||
103 | - float_raise(float_flag_invalid, fpst); | ||
104 | - return 0; | ||
105 | - } | ||
106 | - return float16_to_int32_scalbn(x, get_float_rounding_mode(fpst), | ||
107 | - shift, fpst); | ||
108 | -} | ||
109 | - | ||
110 | -uint32_t HELPER(vfp_toulh)(uint32_t x, uint32_t shift, void *fpst) | ||
111 | -{ | ||
112 | - if (unlikely(float16_is_any_nan(x))) { | ||
113 | - float_raise(float_flag_invalid, fpst); | ||
114 | - return 0; | ||
115 | - } | ||
116 | - return float16_to_uint32_scalbn(x, get_float_rounding_mode(fpst), | ||
117 | - shift, fpst); | ||
118 | -} | ||
119 | - | ||
120 | -uint64_t HELPER(vfp_tosqh)(uint32_t x, uint32_t shift, void *fpst) | ||
121 | -{ | ||
122 | - if (unlikely(float16_is_any_nan(x))) { | ||
123 | - float_raise(float_flag_invalid, fpst); | ||
124 | - return 0; | ||
125 | - } | ||
126 | - return float16_to_int64_scalbn(x, get_float_rounding_mode(fpst), | ||
127 | - shift, fpst); | ||
128 | -} | ||
129 | - | ||
130 | -uint64_t HELPER(vfp_touqh)(uint32_t x, uint32_t shift, void *fpst) | ||
131 | -{ | ||
132 | - if (unlikely(float16_is_any_nan(x))) { | ||
133 | - float_raise(float_flag_invalid, fpst); | ||
134 | - return 0; | ||
135 | - } | ||
136 | - return float16_to_uint64_scalbn(x, get_float_rounding_mode(fpst), | ||
137 | - shift, fpst); | ||
138 | -} | ||
139 | - | ||
140 | /* Set the current fp rounding mode and return the old one. | ||
141 | * The argument is a softfloat float_round_ value. | ||
142 | */ | ||
143 | -- | ||
144 | 2.20.1 | ||
145 | |||
146 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement the fp16 versions of the VFP VCVT instruction forms which |
---|---|---|---|
2 | convert between floating point and fixed-point. | ||
2 | 3 | ||
3 | The Security Identifier device found in various Allwinner System on Chip | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | designs gives applications a per-board unique identifier. This commit | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | adds support for the Allwinner Security Identifier using a 128-bit | 6 | Message-id: 20200828183354.27913-16-peter.maydell@linaro.org |
6 | UUID value as input. | 7 | --- |
8 | target/arm/vfp.decode | 2 ++ | ||
9 | target/arm/translate-vfp.c.inc | 59 ++++++++++++++++++++++++++++++++++ | ||
10 | 2 files changed, 61 insertions(+) | ||
7 | 11 | ||
8 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 12 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode |
9 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
10 | Message-id: 20200311221854.30370-8-nieklinnenbank@gmail.com | ||
11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
12 | --- | ||
13 | hw/misc/Makefile.objs | 1 + | ||
14 | include/hw/arm/allwinner-h3.h | 3 + | ||
15 | include/hw/misc/allwinner-sid.h | 60 ++++++++++++ | ||
16 | hw/arm/allwinner-h3.c | 11 ++- | ||
17 | hw/arm/orangepi.c | 8 ++ | ||
18 | hw/misc/allwinner-sid.c | 168 ++++++++++++++++++++++++++++++++ | ||
19 | hw/misc/trace-events | 4 + | ||
20 | 7 files changed, 254 insertions(+), 1 deletion(-) | ||
21 | create mode 100644 include/hw/misc/allwinner-sid.h | ||
22 | create mode 100644 hw/misc/allwinner-sid.c | ||
23 | |||
24 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | ||
25 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/hw/misc/Makefile.objs | 14 | --- a/target/arm/vfp.decode |
27 | +++ b/hw/misc/Makefile.objs | 15 | +++ b/target/arm/vfp.decode |
28 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_IVSHMEM_DEVICE) += ivshmem.o | 16 | @@ -XXX,XX +XXX,XX @@ VJCVT ---- 1110 1.11 1001 .... 1011 11.0 .... @vfp_dm_sd |
29 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-ccu.o | 17 | # We assemble bits 18 (op), 16 (u) and 7 (sx) into a single opc field |
30 | obj-$(CONFIG_ALLWINNER_H3) += allwinner-cpucfg.o | 18 | # for the convenience of the trans_VCVT_fix functions. |
31 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-sysctrl.o | 19 | %vcvt_fix_op 18:1 16:1 7:1 |
32 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-sid.o | 20 | +VCVT_fix_hp ---- 1110 1.11 1.1. .... 1001 .1.0 .... \ |
33 | common-obj-$(CONFIG_REALVIEW) += arm_sysctl.o | 21 | + vd=%vd_sp imm=%vm_sp opc=%vcvt_fix_op |
34 | common-obj-$(CONFIG_NSERIES) += cbus.o | 22 | VCVT_fix_sp ---- 1110 1.11 1.1. .... 1010 .1.0 .... \ |
35 | common-obj-$(CONFIG_ECCMEMCTL) += eccmemctl.o | 23 | vd=%vd_sp imm=%vm_sp opc=%vcvt_fix_op |
36 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 24 | VCVT_fix_dp ---- 1110 1.11 1.1. .... 1011 .1.0 .... \ |
25 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
37 | index XXXXXXX..XXXXXXX 100644 | 26 | index XXXXXXX..XXXXXXX 100644 |
38 | --- a/include/hw/arm/allwinner-h3.h | 27 | --- a/target/arm/translate-vfp.c.inc |
39 | +++ b/include/hw/arm/allwinner-h3.h | 28 | +++ b/target/arm/translate-vfp.c.inc |
40 | @@ -XXX,XX +XXX,XX @@ | 29 | @@ -XXX,XX +XXX,XX @@ static bool trans_VJCVT(DisasContext *s, arg_VJCVT *a) |
41 | #include "hw/misc/allwinner-h3-ccu.h" | 30 | return true; |
42 | #include "hw/misc/allwinner-cpucfg.h" | 31 | } |
43 | #include "hw/misc/allwinner-h3-sysctrl.h" | 32 | |
44 | +#include "hw/misc/allwinner-sid.h" | 33 | +static bool trans_VCVT_fix_hp(DisasContext *s, arg_VCVT_fix_sp *a) |
45 | #include "target/arm/cpu.h" | 34 | +{ |
46 | 35 | + TCGv_i32 vd, shift; | |
47 | /** | 36 | + TCGv_ptr fpst; |
48 | @@ -XXX,XX +XXX,XX @@ enum { | 37 | + int frac_bits; |
49 | AW_H3_SRAM_A2, | ||
50 | AW_H3_SRAM_C, | ||
51 | AW_H3_SYSCTRL, | ||
52 | + AW_H3_SID, | ||
53 | AW_H3_EHCI0, | ||
54 | AW_H3_OHCI0, | ||
55 | AW_H3_EHCI1, | ||
56 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
57 | AwH3ClockCtlState ccu; | ||
58 | AwCpuCfgState cpucfg; | ||
59 | AwH3SysCtrlState sysctrl; | ||
60 | + AwSidState sid; | ||
61 | GICState gic; | ||
62 | MemoryRegion sram_a1; | ||
63 | MemoryRegion sram_a2; | ||
64 | diff --git a/include/hw/misc/allwinner-sid.h b/include/hw/misc/allwinner-sid.h | ||
65 | new file mode 100644 | ||
66 | index XXXXXXX..XXXXXXX | ||
67 | --- /dev/null | ||
68 | +++ b/include/hw/misc/allwinner-sid.h | ||
69 | @@ -XXX,XX +XXX,XX @@ | ||
70 | +/* | ||
71 | + * Allwinner Security ID emulation | ||
72 | + * | ||
73 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
74 | + * | ||
75 | + * This program is free software: you can redistribute it and/or modify | ||
76 | + * it under the terms of the GNU General Public License as published by | ||
77 | + * the Free Software Foundation, either version 2 of the License, or | ||
78 | + * (at your option) any later version. | ||
79 | + * | ||
80 | + * This program is distributed in the hope that it will be useful, | ||
81 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
82 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
83 | + * GNU General Public License for more details. | ||
84 | + * | ||
85 | + * You should have received a copy of the GNU General Public License | ||
86 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
87 | + */ | ||
88 | + | 38 | + |
89 | +#ifndef HW_MISC_ALLWINNER_SID_H | 39 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
90 | +#define HW_MISC_ALLWINNER_SID_H | 40 | + return false; |
91 | + | ||
92 | +#include "qom/object.h" | ||
93 | +#include "hw/sysbus.h" | ||
94 | +#include "qemu/uuid.h" | ||
95 | + | ||
96 | +/** | ||
97 | + * Object model | ||
98 | + * @{ | ||
99 | + */ | ||
100 | + | ||
101 | +#define TYPE_AW_SID "allwinner-sid" | ||
102 | +#define AW_SID(obj) \ | ||
103 | + OBJECT_CHECK(AwSidState, (obj), TYPE_AW_SID) | ||
104 | + | ||
105 | +/** @} */ | ||
106 | + | ||
107 | +/** | ||
108 | + * Allwinner Security ID object instance state | ||
109 | + */ | ||
110 | +typedef struct AwSidState { | ||
111 | + /*< private >*/ | ||
112 | + SysBusDevice parent_obj; | ||
113 | + /*< public >*/ | ||
114 | + | ||
115 | + /** Maps I/O registers in physical memory */ | ||
116 | + MemoryRegion iomem; | ||
117 | + | ||
118 | + /** Control register defines how and what to read */ | ||
119 | + uint32_t control; | ||
120 | + | ||
121 | + /** RdKey register contains the data retrieved by the device */ | ||
122 | + uint32_t rdkey; | ||
123 | + | ||
124 | + /** Stores the emulated device identifier */ | ||
125 | + QemuUUID identifier; | ||
126 | + | ||
127 | +} AwSidState; | ||
128 | + | ||
129 | +#endif /* HW_MISC_ALLWINNER_SID_H */ | ||
130 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
131 | index XXXXXXX..XXXXXXX 100644 | ||
132 | --- a/hw/arm/allwinner-h3.c | ||
133 | +++ b/hw/arm/allwinner-h3.c | ||
134 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
135 | [AW_H3_SRAM_A2] = 0x00044000, | ||
136 | [AW_H3_SRAM_C] = 0x00010000, | ||
137 | [AW_H3_SYSCTRL] = 0x01c00000, | ||
138 | + [AW_H3_SID] = 0x01c14000, | ||
139 | [AW_H3_EHCI0] = 0x01c1a000, | ||
140 | [AW_H3_OHCI0] = 0x01c1a400, | ||
141 | [AW_H3_EHCI1] = 0x01c1b000, | ||
142 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
143 | { "mmc0", 0x01c0f000, 4 * KiB }, | ||
144 | { "mmc1", 0x01c10000, 4 * KiB }, | ||
145 | { "mmc2", 0x01c11000, 4 * KiB }, | ||
146 | - { "sid", 0x01c14000, 1 * KiB }, | ||
147 | { "crypto", 0x01c15000, 4 * KiB }, | ||
148 | { "msgbox", 0x01c17000, 4 * KiB }, | ||
149 | { "spinlock", 0x01c18000, 4 * KiB }, | ||
150 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
151 | |||
152 | sysbus_init_child_obj(obj, "cpucfg", &s->cpucfg, sizeof(s->cpucfg), | ||
153 | TYPE_AW_CPUCFG); | ||
154 | + | ||
155 | + sysbus_init_child_obj(obj, "sid", &s->sid, sizeof(s->sid), | ||
156 | + TYPE_AW_SID); | ||
157 | + object_property_add_alias(obj, "identifier", OBJECT(&s->sid), | ||
158 | + "identifier", &error_abort); | ||
159 | } | ||
160 | |||
161 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
162 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
163 | qdev_init_nofail(DEVICE(&s->cpucfg)); | ||
164 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->cpucfg), 0, s->memmap[AW_H3_CPUCFG]); | ||
165 | |||
166 | + /* Security Identifier */ | ||
167 | + qdev_init_nofail(DEVICE(&s->sid)); | ||
168 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->sid), 0, s->memmap[AW_H3_SID]); | ||
169 | + | ||
170 | /* Universal Serial Bus */ | ||
171 | sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
172 | qdev_get_gpio_in(DEVICE(&s->gic), | ||
173 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | ||
174 | index XXXXXXX..XXXXXXX 100644 | ||
175 | --- a/hw/arm/orangepi.c | ||
176 | +++ b/hw/arm/orangepi.c | ||
177 | @@ -XXX,XX +XXX,XX @@ static void orangepi_init(MachineState *machine) | ||
178 | object_property_set_int(OBJECT(h3), 24 * 1000 * 1000, "clk1-freq", | ||
179 | &error_abort); | ||
180 | |||
181 | + /* Setup SID properties. Currently using a default fixed SID identifier. */ | ||
182 | + if (qemu_uuid_is_null(&h3->sid.identifier)) { | ||
183 | + qdev_prop_set_string(DEVICE(h3), "identifier", | ||
184 | + "02c00081-1111-2222-3333-000044556677"); | ||
185 | + } else if (ldl_be_p(&h3->sid.identifier.data[0]) != 0x02c00081) { | ||
186 | + warn_report("Security Identifier value does not include H3 prefix"); | ||
187 | + } | 41 | + } |
188 | + | 42 | + |
189 | /* Mark H3 object realized */ | 43 | + if (!vfp_access_check(s)) { |
190 | object_property_set_bool(OBJECT(h3), true, "realized", &error_abort); | 44 | + return true; |
191 | 45 | + } | |
192 | diff --git a/hw/misc/allwinner-sid.c b/hw/misc/allwinner-sid.c | ||
193 | new file mode 100644 | ||
194 | index XXXXXXX..XXXXXXX | ||
195 | --- /dev/null | ||
196 | +++ b/hw/misc/allwinner-sid.c | ||
197 | @@ -XXX,XX +XXX,XX @@ | ||
198 | +/* | ||
199 | + * Allwinner Security ID emulation | ||
200 | + * | ||
201 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
202 | + * | ||
203 | + * This program is free software: you can redistribute it and/or modify | ||
204 | + * it under the terms of the GNU General Public License as published by | ||
205 | + * the Free Software Foundation, either version 2 of the License, or | ||
206 | + * (at your option) any later version. | ||
207 | + * | ||
208 | + * This program is distributed in the hope that it will be useful, | ||
209 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
210 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
211 | + * GNU General Public License for more details. | ||
212 | + * | ||
213 | + * You should have received a copy of the GNU General Public License | ||
214 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
215 | + */ | ||
216 | + | 46 | + |
217 | +#include "qemu/osdep.h" | 47 | + frac_bits = (a->opc & 1) ? (32 - a->imm) : (16 - a->imm); |
218 | +#include "qemu/units.h" | ||
219 | +#include "hw/sysbus.h" | ||
220 | +#include "migration/vmstate.h" | ||
221 | +#include "qemu/log.h" | ||
222 | +#include "qemu/module.h" | ||
223 | +#include "qemu/guest-random.h" | ||
224 | +#include "qapi/error.h" | ||
225 | +#include "hw/qdev-properties.h" | ||
226 | +#include "hw/misc/allwinner-sid.h" | ||
227 | +#include "trace.h" | ||
228 | + | 48 | + |
229 | +/* SID register offsets */ | 49 | + vd = tcg_temp_new_i32(); |
230 | +enum { | 50 | + neon_load_reg32(vd, a->vd); |
231 | + REG_PRCTL = 0x40, /* Control */ | ||
232 | + REG_RDKEY = 0x60, /* Read Key */ | ||
233 | +}; | ||
234 | + | 51 | + |
235 | +/* SID register flags */ | 52 | + fpst = fpstatus_ptr(FPST_FPCR_F16); |
236 | +enum { | 53 | + shift = tcg_const_i32(frac_bits); |
237 | + REG_PRCTL_WRITE = 0x0002, /* Unknown write flag */ | ||
238 | + REG_PRCTL_OP_LOCK = 0xAC00, /* Lock operation */ | ||
239 | +}; | ||
240 | + | 54 | + |
241 | +static uint64_t allwinner_sid_read(void *opaque, hwaddr offset, | 55 | + /* Switch on op:U:sx bits */ |
242 | + unsigned size) | 56 | + switch (a->opc) { |
243 | +{ | 57 | + case 0: |
244 | + const AwSidState *s = AW_SID(opaque); | 58 | + gen_helper_vfp_shtoh(vd, vd, shift, fpst); |
245 | + uint64_t val = 0; | ||
246 | + | ||
247 | + switch (offset) { | ||
248 | + case REG_PRCTL: /* Control */ | ||
249 | + val = s->control; | ||
250 | + break; | 59 | + break; |
251 | + case REG_RDKEY: /* Read Key */ | 60 | + case 1: |
252 | + val = s->rdkey; | 61 | + gen_helper_vfp_sltoh(vd, vd, shift, fpst); |
62 | + break; | ||
63 | + case 2: | ||
64 | + gen_helper_vfp_uhtoh(vd, vd, shift, fpst); | ||
65 | + break; | ||
66 | + case 3: | ||
67 | + gen_helper_vfp_ultoh(vd, vd, shift, fpst); | ||
68 | + break; | ||
69 | + case 4: | ||
70 | + gen_helper_vfp_toshh_round_to_zero(vd, vd, shift, fpst); | ||
71 | + break; | ||
72 | + case 5: | ||
73 | + gen_helper_vfp_toslh_round_to_zero(vd, vd, shift, fpst); | ||
74 | + break; | ||
75 | + case 6: | ||
76 | + gen_helper_vfp_touhh_round_to_zero(vd, vd, shift, fpst); | ||
77 | + break; | ||
78 | + case 7: | ||
79 | + gen_helper_vfp_toulh_round_to_zero(vd, vd, shift, fpst); | ||
253 | + break; | 80 | + break; |
254 | + default: | 81 | + default: |
255 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | 82 | + g_assert_not_reached(); |
256 | + __func__, (uint32_t)offset); | ||
257 | + return 0; | ||
258 | + } | 83 | + } |
259 | + | 84 | + |
260 | + trace_allwinner_sid_read(offset, val, size); | 85 | + neon_store_reg32(vd, a->vd); |
261 | + | 86 | + tcg_temp_free_i32(vd); |
262 | + return val; | 87 | + tcg_temp_free_i32(shift); |
88 | + tcg_temp_free_ptr(fpst); | ||
89 | + return true; | ||
263 | +} | 90 | +} |
264 | + | 91 | + |
265 | +static void allwinner_sid_write(void *opaque, hwaddr offset, | 92 | static bool trans_VCVT_fix_sp(DisasContext *s, arg_VCVT_fix_sp *a) |
266 | + uint64_t val, unsigned size) | 93 | { |
267 | +{ | 94 | TCGv_i32 vd, shift; |
268 | + AwSidState *s = AW_SID(opaque); | ||
269 | + | ||
270 | + trace_allwinner_sid_write(offset, val, size); | ||
271 | + | ||
272 | + switch (offset) { | ||
273 | + case REG_PRCTL: /* Control */ | ||
274 | + s->control = val; | ||
275 | + | ||
276 | + if ((s->control & REG_PRCTL_OP_LOCK) && | ||
277 | + (s->control & REG_PRCTL_WRITE)) { | ||
278 | + uint32_t id = s->control >> 16; | ||
279 | + | ||
280 | + if (id <= sizeof(QemuUUID) - sizeof(s->rdkey)) { | ||
281 | + s->rdkey = ldl_be_p(&s->identifier.data[id]); | ||
282 | + } | ||
283 | + } | ||
284 | + s->control &= ~REG_PRCTL_WRITE; | ||
285 | + break; | ||
286 | + case REG_RDKEY: /* Read Key */ | ||
287 | + break; | ||
288 | + default: | ||
289 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
290 | + __func__, (uint32_t)offset); | ||
291 | + break; | ||
292 | + } | ||
293 | +} | ||
294 | + | ||
295 | +static const MemoryRegionOps allwinner_sid_ops = { | ||
296 | + .read = allwinner_sid_read, | ||
297 | + .write = allwinner_sid_write, | ||
298 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
299 | + .valid = { | ||
300 | + .min_access_size = 4, | ||
301 | + .max_access_size = 4, | ||
302 | + }, | ||
303 | + .impl.min_access_size = 4, | ||
304 | +}; | ||
305 | + | ||
306 | +static void allwinner_sid_reset(DeviceState *dev) | ||
307 | +{ | ||
308 | + AwSidState *s = AW_SID(dev); | ||
309 | + | ||
310 | + /* Set default values for registers */ | ||
311 | + s->control = 0; | ||
312 | + s->rdkey = 0; | ||
313 | +} | ||
314 | + | ||
315 | +static void allwinner_sid_init(Object *obj) | ||
316 | +{ | ||
317 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
318 | + AwSidState *s = AW_SID(obj); | ||
319 | + | ||
320 | + /* Memory mapping */ | ||
321 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_sid_ops, s, | ||
322 | + TYPE_AW_SID, 1 * KiB); | ||
323 | + sysbus_init_mmio(sbd, &s->iomem); | ||
324 | +} | ||
325 | + | ||
326 | +static Property allwinner_sid_properties[] = { | ||
327 | + DEFINE_PROP_UUID_NODEFAULT("identifier", AwSidState, identifier), | ||
328 | + DEFINE_PROP_END_OF_LIST() | ||
329 | +}; | ||
330 | + | ||
331 | +static const VMStateDescription allwinner_sid_vmstate = { | ||
332 | + .name = "allwinner-sid", | ||
333 | + .version_id = 1, | ||
334 | + .minimum_version_id = 1, | ||
335 | + .fields = (VMStateField[]) { | ||
336 | + VMSTATE_UINT32(control, AwSidState), | ||
337 | + VMSTATE_UINT32(rdkey, AwSidState), | ||
338 | + VMSTATE_UINT8_ARRAY_V(identifier.data, AwSidState, sizeof(QemuUUID), 1), | ||
339 | + VMSTATE_END_OF_LIST() | ||
340 | + } | ||
341 | +}; | ||
342 | + | ||
343 | +static void allwinner_sid_class_init(ObjectClass *klass, void *data) | ||
344 | +{ | ||
345 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
346 | + | ||
347 | + dc->reset = allwinner_sid_reset; | ||
348 | + dc->vmsd = &allwinner_sid_vmstate; | ||
349 | + device_class_set_props(dc, allwinner_sid_properties); | ||
350 | +} | ||
351 | + | ||
352 | +static const TypeInfo allwinner_sid_info = { | ||
353 | + .name = TYPE_AW_SID, | ||
354 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
355 | + .instance_init = allwinner_sid_init, | ||
356 | + .instance_size = sizeof(AwSidState), | ||
357 | + .class_init = allwinner_sid_class_init, | ||
358 | +}; | ||
359 | + | ||
360 | +static void allwinner_sid_register(void) | ||
361 | +{ | ||
362 | + type_register_static(&allwinner_sid_info); | ||
363 | +} | ||
364 | + | ||
365 | +type_init(allwinner_sid_register) | ||
366 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events | ||
367 | index XXXXXXX..XXXXXXX 100644 | ||
368 | --- a/hw/misc/trace-events | ||
369 | +++ b/hw/misc/trace-events | ||
370 | @@ -XXX,XX +XXX,XX @@ allwinner_cpucfg_cpu_reset(uint8_t cpu_id, uint32_t reset_addr) "id %u, reset_ad | ||
371 | allwinner_cpucfg_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
372 | allwinner_cpucfg_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
373 | |||
374 | +# allwinner-sid.c | ||
375 | +allwinner_sid_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
376 | +allwinner_sid_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
377 | + | ||
378 | # eccmemctl.c | ||
379 | ecc_mem_writel_mer(uint32_t val) "Write memory enable 0x%08x" | ||
380 | ecc_mem_writel_mdr(uint32_t val) "Write memory delay 0x%08x" | ||
381 | -- | 95 | -- |
382 | 2.20.1 | 96 | 2.20.1 |
383 | 97 | ||
384 | 98 | diff view generated by jsdifflib |
1 | From: Beata Michalska <beata.michalska@linaro.org> | 1 | Implement the fp16 versions of the VFP VCVT instruction forms |
---|---|---|---|
2 | which convert between floating point and integer with a specified | ||
3 | rounding mode. | ||
2 | 4 | ||
3 | KVM_SET_VCPU_EVENTS might actually lead to vcpu registers being modified. | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | As such this should be the last step of sync to avoid potential overwriting | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | of whatever changes KVM might have done. | 7 | Message-id: 20200828183354.27913-17-peter.maydell@linaro.org |
8 | --- | ||
9 | target/arm/vfp-uncond.decode | 6 ++++-- | ||
10 | target/arm/translate-vfp.c.inc | 32 ++++++++++++++++++++++++-------- | ||
11 | 2 files changed, 28 insertions(+), 10 deletions(-) | ||
6 | 12 | ||
7 | Signed-off-by: Beata Michalska <beata.michalska@linaro.org> | 13 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode |
8 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
9 | Message-id: 20200312003401.29017-2-beata.michalska@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | --- | ||
12 | target/arm/kvm32.c | 15 ++++++++++----- | ||
13 | target/arm/kvm64.c | 15 ++++++++++----- | ||
14 | 2 files changed, 20 insertions(+), 10 deletions(-) | ||
15 | |||
16 | diff --git a/target/arm/kvm32.c b/target/arm/kvm32.c | ||
17 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/kvm32.c | 15 | --- a/target/arm/vfp-uncond.decode |
19 | +++ b/target/arm/kvm32.c | 16 | +++ b/target/arm/vfp-uncond.decode |
20 | @@ -XXX,XX +XXX,XX @@ int kvm_arch_put_registers(CPUState *cs, int level) | 17 | @@ -XXX,XX +XXX,XX @@ VRINT 1111 1110 1.11 10 rm:2 .... 1011 01.0 .... \ |
21 | return ret; | 18 | vm=%vm_dp vd=%vd_dp dp=1 |
19 | |||
20 | # VCVT float to int with specified rounding mode; Vd is always single-precision | ||
21 | +VCVT 1111 1110 1.11 11 rm:2 .... 1001 op:1 1.0 .... \ | ||
22 | + vm=%vm_sp vd=%vd_sp sz=1 | ||
23 | VCVT 1111 1110 1.11 11 rm:2 .... 1010 op:1 1.0 .... \ | ||
24 | - vm=%vm_sp vd=%vd_sp dp=0 | ||
25 | + vm=%vm_sp vd=%vd_sp sz=2 | ||
26 | VCVT 1111 1110 1.11 11 rm:2 .... 1011 op:1 1.0 .... \ | ||
27 | - vm=%vm_dp vd=%vd_sp dp=1 | ||
28 | + vm=%vm_dp vd=%vd_sp sz=3 | ||
29 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/translate-vfp.c.inc | ||
32 | +++ b/target/arm/translate-vfp.c.inc | ||
33 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a) | ||
34 | static bool trans_VCVT(DisasContext *s, arg_VCVT *a) | ||
35 | { | ||
36 | uint32_t rd, rm; | ||
37 | - bool dp = a->dp; | ||
38 | + int sz = a->sz; | ||
39 | TCGv_ptr fpst; | ||
40 | TCGv_i32 tcg_rmode, tcg_shift; | ||
41 | int rounding = fp_decode_rm[a->rm]; | ||
42 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT(DisasContext *s, arg_VCVT *a) | ||
43 | return false; | ||
22 | } | 44 | } |
23 | 45 | ||
24 | - ret = kvm_put_vcpu_events(cpu); | 46 | - if (dp && !dc_isar_feature(aa32_fpdp_v2, s)) { |
25 | - if (ret) { | 47 | + if (sz == 3 && !dc_isar_feature(aa32_fpdp_v2, s)) { |
26 | - return ret; | 48 | + return false; |
27 | - } | ||
28 | - | ||
29 | write_cpustate_to_list(cpu, true); | ||
30 | |||
31 | if (!write_list_to_kvmstate(cpu, level)) { | ||
32 | return EINVAL; | ||
33 | } | ||
34 | |||
35 | + /* | ||
36 | + * Setting VCPU events should be triggered after syncing the registers | ||
37 | + * to avoid overwriting potential changes made by KVM upon calling | ||
38 | + * KVM_SET_VCPU_EVENTS ioctl | ||
39 | + */ | ||
40 | + ret = kvm_put_vcpu_events(cpu); | ||
41 | + if (ret) { | ||
42 | + return ret; | ||
43 | + } | 49 | + } |
44 | + | 50 | + |
45 | kvm_arm_sync_mpstate_to_kvm(cpu); | 51 | + if (sz == 1 && !dc_isar_feature(aa32_fp16_arith, s)) { |
46 | 52 | return false; | |
47 | return ret; | ||
48 | diff --git a/target/arm/kvm64.c b/target/arm/kvm64.c | ||
49 | index XXXXXXX..XXXXXXX 100644 | ||
50 | --- a/target/arm/kvm64.c | ||
51 | +++ b/target/arm/kvm64.c | ||
52 | @@ -XXX,XX +XXX,XX @@ int kvm_arch_put_registers(CPUState *cs, int level) | ||
53 | return ret; | ||
54 | } | 53 | } |
55 | 54 | ||
56 | - ret = kvm_put_vcpu_events(cpu); | 55 | /* UNDEF accesses to D16-D31 if they don't exist */ |
57 | - if (ret) { | 56 | - if (dp && !dc_isar_feature(aa32_simd_r32, s) && (a->vm & 0x10)) { |
58 | - return ret; | 57 | + if (sz == 3 && !dc_isar_feature(aa32_simd_r32, s) && (a->vm & 0x10)) { |
59 | - } | 58 | return false; |
60 | - | ||
61 | write_cpustate_to_list(cpu, true); | ||
62 | |||
63 | if (!write_list_to_kvmstate(cpu, level)) { | ||
64 | return -EINVAL; | ||
65 | } | 59 | } |
66 | 60 | ||
67 | + /* | 61 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT(DisasContext *s, arg_VCVT *a) |
68 | + * Setting VCPU events should be triggered after syncing the registers | 62 | return true; |
69 | + * to avoid overwriting potential changes made by KVM upon calling | 63 | } |
70 | + * KVM_SET_VCPU_EVENTS ioctl | 64 | |
71 | + */ | 65 | - fpst = fpstatus_ptr(FPST_FPCR); |
72 | + ret = kvm_put_vcpu_events(cpu); | 66 | + if (sz == 1) { |
73 | + if (ret) { | 67 | + fpst = fpstatus_ptr(FPST_FPCR_F16); |
74 | + return ret; | 68 | + } else { |
69 | + fpst = fpstatus_ptr(FPST_FPCR); | ||
75 | + } | 70 | + } |
76 | + | 71 | |
77 | kvm_arm_sync_mpstate_to_kvm(cpu); | 72 | tcg_shift = tcg_const_i32(0); |
78 | 73 | ||
79 | return ret; | 74 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding)); |
75 | gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
76 | |||
77 | - if (dp) { | ||
78 | + if (sz == 3) { | ||
79 | TCGv_i64 tcg_double, tcg_res; | ||
80 | TCGv_i32 tcg_tmp; | ||
81 | tcg_double = tcg_temp_new_i64(); | ||
82 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT(DisasContext *s, arg_VCVT *a) | ||
83 | tcg_single = tcg_temp_new_i32(); | ||
84 | tcg_res = tcg_temp_new_i32(); | ||
85 | neon_load_reg32(tcg_single, rm); | ||
86 | - if (is_signed) { | ||
87 | - gen_helper_vfp_tosls(tcg_res, tcg_single, tcg_shift, fpst); | ||
88 | + if (sz == 1) { | ||
89 | + if (is_signed) { | ||
90 | + gen_helper_vfp_toslh(tcg_res, tcg_single, tcg_shift, fpst); | ||
91 | + } else { | ||
92 | + gen_helper_vfp_toulh(tcg_res, tcg_single, tcg_shift, fpst); | ||
93 | + } | ||
94 | } else { | ||
95 | - gen_helper_vfp_touls(tcg_res, tcg_single, tcg_shift, fpst); | ||
96 | + if (is_signed) { | ||
97 | + gen_helper_vfp_tosls(tcg_res, tcg_single, tcg_shift, fpst); | ||
98 | + } else { | ||
99 | + gen_helper_vfp_touls(tcg_res, tcg_single, tcg_shift, fpst); | ||
100 | + } | ||
101 | } | ||
102 | neon_store_reg32(tcg_res, rd); | ||
103 | tcg_temp_free_i32(tcg_res); | ||
80 | -- | 104 | -- |
81 | 2.20.1 | 105 | 2.20.1 |
82 | 106 | ||
83 | 107 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | Implement the fp16 versions of the VFP VSEL instruction. | ||
1 | 2 | ||
3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20200828183354.27913-18-peter.maydell@linaro.org | ||
6 | --- | ||
7 | target/arm/vfp-uncond.decode | 6 ++++-- | ||
8 | target/arm/translate-vfp.c.inc | 16 ++++++++++++---- | ||
9 | 2 files changed, 16 insertions(+), 6 deletions(-) | ||
10 | |||
11 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode | ||
12 | index XXXXXXX..XXXXXXX 100644 | ||
13 | --- a/target/arm/vfp-uncond.decode | ||
14 | +++ b/target/arm/vfp-uncond.decode | ||
15 | @@ -XXX,XX +XXX,XX @@ | ||
16 | @vfp_dnm_s ................................ vm=%vm_sp vn=%vn_sp vd=%vd_sp | ||
17 | @vfp_dnm_d ................................ vm=%vm_dp vn=%vn_dp vd=%vd_dp | ||
18 | |||
19 | +VSEL 1111 1110 0. cc:2 .... .... 1001 .0.0 .... \ | ||
20 | + vm=%vm_sp vn=%vn_sp vd=%vd_sp sz=1 | ||
21 | VSEL 1111 1110 0. cc:2 .... .... 1010 .0.0 .... \ | ||
22 | - vm=%vm_sp vn=%vn_sp vd=%vd_sp dp=0 | ||
23 | + vm=%vm_sp vn=%vn_sp vd=%vd_sp sz=2 | ||
24 | VSEL 1111 1110 0. cc:2 .... .... 1011 .0.0 .... \ | ||
25 | - vm=%vm_dp vn=%vn_dp vd=%vd_dp dp=1 | ||
26 | + vm=%vm_dp vn=%vn_dp vd=%vd_dp sz=3 | ||
27 | |||
28 | VMAXNM_hp 1111 1110 1.00 .... .... 1001 .0.0 .... @vfp_dnm_s | ||
29 | VMINNM_hp 1111 1110 1.00 .... .... 1001 .1.0 .... @vfp_dnm_s | ||
30 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
31 | index XXXXXXX..XXXXXXX 100644 | ||
32 | --- a/target/arm/translate-vfp.c.inc | ||
33 | +++ b/target/arm/translate-vfp.c.inc | ||
34 | @@ -XXX,XX +XXX,XX @@ static bool vfp_access_check(DisasContext *s) | ||
35 | static bool trans_VSEL(DisasContext *s, arg_VSEL *a) | ||
36 | { | ||
37 | uint32_t rd, rn, rm; | ||
38 | - bool dp = a->dp; | ||
39 | + int sz = a->sz; | ||
40 | |||
41 | if (!dc_isar_feature(aa32_vsel, s)) { | ||
42 | return false; | ||
43 | } | ||
44 | |||
45 | - if (dp && !dc_isar_feature(aa32_fpdp_v2, s)) { | ||
46 | + if (sz == 3 && !dc_isar_feature(aa32_fpdp_v2, s)) { | ||
47 | + return false; | ||
48 | + } | ||
49 | + | ||
50 | + if (sz == 1 && !dc_isar_feature(aa32_fp16_arith, s)) { | ||
51 | return false; | ||
52 | } | ||
53 | |||
54 | /* UNDEF accesses to D16-D31 if they don't exist */ | ||
55 | - if (dp && !dc_isar_feature(aa32_simd_r32, s) && | ||
56 | + if (sz == 3 && !dc_isar_feature(aa32_simd_r32, s) && | ||
57 | ((a->vm | a->vn | a->vd) & 0x10)) { | ||
58 | return false; | ||
59 | } | ||
60 | @@ -XXX,XX +XXX,XX @@ static bool trans_VSEL(DisasContext *s, arg_VSEL *a) | ||
61 | return true; | ||
62 | } | ||
63 | |||
64 | - if (dp) { | ||
65 | + if (sz == 3) { | ||
66 | TCGv_i64 frn, frm, dest; | ||
67 | TCGv_i64 tmp, zero, zf, nf, vf; | ||
68 | |||
69 | @@ -XXX,XX +XXX,XX @@ static bool trans_VSEL(DisasContext *s, arg_VSEL *a) | ||
70 | tcg_temp_free_i32(tmp); | ||
71 | break; | ||
72 | } | ||
73 | + /* For fp16 the top half is always zeroes */ | ||
74 | + if (sz == 1) { | ||
75 | + tcg_gen_andi_i32(dest, dest, 0xffff); | ||
76 | + } | ||
77 | neon_store_reg32(dest, rd); | ||
78 | tcg_temp_free_i32(frn); | ||
79 | tcg_temp_free_i32(frm); | ||
80 | -- | ||
81 | 2.20.1 | ||
82 | |||
83 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | 1 | Implement the fp16 version of the VFP VRINT* insns. | |
2 | |||
3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
5 | Message-id: 20200828183354.27913-19-peter.maydell@linaro.org | ||
6 | --- | ||
7 | target/arm/helper.h | 2 + | ||
8 | target/arm/vfp-uncond.decode | 6 ++- | ||
9 | target/arm/vfp.decode | 3 ++ | ||
10 | target/arm/vfp_helper.c | 21 ++++++++ | ||
11 | target/arm/translate-vfp.c.inc | 98 +++++++++++++++++++++++++++++++--- | ||
12 | 5 files changed, 122 insertions(+), 8 deletions(-) | ||
13 | |||
14 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
15 | index XXXXXXX..XXXXXXX 100644 | ||
16 | --- a/target/arm/helper.h | ||
17 | +++ b/target/arm/helper.h | ||
18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(shr_cc, i32, env, i32, i32) | ||
19 | DEF_HELPER_3(sar_cc, i32, env, i32, i32) | ||
20 | DEF_HELPER_3(ror_cc, i32, env, i32, i32) | ||
21 | |||
22 | +DEF_HELPER_FLAGS_2(rinth_exact, TCG_CALL_NO_RWG, f16, f16, ptr) | ||
23 | DEF_HELPER_FLAGS_2(rints_exact, TCG_CALL_NO_RWG, f32, f32, ptr) | ||
24 | DEF_HELPER_FLAGS_2(rintd_exact, TCG_CALL_NO_RWG, f64, f64, ptr) | ||
25 | +DEF_HELPER_FLAGS_2(rinth, TCG_CALL_NO_RWG, f16, f16, ptr) | ||
26 | DEF_HELPER_FLAGS_2(rints, TCG_CALL_NO_RWG, f32, f32, ptr) | ||
27 | DEF_HELPER_FLAGS_2(rintd, TCG_CALL_NO_RWG, f64, f64, ptr) | ||
28 | |||
29 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/vfp-uncond.decode | ||
32 | +++ b/target/arm/vfp-uncond.decode | ||
33 | @@ -XXX,XX +XXX,XX @@ VMINNM_sp 1111 1110 1.00 .... .... 1010 .1.0 .... @vfp_dnm_s | ||
34 | VMAXNM_dp 1111 1110 1.00 .... .... 1011 .0.0 .... @vfp_dnm_d | ||
35 | VMINNM_dp 1111 1110 1.00 .... .... 1011 .1.0 .... @vfp_dnm_d | ||
36 | |||
37 | +VRINT 1111 1110 1.11 10 rm:2 .... 1001 01.0 .... \ | ||
38 | + vm=%vm_sp vd=%vd_sp sz=1 | ||
39 | VRINT 1111 1110 1.11 10 rm:2 .... 1010 01.0 .... \ | ||
40 | - vm=%vm_sp vd=%vd_sp dp=0 | ||
41 | + vm=%vm_sp vd=%vd_sp sz=2 | ||
42 | VRINT 1111 1110 1.11 10 rm:2 .... 1011 01.0 .... \ | ||
43 | - vm=%vm_dp vd=%vd_dp dp=1 | ||
44 | + vm=%vm_dp vd=%vd_dp sz=3 | ||
45 | |||
46 | # VCVT float to int with specified rounding mode; Vd is always single-precision | ||
47 | VCVT 1111 1110 1.11 11 rm:2 .... 1001 op:1 1.0 .... \ | ||
48 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode | ||
49 | index XXXXXXX..XXXXXXX 100644 | ||
50 | --- a/target/arm/vfp.decode | ||
51 | +++ b/target/arm/vfp.decode | ||
52 | @@ -XXX,XX +XXX,XX @@ VCVT_f16_f32 ---- 1110 1.11 0011 .... 1010 t:1 1.0 .... \ | ||
53 | VCVT_f16_f64 ---- 1110 1.11 0011 .... 1011 t:1 1.0 .... \ | ||
54 | vd=%vd_sp vm=%vm_dp | ||
55 | |||
56 | +VRINTR_hp ---- 1110 1.11 0110 .... 1001 01.0 .... @vfp_dm_ss | ||
57 | VRINTR_sp ---- 1110 1.11 0110 .... 1010 01.0 .... @vfp_dm_ss | ||
58 | VRINTR_dp ---- 1110 1.11 0110 .... 1011 01.0 .... @vfp_dm_dd | ||
59 | |||
60 | +VRINTZ_hp ---- 1110 1.11 0110 .... 1001 11.0 .... @vfp_dm_ss | ||
61 | VRINTZ_sp ---- 1110 1.11 0110 .... 1010 11.0 .... @vfp_dm_ss | ||
62 | VRINTZ_dp ---- 1110 1.11 0110 .... 1011 11.0 .... @vfp_dm_dd | ||
63 | |||
64 | +VRINTX_hp ---- 1110 1.11 0111 .... 1001 01.0 .... @vfp_dm_ss | ||
65 | VRINTX_sp ---- 1110 1.11 0111 .... 1010 01.0 .... @vfp_dm_ss | ||
66 | VRINTX_dp ---- 1110 1.11 0111 .... 1011 01.0 .... @vfp_dm_dd | ||
67 | |||
68 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
69 | index XXXXXXX..XXXXXXX 100644 | ||
70 | --- a/target/arm/vfp_helper.c | ||
71 | +++ b/target/arm/vfp_helper.c | ||
72 | @@ -XXX,XX +XXX,XX @@ float64 VFP_HELPER(muladd, d)(float64 a, float64 b, float64 c, void *fpstp) | ||
73 | } | ||
74 | |||
75 | /* ARMv8 round to integral */ | ||
76 | +dh_ctype_f16 HELPER(rinth_exact)(dh_ctype_f16 x, void *fp_status) | ||
77 | +{ | ||
78 | + return float16_round_to_int(x, fp_status); | ||
79 | +} | ||
80 | + | ||
81 | float32 HELPER(rints_exact)(float32 x, void *fp_status) | ||
82 | { | ||
83 | return float32_round_to_int(x, fp_status); | ||
84 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(rintd_exact)(float64 x, void *fp_status) | ||
85 | return float64_round_to_int(x, fp_status); | ||
86 | } | ||
87 | |||
88 | +dh_ctype_f16 HELPER(rinth)(dh_ctype_f16 x, void *fp_status) | ||
89 | +{ | ||
90 | + int old_flags = get_float_exception_flags(fp_status), new_flags; | ||
91 | + float16 ret; | ||
92 | + | ||
93 | + ret = float16_round_to_int(x, fp_status); | ||
94 | + | ||
95 | + /* Suppress any inexact exceptions the conversion produced */ | ||
96 | + if (!(old_flags & float_flag_inexact)) { | ||
97 | + new_flags = get_float_exception_flags(fp_status); | ||
98 | + set_float_exception_flags(new_flags & ~float_flag_inexact, fp_status); | ||
99 | + } | ||
100 | + | ||
101 | + return ret; | ||
102 | +} | ||
103 | + | ||
104 | float32 HELPER(rints)(float32 x, void *fp_status) | ||
105 | { | ||
106 | int old_flags = get_float_exception_flags(fp_status), new_flags; | ||
107 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | ||
108 | index XXXXXXX..XXXXXXX 100644 | ||
109 | --- a/target/arm/translate-vfp.c.inc | ||
110 | +++ b/target/arm/translate-vfp.c.inc | ||
111 | @@ -XXX,XX +XXX,XX @@ static const uint8_t fp_decode_rm[] = { | ||
112 | static bool trans_VRINT(DisasContext *s, arg_VRINT *a) | ||
113 | { | ||
114 | uint32_t rd, rm; | ||
115 | - bool dp = a->dp; | ||
116 | + int sz = a->sz; | ||
117 | TCGv_ptr fpst; | ||
118 | TCGv_i32 tcg_rmode; | ||
119 | int rounding = fp_decode_rm[a->rm]; | ||
120 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a) | ||
121 | return false; | ||
122 | } | ||
123 | |||
124 | - if (dp && !dc_isar_feature(aa32_fpdp_v2, s)) { | ||
125 | + if (sz == 3 && !dc_isar_feature(aa32_fpdp_v2, s)) { | ||
126 | + return false; | ||
127 | + } | ||
128 | + | ||
129 | + if (sz == 1 && !dc_isar_feature(aa32_fp16_arith, s)) { | ||
130 | return false; | ||
131 | } | ||
132 | |||
133 | /* UNDEF accesses to D16-D31 if they don't exist */ | ||
134 | - if (dp && !dc_isar_feature(aa32_simd_r32, s) && | ||
135 | + if (sz == 3 && !dc_isar_feature(aa32_simd_r32, s) && | ||
136 | ((a->vm | a->vd) & 0x10)) { | ||
137 | return false; | ||
138 | } | ||
139 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a) | ||
140 | return true; | ||
141 | } | ||
142 | |||
143 | - fpst = fpstatus_ptr(FPST_FPCR); | ||
144 | + if (sz == 1) { | ||
145 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
146 | + } else { | ||
147 | + fpst = fpstatus_ptr(FPST_FPCR); | ||
148 | + } | ||
149 | |||
150 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding)); | ||
151 | gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
152 | |||
153 | - if (dp) { | ||
154 | + if (sz == 3) { | ||
155 | TCGv_i64 tcg_op; | ||
156 | TCGv_i64 tcg_res; | ||
157 | tcg_op = tcg_temp_new_i64(); | ||
158 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINT(DisasContext *s, arg_VRINT *a) | ||
159 | tcg_op = tcg_temp_new_i32(); | ||
160 | tcg_res = tcg_temp_new_i32(); | ||
161 | neon_load_reg32(tcg_op, rm); | ||
162 | - gen_helper_rints(tcg_res, tcg_op, fpst); | ||
163 | + if (sz == 1) { | ||
164 | + gen_helper_rinth(tcg_res, tcg_op, fpst); | ||
165 | + } else { | ||
166 | + gen_helper_rints(tcg_res, tcg_op, fpst); | ||
167 | + } | ||
168 | neon_store_reg32(tcg_res, rd); | ||
169 | tcg_temp_free_i32(tcg_op); | ||
170 | tcg_temp_free_i32(tcg_res); | ||
171 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCVT_f16_f64(DisasContext *s, arg_VCVT_f16_f64 *a) | ||
172 | return true; | ||
173 | } | ||
174 | |||
175 | +static bool trans_VRINTR_hp(DisasContext *s, arg_VRINTR_sp *a) | ||
176 | +{ | ||
177 | + TCGv_ptr fpst; | ||
178 | + TCGv_i32 tmp; | ||
179 | + | ||
180 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
181 | + return false; | ||
182 | + } | ||
183 | + | ||
184 | + if (!vfp_access_check(s)) { | ||
185 | + return true; | ||
186 | + } | ||
187 | + | ||
188 | + tmp = tcg_temp_new_i32(); | ||
189 | + neon_load_reg32(tmp, a->vm); | ||
190 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
191 | + gen_helper_rinth(tmp, tmp, fpst); | ||
192 | + neon_store_reg32(tmp, a->vd); | ||
193 | + tcg_temp_free_ptr(fpst); | ||
194 | + tcg_temp_free_i32(tmp); | ||
195 | + return true; | ||
196 | +} | ||
197 | + | ||
198 | static bool trans_VRINTR_sp(DisasContext *s, arg_VRINTR_sp *a) | ||
199 | { | ||
200 | TCGv_ptr fpst; | ||
201 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINTR_dp(DisasContext *s, arg_VRINTR_dp *a) | ||
202 | return true; | ||
203 | } | ||
204 | |||
205 | +static bool trans_VRINTZ_hp(DisasContext *s, arg_VRINTZ_sp *a) | ||
206 | +{ | ||
207 | + TCGv_ptr fpst; | ||
208 | + TCGv_i32 tmp; | ||
209 | + TCGv_i32 tcg_rmode; | ||
210 | + | ||
211 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
212 | + return false; | ||
213 | + } | ||
214 | + | ||
215 | + if (!vfp_access_check(s)) { | ||
216 | + return true; | ||
217 | + } | ||
218 | + | ||
219 | + tmp = tcg_temp_new_i32(); | ||
220 | + neon_load_reg32(tmp, a->vm); | ||
221 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
222 | + tcg_rmode = tcg_const_i32(float_round_to_zero); | ||
223 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
224 | + gen_helper_rinth(tmp, tmp, fpst); | ||
225 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
226 | + neon_store_reg32(tmp, a->vd); | ||
227 | + tcg_temp_free_ptr(fpst); | ||
228 | + tcg_temp_free_i32(tcg_rmode); | ||
229 | + tcg_temp_free_i32(tmp); | ||
230 | + return true; | ||
231 | +} | ||
232 | + | ||
233 | static bool trans_VRINTZ_sp(DisasContext *s, arg_VRINTZ_sp *a) | ||
234 | { | ||
235 | TCGv_ptr fpst; | ||
236 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINTZ_dp(DisasContext *s, arg_VRINTZ_dp *a) | ||
237 | return true; | ||
238 | } | ||
239 | |||
240 | +static bool trans_VRINTX_hp(DisasContext *s, arg_VRINTX_sp *a) | ||
241 | +{ | ||
242 | + TCGv_ptr fpst; | ||
243 | + TCGv_i32 tmp; | ||
244 | + | ||
245 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
246 | + return false; | ||
247 | + } | ||
248 | + | ||
249 | + if (!vfp_access_check(s)) { | ||
250 | + return true; | ||
251 | + } | ||
252 | + | ||
253 | + tmp = tcg_temp_new_i32(); | ||
254 | + neon_load_reg32(tmp, a->vm); | ||
255 | + fpst = fpstatus_ptr(FPST_FPCR_F16); | ||
256 | + gen_helper_rinth_exact(tmp, tmp, fpst); | ||
257 | + neon_store_reg32(tmp, a->vd); | ||
258 | + tcg_temp_free_ptr(fpst); | ||
259 | + tcg_temp_free_i32(tmp); | ||
260 | + return true; | ||
261 | +} | ||
262 | + | ||
263 | static bool trans_VRINTX_sp(DisasContext *s, arg_VRINTX_sp *a) | ||
264 | { | ||
265 | TCGv_ptr fpst; | ||
266 | -- | ||
267 | 2.20.1 | ||
268 | |||
269 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | The fp16 extension includes a new instruction VINS, which copies the |
---|---|---|---|
2 | lower 16 bits of a 32-bit source VFP register into the upper 16 bits | ||
3 | of the destination. Implement it. | ||
2 | 4 | ||
3 | At the moment if the end-user does not specify the gic-version along | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | with KVM acceleration, v2 is set by default. However most of the | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | systems now have GICv3 and sometimes they do not support GICv2 | 7 | Message-id: 20200828183354.27913-20-peter.maydell@linaro.org |
6 | compatibility. | 8 | --- |
9 | target/arm/vfp-uncond.decode | 3 +++ | ||
10 | target/arm/translate-vfp.c.inc | 28 ++++++++++++++++++++++++++++ | ||
11 | 2 files changed, 31 insertions(+) | ||
7 | 12 | ||
8 | This patch keeps the default v2 selection in all cases except | 13 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode |
9 | in the KVM accelerated mode when either | ||
10 | - the host does not support GICv2 in-kernel emulation or | ||
11 | - number of VCPUS exceeds 8. | ||
12 | |||
13 | Those cases did not work anyway so we do not break any compatibility. | ||
14 | Now we get v3 selected in such a case. | ||
15 | |||
16 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | ||
17 | Reported-by: Dr. David Alan Gilbert <dgilbert@redhat.com> | ||
18 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
19 | Message-id: 20200311131618.7187-7-eric.auger@redhat.com | ||
20 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
21 | --- | ||
22 | hw/arm/virt.c | 17 ++++++++++++++++- | ||
23 | 1 file changed, 16 insertions(+), 1 deletion(-) | ||
24 | |||
25 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | ||
26 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
27 | --- a/hw/arm/virt.c | 15 | --- a/target/arm/vfp-uncond.decode |
28 | +++ b/hw/arm/virt.c | 16 | +++ b/target/arm/vfp-uncond.decode |
29 | @@ -XXX,XX +XXX,XX @@ static void virt_set_memmap(VirtMachineState *vms) | 17 | @@ -XXX,XX +XXX,XX @@ VCVT 1111 1110 1.11 11 rm:2 .... 1010 op:1 1.0 .... \ |
30 | */ | 18 | vm=%vm_sp vd=%vd_sp sz=2 |
31 | static void finalize_gic_version(VirtMachineState *vms) | 19 | VCVT 1111 1110 1.11 11 rm:2 .... 1011 op:1 1.0 .... \ |
32 | { | 20 | vm=%vm_dp vd=%vd_sp sz=3 |
33 | + unsigned int max_cpus = MACHINE(vms)->smp.max_cpus; | ||
34 | + | 21 | + |
35 | if (kvm_enabled()) { | 22 | +VINS 1111 1110 1.11 0000 .... 1010 11 . 0 .... \ |
36 | int probe_bitmap; | 23 | + vd=%vd_sp vm=%vm_sp |
37 | 24 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc | |
38 | @@ -XXX,XX +XXX,XX @@ static void finalize_gic_version(VirtMachineState *vms) | 25 | index XXXXXXX..XXXXXXX 100644 |
39 | } | 26 | --- a/target/arm/translate-vfp.c.inc |
40 | return; | 27 | +++ b/target/arm/translate-vfp.c.inc |
41 | case VIRT_GIC_VERSION_NOSEL: | 28 | @@ -XXX,XX +XXX,XX @@ static bool trans_NOCP(DisasContext *s, arg_NOCP *a) |
42 | - vms->gic_version = VIRT_GIC_VERSION_2; | 29 | |
43 | + if ((probe_bitmap & KVM_ARM_VGIC_V2) && max_cpus <= GIC_NCPU) { | 30 | return false; |
44 | + vms->gic_version = VIRT_GIC_VERSION_2; | 31 | } |
45 | + } else if (probe_bitmap & KVM_ARM_VGIC_V3) { | 32 | + |
46 | + /* | 33 | +static bool trans_VINS(DisasContext *s, arg_VINS *a) |
47 | + * in case the host does not support v2 in-kernel emulation or | 34 | +{ |
48 | + * the end-user requested more than 8 VCPUs we now default | 35 | + TCGv_i32 rd, rm; |
49 | + * to v3. In any case defaulting to v2 would be broken. | 36 | + |
50 | + */ | 37 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
51 | + vms->gic_version = VIRT_GIC_VERSION_3; | 38 | + return false; |
52 | + } else if (max_cpus > GIC_NCPU) { | 39 | + } |
53 | + error_report("host only supports in-kernel GICv2 emulation " | 40 | + |
54 | + "but more than 8 vcpus are requested"); | 41 | + if (s->vec_len != 0 || s->vec_stride != 0) { |
55 | + exit(1); | 42 | + return false; |
56 | + } | 43 | + } |
57 | break; | 44 | + |
58 | case VIRT_GIC_VERSION_2: | 45 | + if (!vfp_access_check(s)) { |
59 | case VIRT_GIC_VERSION_3: | 46 | + return true; |
47 | + } | ||
48 | + | ||
49 | + /* Insert low half of Vm into high half of Vd */ | ||
50 | + rm = tcg_temp_new_i32(); | ||
51 | + rd = tcg_temp_new_i32(); | ||
52 | + neon_load_reg32(rm, a->vm); | ||
53 | + neon_load_reg32(rd, a->vd); | ||
54 | + tcg_gen_deposit_i32(rd, rd, rm, 16, 16); | ||
55 | + neon_store_reg32(rd, a->vd); | ||
56 | + tcg_temp_free_i32(rm); | ||
57 | + tcg_temp_free_i32(rd); | ||
58 | + return true; | ||
59 | +} | ||
60 | -- | 60 | -- |
61 | 2.20.1 | 61 | 2.20.1 |
62 | 62 | ||
63 | 63 | diff view generated by jsdifflib |
1 | From: Guenter Roeck <linux@roeck-us.net> | 1 | The fp16 extension includes a new instruction VMOVX, which copies the |
---|---|---|---|
2 | upper 16 bits of a 32-bit source VFP register into the lower 16 | ||
3 | bits of the destination and zeroes the high half of the destination. | ||
4 | Implement it. | ||
2 | 5 | ||
3 | Wire up eSDHC controllers in fsl-imx25. For imx25-pdk, connect drives | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | provided on the command line to available eSDHC controllers. | 7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20200828183354.27913-21-peter.maydell@linaro.org | ||
9 | --- | ||
10 | target/arm/vfp-uncond.decode | 3 +++ | ||
11 | target/arm/translate-vfp.c.inc | 25 +++++++++++++++++++++++++ | ||
12 | 2 files changed, 28 insertions(+) | ||
5 | 13 | ||
6 | This patch enables booting the imx25-pdk emulation from SD card. | 14 | diff --git a/target/arm/vfp-uncond.decode b/target/arm/vfp-uncond.decode |
7 | |||
8 | Signed-off-by: Guenter Roeck <linux@roeck-us.net> | ||
9 | Message-id: 20200310215146.19688-2-linux@roeck-us.net | ||
10 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | [PMM: made commit subject consistent with other patch] | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | --- | ||
14 | include/hw/arm/fsl-imx25.h | 9 +++++++++ | ||
15 | hw/arm/fsl-imx25.c | 32 ++++++++++++++++++++++++++++++++ | ||
16 | hw/arm/imx25_pdk.c | 16 ++++++++++++++++ | ||
17 | 3 files changed, 57 insertions(+) | ||
18 | |||
19 | diff --git a/include/hw/arm/fsl-imx25.h b/include/hw/arm/fsl-imx25.h | ||
20 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
21 | --- a/include/hw/arm/fsl-imx25.h | 16 | --- a/target/arm/vfp-uncond.decode |
22 | +++ b/include/hw/arm/fsl-imx25.h | 17 | +++ b/target/arm/vfp-uncond.decode |
23 | @@ -XXX,XX +XXX,XX @@ | 18 | @@ -XXX,XX +XXX,XX @@ VCVT 1111 1110 1.11 11 rm:2 .... 1010 op:1 1.0 .... \ |
24 | #include "hw/misc/imx_rngc.h" | 19 | VCVT 1111 1110 1.11 11 rm:2 .... 1011 op:1 1.0 .... \ |
25 | #include "hw/i2c/imx_i2c.h" | 20 | vm=%vm_dp vd=%vd_sp sz=3 |
26 | #include "hw/gpio/imx_gpio.h" | 21 | |
27 | +#include "hw/sd/sdhci.h" | 22 | +VMOVX 1111 1110 1.11 0000 .... 1010 01 . 0 .... \ |
28 | #include "exec/memory.h" | 23 | + vd=%vd_sp vm=%vm_sp |
29 | #include "target/arm/cpu.h" | 24 | + |
30 | 25 | VINS 1111 1110 1.11 0000 .... 1010 11 . 0 .... \ | |
31 | @@ -XXX,XX +XXX,XX @@ | 26 | vd=%vd_sp vm=%vm_sp |
32 | #define FSL_IMX25_NUM_EPITS 2 | 27 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
33 | #define FSL_IMX25_NUM_I2CS 3 | ||
34 | #define FSL_IMX25_NUM_GPIOS 4 | ||
35 | +#define FSL_IMX25_NUM_ESDHCS 2 | ||
36 | |||
37 | typedef struct FslIMX25State { | ||
38 | /*< private >*/ | ||
39 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
40 | IMXRNGCState rngc; | ||
41 | IMXI2CState i2c[FSL_IMX25_NUM_I2CS]; | ||
42 | IMXGPIOState gpio[FSL_IMX25_NUM_GPIOS]; | ||
43 | + SDHCIState esdhc[FSL_IMX25_NUM_ESDHCS]; | ||
44 | MemoryRegion rom[2]; | ||
45 | MemoryRegion iram; | ||
46 | MemoryRegion iram_alias; | ||
47 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
48 | #define FSL_IMX25_GPIO3_SIZE 0x4000 | ||
49 | #define FSL_IMX25_RNGC_ADDR 0x53FB0000 | ||
50 | #define FSL_IMX25_RNGC_SIZE 0x4000 | ||
51 | +#define FSL_IMX25_ESDHC1_ADDR 0x53FB4000 | ||
52 | +#define FSL_IMX25_ESDHC1_SIZE 0x4000 | ||
53 | +#define FSL_IMX25_ESDHC2_ADDR 0x53FB8000 | ||
54 | +#define FSL_IMX25_ESDHC2_SIZE 0x4000 | ||
55 | #define FSL_IMX25_GPIO1_ADDR 0x53FCC000 | ||
56 | #define FSL_IMX25_GPIO1_SIZE 0x4000 | ||
57 | #define FSL_IMX25_GPIO2_ADDR 0x53FD0000 | ||
58 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
59 | #define FSL_IMX25_GPIO2_IRQ 51 | ||
60 | #define FSL_IMX25_GPIO3_IRQ 16 | ||
61 | #define FSL_IMX25_GPIO4_IRQ 23 | ||
62 | +#define FSL_IMX25_ESDHC1_IRQ 9 | ||
63 | +#define FSL_IMX25_ESDHC2_IRQ 8 | ||
64 | |||
65 | #endif /* FSL_IMX25_H */ | ||
66 | diff --git a/hw/arm/fsl-imx25.c b/hw/arm/fsl-imx25.c | ||
67 | index XXXXXXX..XXXXXXX 100644 | 28 | index XXXXXXX..XXXXXXX 100644 |
68 | --- a/hw/arm/fsl-imx25.c | 29 | --- a/target/arm/translate-vfp.c.inc |
69 | +++ b/hw/arm/fsl-imx25.c | 30 | +++ b/target/arm/translate-vfp.c.inc |
70 | @@ -XXX,XX +XXX,XX @@ | 31 | @@ -XXX,XX +XXX,XX @@ static bool trans_VINS(DisasContext *s, arg_VINS *a) |
71 | #include "hw/qdev-properties.h" | 32 | tcg_temp_free_i32(rd); |
72 | #include "chardev/char.h" | 33 | return true; |
73 | 34 | } | |
74 | +#define IMX25_ESDHC_CAPABILITIES 0x07e20000 | ||
75 | + | 35 | + |
76 | static void fsl_imx25_init(Object *obj) | 36 | +static bool trans_VMOVX(DisasContext *s, arg_VINS *a) |
77 | { | 37 | +{ |
78 | FslIMX25State *s = FSL_IMX25(obj); | 38 | + TCGv_i32 rm; |
79 | @@ -XXX,XX +XXX,XX @@ static void fsl_imx25_init(Object *obj) | ||
80 | sysbus_init_child_obj(obj, "gpio[*]", &s->gpio[i], sizeof(s->gpio[i]), | ||
81 | TYPE_IMX_GPIO); | ||
82 | } | ||
83 | + | 39 | + |
84 | + for (i = 0; i < FSL_IMX25_NUM_ESDHCS; i++) { | 40 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
85 | + sysbus_init_child_obj(obj, "sdhc[*]", &s->esdhc[i], sizeof(s->esdhc[i]), | 41 | + return false; |
86 | + TYPE_IMX_USDHC); | ||
87 | + } | ||
88 | } | ||
89 | |||
90 | static void fsl_imx25_realize(DeviceState *dev, Error **errp) | ||
91 | @@ -XXX,XX +XXX,XX @@ static void fsl_imx25_realize(DeviceState *dev, Error **errp) | ||
92 | gpio_table[i].irq)); | ||
93 | } | ||
94 | |||
95 | + /* Initialize all SDHC */ | ||
96 | + for (i = 0; i < FSL_IMX25_NUM_ESDHCS; i++) { | ||
97 | + static const struct { | ||
98 | + hwaddr addr; | ||
99 | + unsigned int irq; | ||
100 | + } esdhc_table[FSL_IMX25_NUM_ESDHCS] = { | ||
101 | + { FSL_IMX25_ESDHC1_ADDR, FSL_IMX25_ESDHC1_IRQ }, | ||
102 | + { FSL_IMX25_ESDHC2_ADDR, FSL_IMX25_ESDHC2_IRQ }, | ||
103 | + }; | ||
104 | + | ||
105 | + object_property_set_uint(OBJECT(&s->esdhc[i]), 2, "sd-spec-version", | ||
106 | + &err); | ||
107 | + object_property_set_uint(OBJECT(&s->esdhc[i]), IMX25_ESDHC_CAPABILITIES, | ||
108 | + "capareg", &err); | ||
109 | + object_property_set_bool(OBJECT(&s->esdhc[i]), true, "realized", &err); | ||
110 | + if (err) { | ||
111 | + error_propagate(errp, err); | ||
112 | + return; | ||
113 | + } | ||
114 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->esdhc[i]), 0, esdhc_table[i].addr); | ||
115 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->esdhc[i]), 0, | ||
116 | + qdev_get_gpio_in(DEVICE(&s->avic), | ||
117 | + esdhc_table[i].irq)); | ||
118 | + } | 42 | + } |
119 | + | 43 | + |
120 | /* initialize 2 x 16 KB ROM */ | 44 | + if (s->vec_len != 0 || s->vec_stride != 0) { |
121 | memory_region_init_rom(&s->rom[0], NULL, | 45 | + return false; |
122 | "imx25.rom0", FSL_IMX25_ROM0_SIZE, &err); | ||
123 | diff --git a/hw/arm/imx25_pdk.c b/hw/arm/imx25_pdk.c | ||
124 | index XXXXXXX..XXXXXXX 100644 | ||
125 | --- a/hw/arm/imx25_pdk.c | ||
126 | +++ b/hw/arm/imx25_pdk.c | ||
127 | @@ -XXX,XX +XXX,XX @@ | ||
128 | #include "qemu/osdep.h" | ||
129 | #include "qapi/error.h" | ||
130 | #include "cpu.h" | ||
131 | +#include "hw/qdev-properties.h" | ||
132 | #include "hw/arm/fsl-imx25.h" | ||
133 | #include "hw/boards.h" | ||
134 | #include "qemu/error-report.h" | ||
135 | @@ -XXX,XX +XXX,XX @@ static void imx25_pdk_init(MachineState *machine) | ||
136 | imx25_pdk_binfo.board_id = 1771, | ||
137 | imx25_pdk_binfo.nb_cpus = 1; | ||
138 | |||
139 | + for (i = 0; i < FSL_IMX25_NUM_ESDHCS; i++) { | ||
140 | + BusState *bus; | ||
141 | + DeviceState *carddev; | ||
142 | + DriveInfo *di; | ||
143 | + BlockBackend *blk; | ||
144 | + | ||
145 | + di = drive_get_next(IF_SD); | ||
146 | + blk = di ? blk_by_legacy_dinfo(di) : NULL; | ||
147 | + bus = qdev_get_child_bus(DEVICE(&s->soc.esdhc[i]), "sd-bus"); | ||
148 | + carddev = qdev_create(bus, TYPE_SD_CARD); | ||
149 | + qdev_prop_set_drive(carddev, "drive", blk, &error_fatal); | ||
150 | + object_property_set_bool(OBJECT(carddev), true, | ||
151 | + "realized", &error_fatal); | ||
152 | + } | 46 | + } |
153 | + | 47 | + |
154 | /* | 48 | + if (!vfp_access_check(s)) { |
155 | * We test explicitly for qtest here as it is not done (yet?) in | 49 | + return true; |
156 | * arm_load_kernel(). Without this the "make check" command would | 50 | + } |
51 | + | ||
52 | + /* Set Vd to high half of Vm */ | ||
53 | + rm = tcg_temp_new_i32(); | ||
54 | + neon_load_reg32(rm, a->vm); | ||
55 | + tcg_gen_shri_i32(rm, rm, 16); | ||
56 | + neon_store_reg32(rm, a->vd); | ||
57 | + tcg_temp_free_i32(rm); | ||
58 | + return true; | ||
59 | +} | ||
157 | -- | 60 | -- |
158 | 2.20.1 | 61 | 2.20.1 |
159 | 62 | ||
160 | 63 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Implement the VFP fp16 variant of VMOV that transfers a 16-bit |
---|---|---|---|
2 | value between a general purpose register and a VFP register. | ||
2 | 3 | ||
3 | The Xunlong Orange Pi PC is an Allwinner H3 System on Chip | 4 | Note that Rt == 15 is UNPREDICTABLE; since this insn is v8 and later |
4 | based embedded computer with mainline support in both U-Boot | 5 | only we have no need to replicate the old "updates CPSR.NZCV" |
5 | and Linux. The board comes with a Quad Core Cortex A7 @ 1.3GHz, | 6 | behaviour that the singleprec version of this insn does. |
6 | 1GiB RAM, 100Mbit ethernet, USB, SD/MMC, USB, HDMI and | ||
7 | various other I/O. This commit add support for the Xunlong | ||
8 | Orange Pi PC machine. | ||
9 | 7 | ||
10 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
11 | Tested-by: KONRAD Frederic <frederic.konrad@adacore.com> | ||
12 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
13 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
14 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
15 | Acked-by: Igor Mammedov <imammedo@redhat.com> | ||
16 | Message-id: 20200311221854.30370-3-nieklinnenbank@gmail.com | ||
17 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | Message-id: 20200828183354.27913-22-peter.maydell@linaro.org | ||
18 | --- | 11 | --- |
19 | hw/arm/Makefile.objs | 2 +- | 12 | target/arm/vfp.decode | 1 + |
20 | hw/arm/orangepi.c | 92 ++++++++++++++++++++++++++++++++++++++++++++ | 13 | target/arm/translate-vfp.c.inc | 34 ++++++++++++++++++++++++++++++++++ |
21 | MAINTAINERS | 1 + | 14 | 2 files changed, 35 insertions(+) |
22 | 3 files changed, 94 insertions(+), 1 deletion(-) | ||
23 | create mode 100644 hw/arm/orangepi.c | ||
24 | 15 | ||
25 | diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs | 16 | diff --git a/target/arm/vfp.decode b/target/arm/vfp.decode |
26 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
27 | --- a/hw/arm/Makefile.objs | 18 | --- a/target/arm/vfp.decode |
28 | +++ b/hw/arm/Makefile.objs | 19 | +++ b/target/arm/vfp.decode |
29 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_DIGIC) += digic.o | 20 | @@ -XXX,XX +XXX,XX @@ VDUP ---- 1110 1 b:1 q:1 0 .... rt:4 1011 . 0 e:1 1 0000 \ |
30 | obj-$(CONFIG_OMAP) += omap1.o omap2.o | 21 | vn=%vn_dp |
31 | obj-$(CONFIG_STRONGARM) += strongarm.o | 22 | |
32 | obj-$(CONFIG_ALLWINNER_A10) += allwinner-a10.o cubieboard.o | 23 | VMSR_VMRS ---- 1110 111 l:1 reg:4 rt:4 1010 0001 0000 |
33 | -obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3.o | 24 | +VMOV_half ---- 1110 000 l:1 .... rt:4 1001 . 001 0000 vn=%vn_sp |
34 | +obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3.o orangepi.o | 25 | VMOV_single ---- 1110 000 l:1 .... rt:4 1010 . 001 0000 vn=%vn_sp |
35 | obj-$(CONFIG_RASPI) += bcm2835_peripherals.o bcm2836.o raspi.o | 26 | |
36 | obj-$(CONFIG_STM32F205_SOC) += stm32f205_soc.o | 27 | VMOV_64_sp ---- 1100 010 op:1 rt2:4 rt:4 1010 00.1 .... vm=%vm_sp |
37 | obj-$(CONFIG_STM32F405_SOC) += stm32f405_soc.o | 28 | diff --git a/target/arm/translate-vfp.c.inc b/target/arm/translate-vfp.c.inc |
38 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | 29 | index XXXXXXX..XXXXXXX 100644 |
39 | new file mode 100644 | 30 | --- a/target/arm/translate-vfp.c.inc |
40 | index XXXXXXX..XXXXXXX | 31 | +++ b/target/arm/translate-vfp.c.inc |
41 | --- /dev/null | 32 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMSR_VMRS(DisasContext *s, arg_VMSR_VMRS *a) |
42 | +++ b/hw/arm/orangepi.c | 33 | return true; |
43 | @@ -XXX,XX +XXX,XX @@ | 34 | } |
44 | +/* | 35 | |
45 | + * Orange Pi emulation | 36 | +static bool trans_VMOV_half(DisasContext *s, arg_VMOV_single *a) |
46 | + * | 37 | +{ |
47 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | 38 | + TCGv_i32 tmp; |
48 | + * | ||
49 | + * This program is free software: you can redistribute it and/or modify | ||
50 | + * it under the terms of the GNU General Public License as published by | ||
51 | + * the Free Software Foundation, either version 2 of the License, or | ||
52 | + * (at your option) any later version. | ||
53 | + * | ||
54 | + * This program is distributed in the hope that it will be useful, | ||
55 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
56 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
57 | + * GNU General Public License for more details. | ||
58 | + * | ||
59 | + * You should have received a copy of the GNU General Public License | ||
60 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
61 | + */ | ||
62 | + | 39 | + |
63 | +#include "qemu/osdep.h" | 40 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
64 | +#include "qemu/units.h" | 41 | + return false; |
65 | +#include "exec/address-spaces.h" | ||
66 | +#include "qapi/error.h" | ||
67 | +#include "cpu.h" | ||
68 | +#include "hw/sysbus.h" | ||
69 | +#include "hw/boards.h" | ||
70 | +#include "hw/qdev-properties.h" | ||
71 | +#include "hw/arm/allwinner-h3.h" | ||
72 | +#include "sysemu/sysemu.h" | ||
73 | + | ||
74 | +static struct arm_boot_info orangepi_binfo = { | ||
75 | + .nb_cpus = AW_H3_NUM_CPUS, | ||
76 | +}; | ||
77 | + | ||
78 | +static void orangepi_init(MachineState *machine) | ||
79 | +{ | ||
80 | + AwH3State *h3; | ||
81 | + | ||
82 | + /* BIOS is not supported by this board */ | ||
83 | + if (bios_name) { | ||
84 | + error_report("BIOS not supported for this machine"); | ||
85 | + exit(1); | ||
86 | + } | 42 | + } |
87 | + | 43 | + |
88 | + /* This board has fixed size RAM */ | 44 | + if (a->rt == 15) { |
89 | + if (machine->ram_size != 1 * GiB) { | 45 | + /* UNPREDICTABLE; we choose to UNDEF */ |
90 | + error_report("This machine can only be used with 1GiB of RAM"); | 46 | + return false; |
91 | + exit(1); | ||
92 | + } | 47 | + } |
93 | + | 48 | + |
94 | + /* Only allow Cortex-A7 for this board */ | 49 | + if (!vfp_access_check(s)) { |
95 | + if (strcmp(machine->cpu_type, ARM_CPU_TYPE_NAME("cortex-a7")) != 0) { | 50 | + return true; |
96 | + error_report("This board can only be used with cortex-a7 CPU"); | ||
97 | + exit(1); | ||
98 | + } | 51 | + } |
99 | + | 52 | + |
100 | + h3 = AW_H3(object_new(TYPE_AW_H3)); | 53 | + if (a->l) { |
101 | + object_property_add_child(OBJECT(machine), "soc", OBJECT(h3), | 54 | + /* VFP to general purpose register */ |
102 | + &error_abort); | 55 | + tmp = tcg_temp_new_i32(); |
103 | + object_unref(OBJECT(h3)); | 56 | + neon_load_reg32(tmp, a->vn); |
57 | + tcg_gen_andi_i32(tmp, tmp, 0xffff); | ||
58 | + store_reg(s, a->rt, tmp); | ||
59 | + } else { | ||
60 | + /* general purpose register to VFP */ | ||
61 | + tmp = load_reg(s, a->rt); | ||
62 | + tcg_gen_andi_i32(tmp, tmp, 0xffff); | ||
63 | + neon_store_reg32(tmp, a->vn); | ||
64 | + tcg_temp_free_i32(tmp); | ||
65 | + } | ||
104 | + | 66 | + |
105 | + /* Setup timer properties */ | 67 | + return true; |
106 | + object_property_set_int(OBJECT(h3), 32768, "clk0-freq", | ||
107 | + &error_abort); | ||
108 | + object_property_set_int(OBJECT(h3), 24 * 1000 * 1000, "clk1-freq", | ||
109 | + &error_abort); | ||
110 | + | ||
111 | + /* Mark H3 object realized */ | ||
112 | + object_property_set_bool(OBJECT(h3), true, "realized", &error_abort); | ||
113 | + | ||
114 | + /* SDRAM */ | ||
115 | + memory_region_add_subregion(get_system_memory(), h3->memmap[AW_H3_SDRAM], | ||
116 | + machine->ram); | ||
117 | + | ||
118 | + orangepi_binfo.loader_start = h3->memmap[AW_H3_SDRAM]; | ||
119 | + orangepi_binfo.ram_size = machine->ram_size; | ||
120 | + arm_load_kernel(ARM_CPU(first_cpu), machine, &orangepi_binfo); | ||
121 | +} | 68 | +} |
122 | + | 69 | + |
123 | +static void orangepi_machine_init(MachineClass *mc) | 70 | static bool trans_VMOV_single(DisasContext *s, arg_VMOV_single *a) |
124 | +{ | 71 | { |
125 | + mc->desc = "Orange Pi PC"; | 72 | TCGv_i32 tmp; |
126 | + mc->init = orangepi_init; | ||
127 | + mc->min_cpus = AW_H3_NUM_CPUS; | ||
128 | + mc->max_cpus = AW_H3_NUM_CPUS; | ||
129 | + mc->default_cpus = AW_H3_NUM_CPUS; | ||
130 | + mc->default_cpu_type = ARM_CPU_TYPE_NAME("cortex-a7"); | ||
131 | + mc->default_ram_size = 1 * GiB; | ||
132 | + mc->default_ram_id = "orangepi.ram"; | ||
133 | +} | ||
134 | + | ||
135 | +DEFINE_MACHINE("orangepi-pc", orangepi_machine_init) | ||
136 | diff --git a/MAINTAINERS b/MAINTAINERS | ||
137 | index XXXXXXX..XXXXXXX 100644 | ||
138 | --- a/MAINTAINERS | ||
139 | +++ b/MAINTAINERS | ||
140 | @@ -XXX,XX +XXX,XX @@ L: qemu-arm@nongnu.org | ||
141 | S: Maintained | ||
142 | F: hw/*/allwinner-h3* | ||
143 | F: include/hw/*/allwinner-h3* | ||
144 | +F: hw/arm/orangepi.c | ||
145 | |||
146 | ARM PrimeCell and CMSDK devices | ||
147 | M: Peter Maydell <peter.maydell@linaro.org> | ||
148 | -- | 73 | -- |
149 | 2.20.1 | 74 | 2.20.1 |
150 | 75 | ||
151 | 76 | diff view generated by jsdifflib |
1 | A write to the CONTROL register can change our current EL (by | 1 | Implement FP16 support for the Neon insns which use the DO_3S_FP_GVEC |
---|---|---|---|
2 | writing to the nPRIV bit). That means that we can't assume | 2 | macro: VADD, VSUB, VABD, VMUL. |
3 | that s->current_el is still valid in trans_MSR_v7m() when | ||
4 | we try to rebuild the hflags. | ||
5 | 3 | ||
6 | Add a new helper rebuild_hflags_m32_newel() which, like the | 4 | For VABD this requires us to implement a new gvec_fabd_h helper |
7 | existing rebuild_hflags_a32_newel(), recalculates the current | 5 | using the machinery we have already for the other helpers. |
8 | EL from scratch, and use it in trans_MSR_v7m(). | ||
9 | |||
10 | This fixes an assertion about an hflags mismatch when the | ||
11 | guest changes privilege by writing to CONTROL. | ||
12 | 6 | ||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
14 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
15 | Message-id: 20200303174950.3298-4-peter.maydell@linaro.org | 9 | Message-id: 20200828183354.27913-24-peter.maydell@linaro.org |
16 | --- | 10 | --- |
17 | target/arm/helper.h | 1 + | 11 | target/arm/helper.h | 1 + |
18 | target/arm/helper.c | 12 ++++++++++++ | 12 | target/arm/vec_helper.c | 6 ++++++ |
19 | target/arm/translate.c | 7 +++---- | 13 | target/arm/translate-neon.c.inc | 36 +++++++++++++++++---------------- |
20 | 3 files changed, 16 insertions(+), 4 deletions(-) | 14 | 3 files changed, 26 insertions(+), 17 deletions(-) |
21 | 15 | ||
22 | diff --git a/target/arm/helper.h b/target/arm/helper.h | 16 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
23 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
24 | --- a/target/arm/helper.h | 18 | --- a/target/arm/helper.h |
25 | +++ b/target/arm/helper.h | 19 | +++ b/target/arm/helper.h |
26 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(msr_banked, void, env, i32, i32, i32) | 20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmul_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
27 | DEF_HELPER_2(get_user_reg, i32, env, i32) | 21 | DEF_HELPER_FLAGS_5(gvec_fmul_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
28 | DEF_HELPER_3(set_user_reg, void, env, i32, i32) | 22 | DEF_HELPER_FLAGS_5(gvec_fmul_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
29 | 23 | ||
30 | +DEF_HELPER_FLAGS_1(rebuild_hflags_m32_newel, TCG_CALL_NO_RWG, void, env) | 24 | +DEF_HELPER_FLAGS_5(gvec_fabd_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
31 | DEF_HELPER_FLAGS_2(rebuild_hflags_m32, TCG_CALL_NO_RWG, void, env, int) | 25 | DEF_HELPER_FLAGS_5(gvec_fabd_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
32 | DEF_HELPER_FLAGS_1(rebuild_hflags_a32_newel, TCG_CALL_NO_RWG, void, env) | 26 | |
33 | DEF_HELPER_FLAGS_2(rebuild_hflags_a32, TCG_CALL_NO_RWG, void, env, int) | 27 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, |
34 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 28 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
35 | index XXXXXXX..XXXXXXX 100644 | 29 | index XXXXXXX..XXXXXXX 100644 |
36 | --- a/target/arm/helper.c | 30 | --- a/target/arm/vec_helper.c |
37 | +++ b/target/arm/helper.c | 31 | +++ b/target/arm/vec_helper.c |
38 | @@ -XXX,XX +XXX,XX @@ void arm_rebuild_hflags(CPUARMState *env) | 32 | @@ -XXX,XX +XXX,XX @@ static float64 float64_ftsmul(float64 op1, uint64_t op2, float_status *stat) |
39 | env->hflags = rebuild_hflags_internal(env); | 33 | return result; |
40 | } | 34 | } |
41 | 35 | ||
42 | +/* | 36 | +static float16 float16_abd(float16 op1, float16 op2, float_status *stat) |
43 | + * If we have triggered a EL state change we can't rely on the | ||
44 | + * translator having passed it to us, we need to recompute. | ||
45 | + */ | ||
46 | +void HELPER(rebuild_hflags_m32_newel)(CPUARMState *env) | ||
47 | +{ | 37 | +{ |
48 | + int el = arm_current_el(env); | 38 | + return float16_abs(float16_sub(op1, op2, stat)); |
49 | + int fp_el = fp_exception_el(env, el); | ||
50 | + ARMMMUIdx mmu_idx = arm_mmu_idx_el(env, el); | ||
51 | + env->hflags = rebuild_hflags_m32(env, fp_el, mmu_idx); | ||
52 | +} | 39 | +} |
53 | + | 40 | + |
54 | void HELPER(rebuild_hflags_m32)(CPUARMState *env, int el) | 41 | static float32 float32_abd(float32 op1, float32 op2, float_status *stat) |
55 | { | 42 | { |
56 | int fp_el = fp_exception_el(env, el); | 43 | return float32_abs(float32_sub(op1, op2, stat)); |
57 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 44 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_ftsmul_h, float16_ftsmul, float16) |
45 | DO_3OP(gvec_ftsmul_s, float32_ftsmul, float32) | ||
46 | DO_3OP(gvec_ftsmul_d, float64_ftsmul, float64) | ||
47 | |||
48 | +DO_3OP(gvec_fabd_h, float16_abd, float16) | ||
49 | DO_3OP(gvec_fabd_s, float32_abd, float32) | ||
50 | |||
51 | #ifdef TARGET_AARCH64 | ||
52 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
58 | index XXXXXXX..XXXXXXX 100644 | 53 | index XXXXXXX..XXXXXXX 100644 |
59 | --- a/target/arm/translate.c | 54 | --- a/target/arm/translate-neon.c.inc |
60 | +++ b/target/arm/translate.c | 55 | +++ b/target/arm/translate-neon.c.inc |
61 | @@ -XXX,XX +XXX,XX @@ static bool trans_MRS_v7m(DisasContext *s, arg_MRS_v7m *a) | 56 | @@ -XXX,XX +XXX,XX @@ static bool do_3same_fp(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn, |
62 | |||
63 | static bool trans_MSR_v7m(DisasContext *s, arg_MSR_v7m *a) | ||
64 | { | ||
65 | - TCGv_i32 addr, reg, el; | ||
66 | + TCGv_i32 addr, reg; | ||
67 | |||
68 | if (!arm_dc_feature(s, ARM_FEATURE_M)) { | ||
69 | return false; | ||
70 | @@ -XXX,XX +XXX,XX @@ static bool trans_MSR_v7m(DisasContext *s, arg_MSR_v7m *a) | ||
71 | gen_helper_v7m_msr(cpu_env, addr, reg); | ||
72 | tcg_temp_free_i32(addr); | ||
73 | tcg_temp_free_i32(reg); | ||
74 | - el = tcg_const_i32(s->current_el); | ||
75 | - gen_helper_rebuild_hflags_m32(cpu_env, el); | ||
76 | - tcg_temp_free_i32(el); | ||
77 | + /* If we wrote to CONTROL, the EL might have changed */ | ||
78 | + gen_helper_rebuild_hflags_m32_newel(cpu_env); | ||
79 | gen_lookup_tb(s); | ||
80 | return true; | 57 | return true; |
81 | } | 58 | } |
59 | |||
60 | -/* | ||
61 | - * For all the functions using this macro, size == 1 means fp16, | ||
62 | - * which is an architecture extension we don't implement yet. | ||
63 | - */ | ||
64 | -#define DO_3S_FP_GVEC(INSN,FUNC) \ | ||
65 | - static void gen_##INSN##_3s(unsigned vece, uint32_t rd_ofs, \ | ||
66 | - uint32_t rn_ofs, uint32_t rm_ofs, \ | ||
67 | - uint32_t oprsz, uint32_t maxsz) \ | ||
68 | +#define WRAP_FP_GVEC(WRAPNAME, FPST, FUNC) \ | ||
69 | + static void WRAPNAME(unsigned vece, uint32_t rd_ofs, \ | ||
70 | + uint32_t rn_ofs, uint32_t rm_ofs, \ | ||
71 | + uint32_t oprsz, uint32_t maxsz) \ | ||
72 | { \ | ||
73 | - TCGv_ptr fpst = fpstatus_ptr(FPST_STD); \ | ||
74 | + TCGv_ptr fpst = fpstatus_ptr(FPST); \ | ||
75 | tcg_gen_gvec_3_ptr(rd_ofs, rn_ofs, rm_ofs, fpst, \ | ||
76 | oprsz, maxsz, 0, FUNC); \ | ||
77 | tcg_temp_free_ptr(fpst); \ | ||
78 | - } \ | ||
79 | + } | ||
80 | + | ||
81 | +#define DO_3S_FP_GVEC(INSN,SFUNC,HFUNC) \ | ||
82 | + WRAP_FP_GVEC(gen_##INSN##_fp32_3s, FPST_STD, SFUNC) \ | ||
83 | + WRAP_FP_GVEC(gen_##INSN##_fp16_3s, FPST_STD_F16, HFUNC) \ | ||
84 | static bool trans_##INSN##_fp_3s(DisasContext *s, arg_3same *a) \ | ||
85 | { \ | ||
86 | if (a->size != 0) { \ | ||
87 | - /* TODO fp16 support */ \ | ||
88 | - return false; \ | ||
89 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { \ | ||
90 | + return false; \ | ||
91 | + } \ | ||
92 | + return do_3same(s, a, gen_##INSN##_fp16_3s); \ | ||
93 | } \ | ||
94 | - return do_3same(s, a, gen_##INSN##_3s); \ | ||
95 | + return do_3same(s, a, gen_##INSN##_fp32_3s); \ | ||
96 | } | ||
97 | |||
98 | |||
99 | -DO_3S_FP_GVEC(VADD, gen_helper_gvec_fadd_s) | ||
100 | -DO_3S_FP_GVEC(VSUB, gen_helper_gvec_fsub_s) | ||
101 | -DO_3S_FP_GVEC(VABD, gen_helper_gvec_fabd_s) | ||
102 | -DO_3S_FP_GVEC(VMUL, gen_helper_gvec_fmul_s) | ||
103 | +DO_3S_FP_GVEC(VADD, gen_helper_gvec_fadd_s, gen_helper_gvec_fadd_h) | ||
104 | +DO_3S_FP_GVEC(VSUB, gen_helper_gvec_fsub_s, gen_helper_gvec_fsub_h) | ||
105 | +DO_3S_FP_GVEC(VABD, gen_helper_gvec_fabd_s, gen_helper_gvec_fabd_h) | ||
106 | +DO_3S_FP_GVEC(VMUL, gen_helper_gvec_fmul_s, gen_helper_gvec_fmul_h) | ||
107 | |||
108 | /* | ||
109 | * For all the functions using this macro, size == 1 means fp16, | ||
82 | -- | 110 | -- |
83 | 2.20.1 | 111 | 2.20.1 |
84 | 112 | ||
85 | 113 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | We already have gvec helpers for floating point VRECPE and |
---|---|---|---|
2 | VRQSRTE, so convert the Neon decoder to use them and | ||
3 | add the fp16 support. | ||
2 | 4 | ||
3 | Mention 'max' value in the gic-version property description. | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20200828183354.27913-25-peter.maydell@linaro.org | ||
8 | --- | ||
9 | target/arm/translate-neon.c.inc | 31 +++++++++++++++++++++++++++++-- | ||
10 | 1 file changed, 29 insertions(+), 2 deletions(-) | ||
4 | 11 | ||
5 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | 12 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
8 | Message-id: 20200311131618.7187-2-eric.auger@redhat.com | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | hw/arm/virt.c | 3 ++- | ||
12 | 1 file changed, 2 insertions(+), 1 deletion(-) | ||
13 | |||
14 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/hw/arm/virt.c | 14 | --- a/target/arm/translate-neon.c.inc |
17 | +++ b/hw/arm/virt.c | 15 | +++ b/target/arm/translate-neon.c.inc |
18 | @@ -XXX,XX +XXX,XX @@ static void virt_instance_init(Object *obj) | 16 | @@ -XXX,XX +XXX,XX @@ static bool do_2misc_fp(DisasContext *s, arg_2misc *a, |
19 | virt_set_gic_version, NULL); | 17 | return do_2misc_fp(s, a, FUNC); \ |
20 | object_property_set_description(obj, "gic-version", | 18 | } |
21 | "Set GIC version. " | 19 | |
22 | - "Valid values are 2, 3 and host", NULL); | 20 | -DO_2MISC_FP(VRECPE_F, gen_helper_recpe_f32) |
23 | + "Valid values are 2, 3, host and max", | 21 | -DO_2MISC_FP(VRSQRTE_F, gen_helper_rsqrte_f32) |
24 | + NULL); | 22 | DO_2MISC_FP(VCVT_FS, gen_helper_vfp_sitos) |
25 | 23 | DO_2MISC_FP(VCVT_FU, gen_helper_vfp_uitos) | |
26 | vms->highmem_ecam = !vmc->no_highmem_ecam; | 24 | DO_2MISC_FP(VCVT_SF, gen_helper_vfp_tosizs) |
27 | 25 | DO_2MISC_FP(VCVT_UF, gen_helper_vfp_touizs) | |
26 | |||
27 | +#define DO_2MISC_FP_VEC(INSN, HFUNC, SFUNC) \ | ||
28 | + static void gen_##INSN(unsigned vece, uint32_t rd_ofs, \ | ||
29 | + uint32_t rm_ofs, \ | ||
30 | + uint32_t oprsz, uint32_t maxsz) \ | ||
31 | + { \ | ||
32 | + static gen_helper_gvec_2_ptr * const fns[4] = { \ | ||
33 | + NULL, HFUNC, SFUNC, NULL, \ | ||
34 | + }; \ | ||
35 | + TCGv_ptr fpst; \ | ||
36 | + fpst = fpstatus_ptr(vece == MO_16 ? FPST_STD_F16 : FPST_STD); \ | ||
37 | + tcg_gen_gvec_2_ptr(rd_ofs, rm_ofs, fpst, oprsz, maxsz, 0, \ | ||
38 | + fns[vece]); \ | ||
39 | + tcg_temp_free_ptr(fpst); \ | ||
40 | + } \ | ||
41 | + static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ | ||
42 | + { \ | ||
43 | + if (a->size == MO_16) { \ | ||
44 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { \ | ||
45 | + return false; \ | ||
46 | + } \ | ||
47 | + } else if (a->size != MO_32) { \ | ||
48 | + return false; \ | ||
49 | + } \ | ||
50 | + return do_2misc_vec(s, a, gen_##INSN); \ | ||
51 | + } | ||
52 | + | ||
53 | +DO_2MISC_FP_VEC(VRECPE_F, gen_helper_gvec_frecpe_h, gen_helper_gvec_frecpe_s) | ||
54 | +DO_2MISC_FP_VEC(VRSQRTE_F, gen_helper_gvec_frsqrte_h, gen_helper_gvec_frsqrte_s) | ||
55 | + | ||
56 | static bool trans_VRINTX(DisasContext *s, arg_2misc *a) | ||
57 | { | ||
58 | if (!arm_dc_feature(s, ARM_FEATURE_V8)) { | ||
28 | -- | 59 | -- |
29 | 2.20.1 | 60 | 2.20.1 |
30 | 61 | ||
31 | 62 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | Rewrite Neon VABS/VNEG of floats to use gvec logical AND and XOR, so |
---|---|---|---|
2 | that we can implement the fp16 version of the insns. | ||
2 | 3 | ||
3 | Convert kvm_arm_vgic_probe() so that it returns a | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | bitmap of supported in-kernel emulation VGIC versions instead | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | of the max version: at the moment values can be v2 and v3. | 6 | Message-id: 20200828183354.27913-26-peter.maydell@linaro.org |
6 | This allows to expose the case where the host GICv3 also | 7 | --- |
7 | supports GICv2 emulation. This will be useful to choose the | 8 | target/arm/translate-neon.c.inc | 34 +++++++++++++++++++++++++++------ |
8 | default version in KVM accelerated mode. | 9 | 1 file changed, 28 insertions(+), 6 deletions(-) |
9 | 10 | ||
10 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | 11 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
11 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
12 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
13 | Message-id: 20200311131618.7187-5-eric.auger@redhat.com | ||
14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
15 | --- | ||
16 | target/arm/kvm_arm.h | 3 +++ | ||
17 | hw/arm/virt.c | 11 +++++++++-- | ||
18 | target/arm/kvm.c | 14 ++++++++------ | ||
19 | 3 files changed, 20 insertions(+), 8 deletions(-) | ||
20 | |||
21 | diff --git a/target/arm/kvm_arm.h b/target/arm/kvm_arm.h | ||
22 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
23 | --- a/target/arm/kvm_arm.h | 13 | --- a/target/arm/translate-neon.c.inc |
24 | +++ b/target/arm/kvm_arm.h | 14 | +++ b/target/arm/translate-neon.c.inc |
25 | @@ -XXX,XX +XXX,XX @@ | 15 | @@ -XXX,XX +XXX,XX @@ static bool trans_VCNT(DisasContext *s, arg_2misc *a) |
26 | #include "exec/memory.h" | 16 | return do_2misc(s, a, gen_helper_neon_cnt_u8); |
27 | #include "qemu/error-report.h" | 17 | } |
28 | 18 | ||
29 | +#define KVM_ARM_VGIC_V2 (1 << 0) | 19 | +static void gen_VABS_F(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs, |
30 | +#define KVM_ARM_VGIC_V3 (1 << 1) | 20 | + uint32_t oprsz, uint32_t maxsz) |
21 | +{ | ||
22 | + tcg_gen_gvec_andi(vece, rd_ofs, rm_ofs, | ||
23 | + vece == MO_16 ? 0x7fff : 0x7fffffff, | ||
24 | + oprsz, maxsz); | ||
25 | +} | ||
31 | + | 26 | + |
32 | /** | 27 | static bool trans_VABS_F(DisasContext *s, arg_2misc *a) |
33 | * kvm_arm_vcpu_init: | 28 | { |
34 | * @cs: CPUState | 29 | - if (a->size != 2) { |
35 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | 30 | + if (a->size == MO_16) { |
36 | index XXXXXXX..XXXXXXX 100644 | 31 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
37 | --- a/hw/arm/virt.c | 32 | + return false; |
38 | +++ b/hw/arm/virt.c | 33 | + } |
39 | @@ -XXX,XX +XXX,XX @@ static void finalize_gic_version(VirtMachineState *vms) | 34 | + } else if (a->size != MO_32) { |
40 | vms->gic_version = VIRT_GIC_VERSION_3; | 35 | return false; |
41 | } | 36 | } |
42 | } else { | 37 | - /* TODO: FP16 : size == 1 */ |
43 | - vms->gic_version = kvm_arm_vgic_probe(); | 38 | - return do_2misc(s, a, gen_helper_vfp_abss); |
44 | - if (!vms->gic_version) { | 39 | + return do_2misc_vec(s, a, gen_VABS_F); |
45 | + int probe_bitmap = kvm_arm_vgic_probe(); | 40 | +} |
46 | + | 41 | + |
47 | + if (!probe_bitmap) { | 42 | +static void gen_VNEG_F(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs, |
48 | error_report( | 43 | + uint32_t oprsz, uint32_t maxsz) |
49 | "Unable to determine GIC version supported by host"); | 44 | +{ |
50 | exit(1); | 45 | + tcg_gen_gvec_xori(vece, rd_ofs, rm_ofs, |
51 | + } else { | 46 | + vece == MO_16 ? 0x8000 : 0x80000000, |
52 | + if (probe_bitmap & KVM_ARM_VGIC_V3) { | 47 | + oprsz, maxsz); |
53 | + vms->gic_version = VIRT_GIC_VERSION_3; | 48 | } |
54 | + } else { | 49 | |
55 | + vms->gic_version = VIRT_GIC_VERSION_2; | 50 | static bool trans_VNEG_F(DisasContext *s, arg_2misc *a) |
56 | + } | ||
57 | } | ||
58 | } | ||
59 | } else if (vms->gic_version == VIRT_GIC_VERSION_NOSEL) { | ||
60 | diff --git a/target/arm/kvm.c b/target/arm/kvm.c | ||
61 | index XXXXXXX..XXXXXXX 100644 | ||
62 | --- a/target/arm/kvm.c | ||
63 | +++ b/target/arm/kvm.c | ||
64 | @@ -XXX,XX +XXX,XX @@ int kvm_arch_irqchip_create(KVMState *s) | ||
65 | |||
66 | int kvm_arm_vgic_probe(void) | ||
67 | { | 51 | { |
68 | + int val = 0; | 52 | - if (a->size != 2) { |
69 | + | 53 | + if (a->size == MO_16) { |
70 | if (kvm_create_device(kvm_state, | 54 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
71 | KVM_DEV_TYPE_ARM_VGIC_V3, true) == 0) { | 55 | + return false; |
72 | - return 3; | 56 | + } |
73 | - } else if (kvm_create_device(kvm_state, | 57 | + } else if (a->size != MO_32) { |
74 | - KVM_DEV_TYPE_ARM_VGIC_V2, true) == 0) { | 58 | return false; |
75 | - return 2; | ||
76 | - } else { | ||
77 | - return 0; | ||
78 | + val |= KVM_ARM_VGIC_V3; | ||
79 | } | 59 | } |
80 | + if (kvm_create_device(kvm_state, | 60 | - /* TODO: FP16 : size == 1 */ |
81 | + KVM_DEV_TYPE_ARM_VGIC_V2, true) == 0) { | 61 | - return do_2misc(s, a, gen_helper_vfp_negs); |
82 | + val |= KVM_ARM_VGIC_V2; | 62 | + return do_2misc_vec(s, a, gen_VNEG_F); |
83 | + } | ||
84 | + return val; | ||
85 | } | 63 | } |
86 | 64 | ||
87 | int kvm_arm_set_irq(int cpu, int irqtype, int irq, int level) | 65 | static bool trans_VRECPE(DisasContext *s, arg_2misc *a) |
88 | -- | 66 | -- |
89 | 2.20.1 | 67 | 2.20.1 |
90 | 68 | ||
91 | 69 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Convert the Neon floating-point vector comparison ops VCEQ, |
---|---|---|---|
2 | VCGE and VCGT over to using a gvec helper and use this to | ||
3 | implement the fp16 case. | ||
2 | 4 | ||
3 | Allwinner System-on-Chips usually contain a Real Time Clock (RTC) | 5 | (We put the float16_ceq() etc functions above the DO_2OP() |
4 | for non-volatile system date and time keeping. This commit adds a generic | 6 | macro definition because later when we convert the |
5 | Allwinner RTC device that supports the RTC devices found in Allwinner SoC | 7 | compare-against-zero instructions we'll want their |
6 | family sun4i (A10), sun7i (A20) and sun6i and newer (A31, H2+, H3, etc). | 8 | definitions to be visible at that point in the source file.) |
7 | The following RTC functionality and features are implemented: | ||
8 | 9 | ||
9 | * Year-Month-Day read/write | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | * Hour-Minute-Second read/write | 11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
11 | * General Purpose storage | 12 | Message-id: 20200828183354.27913-27-peter.maydell@linaro.org |
13 | --- | ||
14 | target/arm/helper.h | 9 +++++++ | ||
15 | target/arm/vec_helper.c | 44 +++++++++++++++++++++++++++++++++ | ||
16 | target/arm/translate-neon.c.inc | 6 ++--- | ||
17 | 3 files changed, 56 insertions(+), 3 deletions(-) | ||
12 | 18 | ||
13 | The following boards are extended with the RTC device: | 19 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
14 | |||
15 | * Cubieboard (hw/arm/cubieboard.c) | ||
16 | * Orange Pi PC (hw/arm/orangepi.c) | ||
17 | |||
18 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
19 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
20 | Message-id: 20200311221854.30370-13-nieklinnenbank@gmail.com | ||
21 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
22 | --- | ||
23 | hw/rtc/Makefile.objs | 1 + | ||
24 | include/hw/arm/allwinner-a10.h | 2 + | ||
25 | include/hw/arm/allwinner-h3.h | 3 + | ||
26 | include/hw/rtc/allwinner-rtc.h | 134 +++++++++++ | ||
27 | hw/arm/allwinner-a10.c | 8 + | ||
28 | hw/arm/allwinner-h3.c | 9 +- | ||
29 | hw/rtc/allwinner-rtc.c | 411 +++++++++++++++++++++++++++++++++ | ||
30 | hw/rtc/trace-events | 4 + | ||
31 | 8 files changed, 571 insertions(+), 1 deletion(-) | ||
32 | create mode 100644 include/hw/rtc/allwinner-rtc.h | ||
33 | create mode 100644 hw/rtc/allwinner-rtc.c | ||
34 | |||
35 | diff --git a/hw/rtc/Makefile.objs b/hw/rtc/Makefile.objs | ||
36 | index XXXXXXX..XXXXXXX 100644 | 20 | index XXXXXXX..XXXXXXX 100644 |
37 | --- a/hw/rtc/Makefile.objs | 21 | --- a/target/arm/helper.h |
38 | +++ b/hw/rtc/Makefile.objs | 22 | +++ b/target/arm/helper.h |
39 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_MC146818RTC) += mc146818rtc.o | 23 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmul_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
40 | common-obj-$(CONFIG_SUN4V_RTC) += sun4v-rtc.o | 24 | DEF_HELPER_FLAGS_5(gvec_fabd_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
41 | common-obj-$(CONFIG_ASPEED_SOC) += aspeed_rtc.o | 25 | DEF_HELPER_FLAGS_5(gvec_fabd_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
42 | common-obj-$(CONFIG_GOLDFISH_RTC) += goldfish_rtc.o | 26 | |
43 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-rtc.o | 27 | +DEF_HELPER_FLAGS_5(gvec_fceq_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
44 | diff --git a/include/hw/arm/allwinner-a10.h b/include/hw/arm/allwinner-a10.h | 28 | +DEF_HELPER_FLAGS_5(gvec_fceq_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
29 | + | ||
30 | +DEF_HELPER_FLAGS_5(gvec_fcge_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
31 | +DEF_HELPER_FLAGS_5(gvec_fcge_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
32 | + | ||
33 | +DEF_HELPER_FLAGS_5(gvec_fcgt_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
34 | +DEF_HELPER_FLAGS_5(gvec_fcgt_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
35 | + | ||
36 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, | ||
37 | void, ptr, ptr, ptr, ptr, i32) | ||
38 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, | ||
39 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
45 | index XXXXXXX..XXXXXXX 100644 | 40 | index XXXXXXX..XXXXXXX 100644 |
46 | --- a/include/hw/arm/allwinner-a10.h | 41 | --- a/target/arm/vec_helper.c |
47 | +++ b/include/hw/arm/allwinner-a10.h | 42 | +++ b/target/arm/vec_helper.c |
48 | @@ -XXX,XX +XXX,XX @@ | 43 | @@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fcmlad)(void *vd, void *vn, void *vm, |
49 | #include "hw/ide/ahci.h" | 44 | clear_tail(d, opr_sz, simd_maxsz(desc)); |
50 | #include "hw/usb/hcd-ohci.h" | 45 | } |
51 | #include "hw/usb/hcd-ehci.h" | 46 | |
52 | +#include "hw/rtc/allwinner-rtc.h" | ||
53 | |||
54 | #include "target/arm/cpu.h" | ||
55 | |||
56 | @@ -XXX,XX +XXX,XX @@ typedef struct AwA10State { | ||
57 | AwEmacState emac; | ||
58 | AllwinnerAHCIState sata; | ||
59 | AwSdHostState mmc0; | ||
60 | + AwRtcState rtc; | ||
61 | MemoryRegion sram_a; | ||
62 | EHCISysBusState ehci[AW_A10_NUM_USB]; | ||
63 | OHCISysBusState ohci[AW_A10_NUM_USB]; | ||
64 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | ||
65 | index XXXXXXX..XXXXXXX 100644 | ||
66 | --- a/include/hw/arm/allwinner-h3.h | ||
67 | +++ b/include/hw/arm/allwinner-h3.h | ||
68 | @@ -XXX,XX +XXX,XX @@ | ||
69 | #include "hw/misc/allwinner-sid.h" | ||
70 | #include "hw/sd/allwinner-sdhost.h" | ||
71 | #include "hw/net/allwinner-sun8i-emac.h" | ||
72 | +#include "hw/rtc/allwinner-rtc.h" | ||
73 | #include "target/arm/cpu.h" | ||
74 | #include "sysemu/block-backend.h" | ||
75 | |||
76 | @@ -XXX,XX +XXX,XX @@ enum { | ||
77 | AW_H3_GIC_CPU, | ||
78 | AW_H3_GIC_HYP, | ||
79 | AW_H3_GIC_VCPU, | ||
80 | + AW_H3_RTC, | ||
81 | AW_H3_CPUCFG, | ||
82 | AW_H3_SDRAM | ||
83 | }; | ||
84 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
85 | AwSidState sid; | ||
86 | AwSdHostState mmc0; | ||
87 | AwSun8iEmacState emac; | ||
88 | + AwRtcState rtc; | ||
89 | GICState gic; | ||
90 | MemoryRegion sram_a1; | ||
91 | MemoryRegion sram_a2; | ||
92 | diff --git a/include/hw/rtc/allwinner-rtc.h b/include/hw/rtc/allwinner-rtc.h | ||
93 | new file mode 100644 | ||
94 | index XXXXXXX..XXXXXXX | ||
95 | --- /dev/null | ||
96 | +++ b/include/hw/rtc/allwinner-rtc.h | ||
97 | @@ -XXX,XX +XXX,XX @@ | ||
98 | +/* | 47 | +/* |
99 | + * Allwinner Real Time Clock emulation | 48 | + * Floating point comparisons producing an integer result (all 1s or all 0s). |
100 | + * | 49 | + * Note that EQ doesn't signal InvalidOp for QNaNs but GE and GT do. |
101 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | 50 | + * Softfloat routines return 0/1, which we convert to the 0/-1 Neon requires. |
102 | + * | ||
103 | + * This program is free software: you can redistribute it and/or modify | ||
104 | + * it under the terms of the GNU General Public License as published by | ||
105 | + * the Free Software Foundation, either version 2 of the License, or | ||
106 | + * (at your option) any later version. | ||
107 | + * | ||
108 | + * This program is distributed in the hope that it will be useful, | ||
109 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
110 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
111 | + * GNU General Public License for more details. | ||
112 | + * | ||
113 | + * You should have received a copy of the GNU General Public License | ||
114 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
115 | + */ | 51 | + */ |
116 | + | 52 | +static uint16_t float16_ceq(float16 op1, float16 op2, float_status *stat) |
117 | +#ifndef HW_MISC_ALLWINNER_RTC_H | ||
118 | +#define HW_MISC_ALLWINNER_RTC_H | ||
119 | + | ||
120 | +#include "qom/object.h" | ||
121 | +#include "hw/sysbus.h" | ||
122 | + | ||
123 | +/** | ||
124 | + * Constants | ||
125 | + * @{ | ||
126 | + */ | ||
127 | + | ||
128 | +/** Highest register address used by RTC device */ | ||
129 | +#define AW_RTC_REGS_MAXADDR (0x200) | ||
130 | + | ||
131 | +/** Total number of known registers */ | ||
132 | +#define AW_RTC_REGS_NUM (AW_RTC_REGS_MAXADDR / sizeof(uint32_t)) | ||
133 | + | ||
134 | +/** @} */ | ||
135 | + | ||
136 | +/** | ||
137 | + * Object model types | ||
138 | + * @{ | ||
139 | + */ | ||
140 | + | ||
141 | +/** Generic Allwinner RTC device (abstract) */ | ||
142 | +#define TYPE_AW_RTC "allwinner-rtc" | ||
143 | + | ||
144 | +/** Allwinner RTC sun4i family (A10, A12) */ | ||
145 | +#define TYPE_AW_RTC_SUN4I TYPE_AW_RTC "-sun4i" | ||
146 | + | ||
147 | +/** Allwinner RTC sun6i family and newer (A31, H2+, H3, etc) */ | ||
148 | +#define TYPE_AW_RTC_SUN6I TYPE_AW_RTC "-sun6i" | ||
149 | + | ||
150 | +/** Allwinner RTC sun7i family (A20) */ | ||
151 | +#define TYPE_AW_RTC_SUN7I TYPE_AW_RTC "-sun7i" | ||
152 | + | ||
153 | +/** @} */ | ||
154 | + | ||
155 | +/** | ||
156 | + * Object model macros | ||
157 | + * @{ | ||
158 | + */ | ||
159 | + | ||
160 | +#define AW_RTC(obj) \ | ||
161 | + OBJECT_CHECK(AwRtcState, (obj), TYPE_AW_RTC) | ||
162 | +#define AW_RTC_CLASS(klass) \ | ||
163 | + OBJECT_CLASS_CHECK(AwRtcClass, (klass), TYPE_AW_RTC) | ||
164 | +#define AW_RTC_GET_CLASS(obj) \ | ||
165 | + OBJECT_GET_CLASS(AwRtcClass, (obj), TYPE_AW_RTC) | ||
166 | + | ||
167 | +/** @} */ | ||
168 | + | ||
169 | +/** | ||
170 | + * Allwinner RTC per-object instance state. | ||
171 | + */ | ||
172 | +typedef struct AwRtcState { | ||
173 | + /*< private >*/ | ||
174 | + SysBusDevice parent_obj; | ||
175 | + /*< public >*/ | ||
176 | + | ||
177 | + /** | ||
178 | + * Actual year represented by the device when year counter is zero | ||
179 | + * | ||
180 | + * Can be overridden by the user using the corresponding 'base-year' | ||
181 | + * property. The base year used by the target OS driver can vary, for | ||
182 | + * example the Linux driver for sun6i uses 1970 while NetBSD uses 2000. | ||
183 | + */ | ||
184 | + int base_year; | ||
185 | + | ||
186 | + /** Maps I/O registers in physical memory */ | ||
187 | + MemoryRegion iomem; | ||
188 | + | ||
189 | + /** Array of hardware registers */ | ||
190 | + uint32_t regs[AW_RTC_REGS_NUM]; | ||
191 | + | ||
192 | +} AwRtcState; | ||
193 | + | ||
194 | +/** | ||
195 | + * Allwinner RTC class-level struct. | ||
196 | + * | ||
197 | + * This struct is filled by each sunxi device specific code | ||
198 | + * such that the generic code can use this struct to support | ||
199 | + * all devices. | ||
200 | + */ | ||
201 | +typedef struct AwRtcClass { | ||
202 | + /*< private >*/ | ||
203 | + SysBusDeviceClass parent_class; | ||
204 | + /*< public >*/ | ||
205 | + | ||
206 | + /** Defines device specific register map */ | ||
207 | + const uint8_t *regmap; | ||
208 | + | ||
209 | + /** Size of the regmap in bytes */ | ||
210 | + size_t regmap_size; | ||
211 | + | ||
212 | + /** | ||
213 | + * Read device specific register | ||
214 | + * | ||
215 | + * @offset: register offset to read | ||
216 | + * @return true if register read successful, false otherwise | ||
217 | + */ | ||
218 | + bool (*read)(AwRtcState *s, uint32_t offset); | ||
219 | + | ||
220 | + /** | ||
221 | + * Write device specific register | ||
222 | + * | ||
223 | + * @offset: register offset to write | ||
224 | + * @data: value to set in register | ||
225 | + * @return true if register write successful, false otherwise | ||
226 | + */ | ||
227 | + bool (*write)(AwRtcState *s, uint32_t offset, uint32_t data); | ||
228 | + | ||
229 | +} AwRtcClass; | ||
230 | + | ||
231 | +#endif /* HW_MISC_ALLWINNER_RTC_H */ | ||
232 | diff --git a/hw/arm/allwinner-a10.c b/hw/arm/allwinner-a10.c | ||
233 | index XXXXXXX..XXXXXXX 100644 | ||
234 | --- a/hw/arm/allwinner-a10.c | ||
235 | +++ b/hw/arm/allwinner-a10.c | ||
236 | @@ -XXX,XX +XXX,XX @@ | ||
237 | #define AW_A10_EHCI_BASE 0x01c14000 | ||
238 | #define AW_A10_OHCI_BASE 0x01c14400 | ||
239 | #define AW_A10_SATA_BASE 0x01c18000 | ||
240 | +#define AW_A10_RTC_BASE 0x01c20d00 | ||
241 | |||
242 | static void aw_a10_init(Object *obj) | ||
243 | { | ||
244 | @@ -XXX,XX +XXX,XX @@ static void aw_a10_init(Object *obj) | ||
245 | |||
246 | sysbus_init_child_obj(obj, "mmc0", &s->mmc0, sizeof(s->mmc0), | ||
247 | TYPE_AW_SDHOST_SUN4I); | ||
248 | + | ||
249 | + sysbus_init_child_obj(obj, "rtc", &s->rtc, sizeof(s->rtc), | ||
250 | + TYPE_AW_RTC_SUN4I); | ||
251 | } | ||
252 | |||
253 | static void aw_a10_realize(DeviceState *dev, Error **errp) | ||
254 | @@ -XXX,XX +XXX,XX @@ static void aw_a10_realize(DeviceState *dev, Error **errp) | ||
255 | sysbus_connect_irq(SYS_BUS_DEVICE(&s->mmc0), 0, qdev_get_gpio_in(dev, 32)); | ||
256 | object_property_add_alias(OBJECT(s), "sd-bus", OBJECT(&s->mmc0), | ||
257 | "sd-bus", &error_abort); | ||
258 | + | ||
259 | + /* RTC */ | ||
260 | + qdev_init_nofail(DEVICE(&s->rtc)); | ||
261 | + sysbus_mmio_map_overlap(SYS_BUS_DEVICE(&s->rtc), 0, AW_A10_RTC_BASE, 10); | ||
262 | } | ||
263 | |||
264 | static void aw_a10_class_init(ObjectClass *oc, void *data) | ||
265 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
266 | index XXXXXXX..XXXXXXX 100644 | ||
267 | --- a/hw/arm/allwinner-h3.c | ||
268 | +++ b/hw/arm/allwinner-h3.c | ||
269 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
270 | [AW_H3_GIC_CPU] = 0x01c82000, | ||
271 | [AW_H3_GIC_HYP] = 0x01c84000, | ||
272 | [AW_H3_GIC_VCPU] = 0x01c86000, | ||
273 | + [AW_H3_RTC] = 0x01f00000, | ||
274 | [AW_H3_CPUCFG] = 0x01f01c00, | ||
275 | [AW_H3_SDRAM] = 0x40000000 | ||
276 | }; | ||
277 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
278 | { "csi", 0x01cb0000, 320 * KiB }, | ||
279 | { "tve", 0x01e00000, 64 * KiB }, | ||
280 | { "hdmi", 0x01ee0000, 128 * KiB }, | ||
281 | - { "rtc", 0x01f00000, 1 * KiB }, | ||
282 | { "r_timer", 0x01f00800, 1 * KiB }, | ||
283 | { "r_intc", 0x01f00c00, 1 * KiB }, | ||
284 | { "r_wdog", 0x01f01000, 1 * KiB }, | ||
285 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
286 | "ram-addr", &error_abort); | ||
287 | object_property_add_alias(obj, "ram-size", OBJECT(&s->dramc), | ||
288 | "ram-size", &error_abort); | ||
289 | + | ||
290 | + sysbus_init_child_obj(obj, "rtc", &s->rtc, sizeof(s->rtc), | ||
291 | + TYPE_AW_RTC_SUN6I); | ||
292 | } | ||
293 | |||
294 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
295 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
296 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 1, s->memmap[AW_H3_DRAMCTL]); | ||
297 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->dramc), 2, s->memmap[AW_H3_DRAMPHY]); | ||
298 | |||
299 | + /* RTC */ | ||
300 | + qdev_init_nofail(DEVICE(&s->rtc)); | ||
301 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->rtc), 0, s->memmap[AW_H3_RTC]); | ||
302 | + | ||
303 | /* Unimplemented devices */ | ||
304 | for (i = 0; i < ARRAY_SIZE(unimplemented); i++) { | ||
305 | create_unimplemented_device(unimplemented[i].device_name, | ||
306 | diff --git a/hw/rtc/allwinner-rtc.c b/hw/rtc/allwinner-rtc.c | ||
307 | new file mode 100644 | ||
308 | index XXXXXXX..XXXXXXX | ||
309 | --- /dev/null | ||
310 | +++ b/hw/rtc/allwinner-rtc.c | ||
311 | @@ -XXX,XX +XXX,XX @@ | ||
312 | +/* | ||
313 | + * Allwinner Real Time Clock emulation | ||
314 | + * | ||
315 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
316 | + * | ||
317 | + * This program is free software: you can redistribute it and/or modify | ||
318 | + * it under the terms of the GNU General Public License as published by | ||
319 | + * the Free Software Foundation, either version 2 of the License, or | ||
320 | + * (at your option) any later version. | ||
321 | + * | ||
322 | + * This program is distributed in the hope that it will be useful, | ||
323 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
324 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
325 | + * GNU General Public License for more details. | ||
326 | + * | ||
327 | + * You should have received a copy of the GNU General Public License | ||
328 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
329 | + */ | ||
330 | + | ||
331 | +#include "qemu/osdep.h" | ||
332 | +#include "qemu/units.h" | ||
333 | +#include "hw/sysbus.h" | ||
334 | +#include "migration/vmstate.h" | ||
335 | +#include "qemu/log.h" | ||
336 | +#include "qemu/module.h" | ||
337 | +#include "qemu-common.h" | ||
338 | +#include "hw/qdev-properties.h" | ||
339 | +#include "hw/rtc/allwinner-rtc.h" | ||
340 | +#include "trace.h" | ||
341 | + | ||
342 | +/* RTC registers */ | ||
343 | +enum { | ||
344 | + REG_LOSC = 1, /* Low Oscillator Control */ | ||
345 | + REG_YYMMDD, /* RTC Year-Month-Day */ | ||
346 | + REG_HHMMSS, /* RTC Hour-Minute-Second */ | ||
347 | + REG_ALARM1_WKHHMMSS, /* Alarm1 Week Hour-Minute-Second */ | ||
348 | + REG_ALARM1_EN, /* Alarm1 Enable */ | ||
349 | + REG_ALARM1_IRQ_EN, /* Alarm1 IRQ Enable */ | ||
350 | + REG_ALARM1_IRQ_STA, /* Alarm1 IRQ Status */ | ||
351 | + REG_GP0, /* General Purpose Register 0 */ | ||
352 | + REG_GP1, /* General Purpose Register 1 */ | ||
353 | + REG_GP2, /* General Purpose Register 2 */ | ||
354 | + REG_GP3, /* General Purpose Register 3 */ | ||
355 | + | ||
356 | + /* sun4i registers */ | ||
357 | + REG_ALARM1_DDHHMMSS, /* Alarm1 Day Hour-Minute-Second */ | ||
358 | + REG_CPUCFG, /* CPU Configuration Register */ | ||
359 | + | ||
360 | + /* sun6i registers */ | ||
361 | + REG_LOSC_AUTOSTA, /* LOSC Auto Switch Status */ | ||
362 | + REG_INT_OSC_PRE, /* Internal OSC Clock Prescaler */ | ||
363 | + REG_ALARM0_COUNTER, /* Alarm0 Counter */ | ||
364 | + REG_ALARM0_CUR_VLU, /* Alarm0 Counter Current Value */ | ||
365 | + REG_ALARM0_ENABLE, /* Alarm0 Enable */ | ||
366 | + REG_ALARM0_IRQ_EN, /* Alarm0 IRQ Enable */ | ||
367 | + REG_ALARM0_IRQ_STA, /* Alarm0 IRQ Status */ | ||
368 | + REG_ALARM_CONFIG, /* Alarm Config */ | ||
369 | + REG_LOSC_OUT_GATING, /* LOSC Output Gating Register */ | ||
370 | + REG_GP4, /* General Purpose Register 4 */ | ||
371 | + REG_GP5, /* General Purpose Register 5 */ | ||
372 | + REG_GP6, /* General Purpose Register 6 */ | ||
373 | + REG_GP7, /* General Purpose Register 7 */ | ||
374 | + REG_RTC_DBG, /* RTC Debug Register */ | ||
375 | + REG_GPL_HOLD_OUT, /* GPL Hold Output Register */ | ||
376 | + REG_VDD_RTC, /* VDD RTC Regulate Register */ | ||
377 | + REG_IC_CHARA, /* IC Characteristics Register */ | ||
378 | +}; | ||
379 | + | ||
380 | +/* RTC register flags */ | ||
381 | +enum { | ||
382 | + REG_LOSC_YMD = (1 << 7), | ||
383 | + REG_LOSC_HMS = (1 << 8), | ||
384 | +}; | ||
385 | + | ||
386 | +/* RTC sun4i register map (offset to name) */ | ||
387 | +const uint8_t allwinner_rtc_sun4i_regmap[] = { | ||
388 | + [0x0000] = REG_LOSC, | ||
389 | + [0x0004] = REG_YYMMDD, | ||
390 | + [0x0008] = REG_HHMMSS, | ||
391 | + [0x000C] = REG_ALARM1_DDHHMMSS, | ||
392 | + [0x0010] = REG_ALARM1_WKHHMMSS, | ||
393 | + [0x0014] = REG_ALARM1_EN, | ||
394 | + [0x0018] = REG_ALARM1_IRQ_EN, | ||
395 | + [0x001C] = REG_ALARM1_IRQ_STA, | ||
396 | + [0x0020] = REG_GP0, | ||
397 | + [0x0024] = REG_GP1, | ||
398 | + [0x0028] = REG_GP2, | ||
399 | + [0x002C] = REG_GP3, | ||
400 | + [0x003C] = REG_CPUCFG, | ||
401 | +}; | ||
402 | + | ||
403 | +/* RTC sun6i register map (offset to name) */ | ||
404 | +const uint8_t allwinner_rtc_sun6i_regmap[] = { | ||
405 | + [0x0000] = REG_LOSC, | ||
406 | + [0x0004] = REG_LOSC_AUTOSTA, | ||
407 | + [0x0008] = REG_INT_OSC_PRE, | ||
408 | + [0x0010] = REG_YYMMDD, | ||
409 | + [0x0014] = REG_HHMMSS, | ||
410 | + [0x0020] = REG_ALARM0_COUNTER, | ||
411 | + [0x0024] = REG_ALARM0_CUR_VLU, | ||
412 | + [0x0028] = REG_ALARM0_ENABLE, | ||
413 | + [0x002C] = REG_ALARM0_IRQ_EN, | ||
414 | + [0x0030] = REG_ALARM0_IRQ_STA, | ||
415 | + [0x0040] = REG_ALARM1_WKHHMMSS, | ||
416 | + [0x0044] = REG_ALARM1_EN, | ||
417 | + [0x0048] = REG_ALARM1_IRQ_EN, | ||
418 | + [0x004C] = REG_ALARM1_IRQ_STA, | ||
419 | + [0x0050] = REG_ALARM_CONFIG, | ||
420 | + [0x0060] = REG_LOSC_OUT_GATING, | ||
421 | + [0x0100] = REG_GP0, | ||
422 | + [0x0104] = REG_GP1, | ||
423 | + [0x0108] = REG_GP2, | ||
424 | + [0x010C] = REG_GP3, | ||
425 | + [0x0110] = REG_GP4, | ||
426 | + [0x0114] = REG_GP5, | ||
427 | + [0x0118] = REG_GP6, | ||
428 | + [0x011C] = REG_GP7, | ||
429 | + [0x0170] = REG_RTC_DBG, | ||
430 | + [0x0180] = REG_GPL_HOLD_OUT, | ||
431 | + [0x0190] = REG_VDD_RTC, | ||
432 | + [0x01F0] = REG_IC_CHARA, | ||
433 | +}; | ||
434 | + | ||
435 | +static bool allwinner_rtc_sun4i_read(AwRtcState *s, uint32_t offset) | ||
436 | +{ | 53 | +{ |
437 | + /* no sun4i specific registers currently implemented */ | 54 | + return -float16_eq_quiet(op1, op2, stat); |
438 | + return false; | ||
439 | +} | 55 | +} |
440 | + | 56 | + |
441 | +static bool allwinner_rtc_sun4i_write(AwRtcState *s, uint32_t offset, | 57 | +static uint32_t float32_ceq(float32 op1, float32 op2, float_status *stat) |
442 | + uint32_t data) | ||
443 | +{ | 58 | +{ |
444 | + /* no sun4i specific registers currently implemented */ | 59 | + return -float32_eq_quiet(op1, op2, stat); |
445 | + return false; | ||
446 | +} | 60 | +} |
447 | + | 61 | + |
448 | +static bool allwinner_rtc_sun6i_read(AwRtcState *s, uint32_t offset) | 62 | +static uint16_t float16_cge(float16 op1, float16 op2, float_status *stat) |
449 | +{ | 63 | +{ |
450 | + const AwRtcClass *c = AW_RTC_GET_CLASS(s); | 64 | + return -float16_le(op2, op1, stat); |
451 | + | ||
452 | + switch (c->regmap[offset]) { | ||
453 | + case REG_GP4: /* General Purpose Register 4 */ | ||
454 | + case REG_GP5: /* General Purpose Register 5 */ | ||
455 | + case REG_GP6: /* General Purpose Register 6 */ | ||
456 | + case REG_GP7: /* General Purpose Register 7 */ | ||
457 | + return true; | ||
458 | + default: | ||
459 | + break; | ||
460 | + } | ||
461 | + return false; | ||
462 | +} | 65 | +} |
463 | + | 66 | + |
464 | +static bool allwinner_rtc_sun6i_write(AwRtcState *s, uint32_t offset, | 67 | +static uint32_t float32_cge(float32 op1, float32 op2, float_status *stat) |
465 | + uint32_t data) | ||
466 | +{ | 68 | +{ |
467 | + const AwRtcClass *c = AW_RTC_GET_CLASS(s); | 69 | + return -float32_le(op2, op1, stat); |
468 | + | ||
469 | + switch (c->regmap[offset]) { | ||
470 | + case REG_GP4: /* General Purpose Register 4 */ | ||
471 | + case REG_GP5: /* General Purpose Register 5 */ | ||
472 | + case REG_GP6: /* General Purpose Register 6 */ | ||
473 | + case REG_GP7: /* General Purpose Register 7 */ | ||
474 | + return true; | ||
475 | + default: | ||
476 | + break; | ||
477 | + } | ||
478 | + return false; | ||
479 | +} | 70 | +} |
480 | + | 71 | + |
481 | +static uint64_t allwinner_rtc_read(void *opaque, hwaddr offset, | 72 | +static uint16_t float16_cgt(float16 op1, float16 op2, float_status *stat) |
482 | + unsigned size) | ||
483 | +{ | 73 | +{ |
484 | + AwRtcState *s = AW_RTC(opaque); | 74 | + return -float16_lt(op2, op1, stat); |
485 | + const AwRtcClass *c = AW_RTC_GET_CLASS(s); | ||
486 | + uint64_t val = 0; | ||
487 | + | ||
488 | + if (offset >= c->regmap_size) { | ||
489 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
490 | + __func__, (uint32_t)offset); | ||
491 | + return 0; | ||
492 | + } | ||
493 | + | ||
494 | + if (!c->regmap[offset]) { | ||
495 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: invalid register 0x%04x\n", | ||
496 | + __func__, (uint32_t)offset); | ||
497 | + return 0; | ||
498 | + } | ||
499 | + | ||
500 | + switch (c->regmap[offset]) { | ||
501 | + case REG_LOSC: /* Low Oscillator Control */ | ||
502 | + val = s->regs[REG_LOSC]; | ||
503 | + s->regs[REG_LOSC] &= ~(REG_LOSC_YMD | REG_LOSC_HMS); | ||
504 | + break; | ||
505 | + case REG_YYMMDD: /* RTC Year-Month-Day */ | ||
506 | + case REG_HHMMSS: /* RTC Hour-Minute-Second */ | ||
507 | + case REG_GP0: /* General Purpose Register 0 */ | ||
508 | + case REG_GP1: /* General Purpose Register 1 */ | ||
509 | + case REG_GP2: /* General Purpose Register 2 */ | ||
510 | + case REG_GP3: /* General Purpose Register 3 */ | ||
511 | + val = s->regs[c->regmap[offset]]; | ||
512 | + break; | ||
513 | + default: | ||
514 | + if (!c->read(s, offset)) { | ||
515 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented register 0x%04x\n", | ||
516 | + __func__, (uint32_t)offset); | ||
517 | + } | ||
518 | + val = s->regs[c->regmap[offset]]; | ||
519 | + break; | ||
520 | + } | ||
521 | + | ||
522 | + trace_allwinner_rtc_read(offset, val); | ||
523 | + return val; | ||
524 | +} | 75 | +} |
525 | + | 76 | + |
526 | +static void allwinner_rtc_write(void *opaque, hwaddr offset, | 77 | +static uint32_t float32_cgt(float32 op1, float32 op2, float_status *stat) |
527 | + uint64_t val, unsigned size) | ||
528 | +{ | 78 | +{ |
529 | + AwRtcState *s = AW_RTC(opaque); | 79 | + return -float32_lt(op2, op1, stat); |
530 | + const AwRtcClass *c = AW_RTC_GET_CLASS(s); | ||
531 | + | ||
532 | + if (offset >= c->regmap_size) { | ||
533 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
534 | + __func__, (uint32_t)offset); | ||
535 | + return; | ||
536 | + } | ||
537 | + | ||
538 | + if (!c->regmap[offset]) { | ||
539 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: invalid register 0x%04x\n", | ||
540 | + __func__, (uint32_t)offset); | ||
541 | + return; | ||
542 | + } | ||
543 | + | ||
544 | + trace_allwinner_rtc_write(offset, val); | ||
545 | + | ||
546 | + switch (c->regmap[offset]) { | ||
547 | + case REG_YYMMDD: /* RTC Year-Month-Day */ | ||
548 | + s->regs[REG_YYMMDD] = val; | ||
549 | + s->regs[REG_LOSC] |= REG_LOSC_YMD; | ||
550 | + break; | ||
551 | + case REG_HHMMSS: /* RTC Hour-Minute-Second */ | ||
552 | + s->regs[REG_HHMMSS] = val; | ||
553 | + s->regs[REG_LOSC] |= REG_LOSC_HMS; | ||
554 | + break; | ||
555 | + case REG_GP0: /* General Purpose Register 0 */ | ||
556 | + case REG_GP1: /* General Purpose Register 1 */ | ||
557 | + case REG_GP2: /* General Purpose Register 2 */ | ||
558 | + case REG_GP3: /* General Purpose Register 3 */ | ||
559 | + s->regs[c->regmap[offset]] = val; | ||
560 | + break; | ||
561 | + default: | ||
562 | + if (!c->write(s, offset, val)) { | ||
563 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented register 0x%04x\n", | ||
564 | + __func__, (uint32_t)offset); | ||
565 | + } | ||
566 | + break; | ||
567 | + } | ||
568 | +} | 80 | +} |
569 | + | 81 | + |
570 | +static const MemoryRegionOps allwinner_rtc_ops = { | 82 | #define DO_2OP(NAME, FUNC, TYPE) \ |
571 | + .read = allwinner_rtc_read, | 83 | void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ |
572 | + .write = allwinner_rtc_write, | 84 | { \ |
573 | + .endianness = DEVICE_NATIVE_ENDIAN, | 85 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_ftsmul_d, float64_ftsmul, float64) |
574 | + .valid = { | 86 | DO_3OP(gvec_fabd_h, float16_abd, float16) |
575 | + .min_access_size = 4, | 87 | DO_3OP(gvec_fabd_s, float32_abd, float32) |
576 | + .max_access_size = 4, | 88 | |
577 | + }, | 89 | +DO_3OP(gvec_fceq_h, float16_ceq, float16) |
578 | + .impl.min_access_size = 4, | 90 | +DO_3OP(gvec_fceq_s, float32_ceq, float32) |
579 | +}; | ||
580 | + | 91 | + |
581 | +static void allwinner_rtc_reset(DeviceState *dev) | 92 | +DO_3OP(gvec_fcge_h, float16_cge, float16) |
582 | +{ | 93 | +DO_3OP(gvec_fcge_s, float32_cge, float32) |
583 | + AwRtcState *s = AW_RTC(dev); | ||
584 | + struct tm now; | ||
585 | + | 94 | + |
586 | + /* Clear registers */ | 95 | +DO_3OP(gvec_fcgt_h, float16_cgt, float16) |
587 | + memset(s->regs, 0, sizeof(s->regs)); | 96 | +DO_3OP(gvec_fcgt_s, float32_cgt, float32) |
588 | + | 97 | + |
589 | + /* Get current datetime */ | 98 | #ifdef TARGET_AARCH64 |
590 | + qemu_get_timedate(&now, 0); | 99 | |
591 | + | 100 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) |
592 | + /* Set RTC with current datetime */ | 101 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
593 | + if (s->base_year > 1900) { | ||
594 | + s->regs[REG_YYMMDD] = ((now.tm_year + 1900 - s->base_year) << 16) | | ||
595 | + ((now.tm_mon + 1) << 8) | | ||
596 | + now.tm_mday; | ||
597 | + s->regs[REG_HHMMSS] = (((now.tm_wday + 6) % 7) << 29) | | ||
598 | + (now.tm_hour << 16) | | ||
599 | + (now.tm_min << 8) | | ||
600 | + now.tm_sec; | ||
601 | + } | ||
602 | +} | ||
603 | + | ||
604 | +static void allwinner_rtc_init(Object *obj) | ||
605 | +{ | ||
606 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
607 | + AwRtcState *s = AW_RTC(obj); | ||
608 | + | ||
609 | + /* Memory mapping */ | ||
610 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_rtc_ops, s, | ||
611 | + TYPE_AW_RTC, 1 * KiB); | ||
612 | + sysbus_init_mmio(sbd, &s->iomem); | ||
613 | +} | ||
614 | + | ||
615 | +static const VMStateDescription allwinner_rtc_vmstate = { | ||
616 | + .name = "allwinner-rtc", | ||
617 | + .version_id = 1, | ||
618 | + .minimum_version_id = 1, | ||
619 | + .fields = (VMStateField[]) { | ||
620 | + VMSTATE_UINT32_ARRAY(regs, AwRtcState, AW_RTC_REGS_NUM), | ||
621 | + VMSTATE_END_OF_LIST() | ||
622 | + } | ||
623 | +}; | ||
624 | + | ||
625 | +static Property allwinner_rtc_properties[] = { | ||
626 | + DEFINE_PROP_INT32("base-year", AwRtcState, base_year, 0), | ||
627 | + DEFINE_PROP_END_OF_LIST(), | ||
628 | +}; | ||
629 | + | ||
630 | +static void allwinner_rtc_class_init(ObjectClass *klass, void *data) | ||
631 | +{ | ||
632 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
633 | + | ||
634 | + dc->reset = allwinner_rtc_reset; | ||
635 | + dc->vmsd = &allwinner_rtc_vmstate; | ||
636 | + device_class_set_props(dc, allwinner_rtc_properties); | ||
637 | +} | ||
638 | + | ||
639 | +static void allwinner_rtc_sun4i_init(Object *obj) | ||
640 | +{ | ||
641 | + AwRtcState *s = AW_RTC(obj); | ||
642 | + s->base_year = 2010; | ||
643 | +} | ||
644 | + | ||
645 | +static void allwinner_rtc_sun4i_class_init(ObjectClass *klass, void *data) | ||
646 | +{ | ||
647 | + AwRtcClass *arc = AW_RTC_CLASS(klass); | ||
648 | + | ||
649 | + arc->regmap = allwinner_rtc_sun4i_regmap; | ||
650 | + arc->regmap_size = sizeof(allwinner_rtc_sun4i_regmap); | ||
651 | + arc->read = allwinner_rtc_sun4i_read; | ||
652 | + arc->write = allwinner_rtc_sun4i_write; | ||
653 | +} | ||
654 | + | ||
655 | +static void allwinner_rtc_sun6i_init(Object *obj) | ||
656 | +{ | ||
657 | + AwRtcState *s = AW_RTC(obj); | ||
658 | + s->base_year = 1970; | ||
659 | +} | ||
660 | + | ||
661 | +static void allwinner_rtc_sun6i_class_init(ObjectClass *klass, void *data) | ||
662 | +{ | ||
663 | + AwRtcClass *arc = AW_RTC_CLASS(klass); | ||
664 | + | ||
665 | + arc->regmap = allwinner_rtc_sun6i_regmap; | ||
666 | + arc->regmap_size = sizeof(allwinner_rtc_sun6i_regmap); | ||
667 | + arc->read = allwinner_rtc_sun6i_read; | ||
668 | + arc->write = allwinner_rtc_sun6i_write; | ||
669 | +} | ||
670 | + | ||
671 | +static void allwinner_rtc_sun7i_init(Object *obj) | ||
672 | +{ | ||
673 | + AwRtcState *s = AW_RTC(obj); | ||
674 | + s->base_year = 1970; | ||
675 | +} | ||
676 | + | ||
677 | +static void allwinner_rtc_sun7i_class_init(ObjectClass *klass, void *data) | ||
678 | +{ | ||
679 | + AwRtcClass *arc = AW_RTC_CLASS(klass); | ||
680 | + allwinner_rtc_sun4i_class_init(klass, arc); | ||
681 | +} | ||
682 | + | ||
683 | +static const TypeInfo allwinner_rtc_info = { | ||
684 | + .name = TYPE_AW_RTC, | ||
685 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
686 | + .instance_init = allwinner_rtc_init, | ||
687 | + .instance_size = sizeof(AwRtcState), | ||
688 | + .class_init = allwinner_rtc_class_init, | ||
689 | + .class_size = sizeof(AwRtcClass), | ||
690 | + .abstract = true, | ||
691 | +}; | ||
692 | + | ||
693 | +static const TypeInfo allwinner_rtc_sun4i_info = { | ||
694 | + .name = TYPE_AW_RTC_SUN4I, | ||
695 | + .parent = TYPE_AW_RTC, | ||
696 | + .class_init = allwinner_rtc_sun4i_class_init, | ||
697 | + .instance_init = allwinner_rtc_sun4i_init, | ||
698 | +}; | ||
699 | + | ||
700 | +static const TypeInfo allwinner_rtc_sun6i_info = { | ||
701 | + .name = TYPE_AW_RTC_SUN6I, | ||
702 | + .parent = TYPE_AW_RTC, | ||
703 | + .class_init = allwinner_rtc_sun6i_class_init, | ||
704 | + .instance_init = allwinner_rtc_sun6i_init, | ||
705 | +}; | ||
706 | + | ||
707 | +static const TypeInfo allwinner_rtc_sun7i_info = { | ||
708 | + .name = TYPE_AW_RTC_SUN7I, | ||
709 | + .parent = TYPE_AW_RTC, | ||
710 | + .class_init = allwinner_rtc_sun7i_class_init, | ||
711 | + .instance_init = allwinner_rtc_sun7i_init, | ||
712 | +}; | ||
713 | + | ||
714 | +static void allwinner_rtc_register(void) | ||
715 | +{ | ||
716 | + type_register_static(&allwinner_rtc_info); | ||
717 | + type_register_static(&allwinner_rtc_sun4i_info); | ||
718 | + type_register_static(&allwinner_rtc_sun6i_info); | ||
719 | + type_register_static(&allwinner_rtc_sun7i_info); | ||
720 | +} | ||
721 | + | ||
722 | +type_init(allwinner_rtc_register) | ||
723 | diff --git a/hw/rtc/trace-events b/hw/rtc/trace-events | ||
724 | index XXXXXXX..XXXXXXX 100644 | 102 | index XXXXXXX..XXXXXXX 100644 |
725 | --- a/hw/rtc/trace-events | 103 | --- a/target/arm/translate-neon.c.inc |
726 | +++ b/hw/rtc/trace-events | 104 | +++ b/target/arm/translate-neon.c.inc |
727 | @@ -XXX,XX +XXX,XX @@ | 105 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VADD, gen_helper_gvec_fadd_s, gen_helper_gvec_fadd_h) |
728 | # See docs/devel/tracing.txt for syntax documentation. | 106 | DO_3S_FP_GVEC(VSUB, gen_helper_gvec_fsub_s, gen_helper_gvec_fsub_h) |
729 | 107 | DO_3S_FP_GVEC(VABD, gen_helper_gvec_fabd_s, gen_helper_gvec_fabd_h) | |
730 | +# allwinner-rtc.c | 108 | DO_3S_FP_GVEC(VMUL, gen_helper_gvec_fmul_s, gen_helper_gvec_fmul_h) |
731 | +allwinner_rtc_read(uint64_t addr, uint64_t value) "addr 0x%" PRIx64 " value 0x%" PRIx64 | 109 | +DO_3S_FP_GVEC(VCEQ, gen_helper_gvec_fceq_s, gen_helper_gvec_fceq_h) |
732 | +allwinner_rtc_write(uint64_t addr, uint64_t value) "addr 0x%" PRIx64 " value 0x%" PRIx64 | 110 | +DO_3S_FP_GVEC(VCGE, gen_helper_gvec_fcge_s, gen_helper_gvec_fcge_h) |
733 | + | 111 | +DO_3S_FP_GVEC(VCGT, gen_helper_gvec_fcgt_s, gen_helper_gvec_fcgt_h) |
734 | # sun4v-rtc.c | 112 | |
735 | sun4v_rtc_read(uint64_t addr, uint64_t value) "read: addr 0x%" PRIx64 " value 0x%" PRIx64 | 113 | /* |
736 | sun4v_rtc_write(uint64_t addr, uint64_t value) "write: addr 0x%" PRIx64 " value 0x%" PRIx64 | 114 | * For all the functions using this macro, size == 1 means fp16, |
115 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VMUL, gen_helper_gvec_fmul_s, gen_helper_gvec_fmul_h) | ||
116 | return do_3same_fp(s, a, FUNC, READS_VD); \ | ||
117 | } | ||
118 | |||
119 | -DO_3S_FP(VCEQ, gen_helper_neon_ceq_f32, false) | ||
120 | -DO_3S_FP(VCGE, gen_helper_neon_cge_f32, false) | ||
121 | -DO_3S_FP(VCGT, gen_helper_neon_cgt_f32, false) | ||
122 | DO_3S_FP(VACGE, gen_helper_neon_acge_f32, false) | ||
123 | DO_3S_FP(VACGT, gen_helper_neon_acgt_f32, false) | ||
124 | DO_3S_FP(VMAX, gen_helper_vfp_maxs, false) | ||
737 | -- | 125 | -- |
738 | 2.20.1 | 126 | 2.20.1 |
739 | 127 | ||
740 | 128 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Convert the neon floating-point vector absolute comparison ops |
---|---|---|---|
2 | VACGE and VACGT over to using a gvec hepler and use this to | ||
3 | implement the fp16 case. | ||
2 | 4 | ||
3 | The Allwinner System on Chip families sun4i and above contain | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | an integrated storage controller for Secure Digital (SD) and | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Multi Media Card (MMC) interfaces. This commit adds support | 7 | Message-id: 20200828183354.27913-28-peter.maydell@linaro.org |
6 | for the Allwinner SD/MMC storage controller with the following | 8 | --- |
7 | emulated features: | 9 | target/arm/helper.h | 6 ++++++ |
10 | target/arm/vec_helper.c | 26 ++++++++++++++++++++++++++ | ||
11 | target/arm/translate-neon.c.inc | 4 ++-- | ||
12 | 3 files changed, 34 insertions(+), 2 deletions(-) | ||
8 | 13 | ||
9 | * DMA transfers | 14 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
10 | * Direct FIFO I/O | ||
11 | * Short/Long format command responses | ||
12 | * Auto-Stop command (CMD12) | ||
13 | * Insert & remove card detection | ||
14 | |||
15 | The following boards are extended with the SD host controller: | ||
16 | |||
17 | * Cubieboard (hw/arm/cubieboard.c) | ||
18 | * Orange Pi PC (hw/arm/orangepi.c) | ||
19 | |||
20 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
21 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
22 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
23 | Message-id: 20200311221854.30370-9-nieklinnenbank@gmail.com | ||
24 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
25 | --- | ||
26 | hw/sd/Makefile.objs | 1 + | ||
27 | include/hw/arm/allwinner-a10.h | 2 + | ||
28 | include/hw/arm/allwinner-h3.h | 3 + | ||
29 | include/hw/sd/allwinner-sdhost.h | 135 +++++ | ||
30 | hw/arm/allwinner-a10.c | 11 + | ||
31 | hw/arm/allwinner-h3.c | 15 +- | ||
32 | hw/arm/cubieboard.c | 15 + | ||
33 | hw/arm/orangepi.c | 16 + | ||
34 | hw/sd/allwinner-sdhost.c | 854 +++++++++++++++++++++++++++++++ | ||
35 | hw/arm/Kconfig | 1 + | ||
36 | hw/sd/trace-events | 7 + | ||
37 | 11 files changed, 1059 insertions(+), 1 deletion(-) | ||
38 | create mode 100644 include/hw/sd/allwinner-sdhost.h | ||
39 | create mode 100644 hw/sd/allwinner-sdhost.c | ||
40 | |||
41 | diff --git a/hw/sd/Makefile.objs b/hw/sd/Makefile.objs | ||
42 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
43 | --- a/hw/sd/Makefile.objs | 16 | --- a/target/arm/helper.h |
44 | +++ b/hw/sd/Makefile.objs | 17 | +++ b/target/arm/helper.h |
45 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_SD) += sd.o core.o sdmmc-internal.o | 18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fcge_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
46 | common-obj-$(CONFIG_SDHCI) += sdhci.o | 19 | DEF_HELPER_FLAGS_5(gvec_fcgt_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
47 | common-obj-$(CONFIG_SDHCI_PCI) += sdhci-pci.o | 20 | DEF_HELPER_FLAGS_5(gvec_fcgt_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
48 | 21 | ||
49 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-sdhost.o | 22 | +DEF_HELPER_FLAGS_5(gvec_facge_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
50 | common-obj-$(CONFIG_MILKYMIST) += milkymist-memcard.o | 23 | +DEF_HELPER_FLAGS_5(gvec_facge_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
51 | common-obj-$(CONFIG_OMAP) += omap_mmc.o | 24 | + |
52 | common-obj-$(CONFIG_PXA2XX) += pxa2xx_mmci.o | 25 | +DEF_HELPER_FLAGS_5(gvec_facgt_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
53 | diff --git a/include/hw/arm/allwinner-a10.h b/include/hw/arm/allwinner-a10.h | 26 | +DEF_HELPER_FLAGS_5(gvec_facgt_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
27 | + | ||
28 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, | ||
29 | void, ptr, ptr, ptr, ptr, i32) | ||
30 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, | ||
31 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
54 | index XXXXXXX..XXXXXXX 100644 | 32 | index XXXXXXX..XXXXXXX 100644 |
55 | --- a/include/hw/arm/allwinner-a10.h | 33 | --- a/target/arm/vec_helper.c |
56 | +++ b/include/hw/arm/allwinner-a10.h | 34 | +++ b/target/arm/vec_helper.c |
57 | @@ -XXX,XX +XXX,XX @@ | 35 | @@ -XXX,XX +XXX,XX @@ static uint32_t float32_cgt(float32 op1, float32 op2, float_status *stat) |
58 | #include "hw/timer/allwinner-a10-pit.h" | 36 | return -float32_lt(op2, op1, stat); |
59 | #include "hw/intc/allwinner-a10-pic.h" | ||
60 | #include "hw/net/allwinner_emac.h" | ||
61 | +#include "hw/sd/allwinner-sdhost.h" | ||
62 | #include "hw/ide/ahci.h" | ||
63 | #include "hw/usb/hcd-ohci.h" | ||
64 | #include "hw/usb/hcd-ehci.h" | ||
65 | @@ -XXX,XX +XXX,XX @@ typedef struct AwA10State { | ||
66 | AwA10PICState intc; | ||
67 | AwEmacState emac; | ||
68 | AllwinnerAHCIState sata; | ||
69 | + AwSdHostState mmc0; | ||
70 | MemoryRegion sram_a; | ||
71 | EHCISysBusState ehci[AW_A10_NUM_USB]; | ||
72 | OHCISysBusState ohci[AW_A10_NUM_USB]; | ||
73 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | ||
74 | index XXXXXXX..XXXXXXX 100644 | ||
75 | --- a/include/hw/arm/allwinner-h3.h | ||
76 | +++ b/include/hw/arm/allwinner-h3.h | ||
77 | @@ -XXX,XX +XXX,XX @@ | ||
78 | #include "hw/misc/allwinner-cpucfg.h" | ||
79 | #include "hw/misc/allwinner-h3-sysctrl.h" | ||
80 | #include "hw/misc/allwinner-sid.h" | ||
81 | +#include "hw/sd/allwinner-sdhost.h" | ||
82 | #include "target/arm/cpu.h" | ||
83 | |||
84 | /** | ||
85 | @@ -XXX,XX +XXX,XX @@ enum { | ||
86 | AW_H3_SRAM_A2, | ||
87 | AW_H3_SRAM_C, | ||
88 | AW_H3_SYSCTRL, | ||
89 | + AW_H3_MMC0, | ||
90 | AW_H3_SID, | ||
91 | AW_H3_EHCI0, | ||
92 | AW_H3_OHCI0, | ||
93 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
94 | AwCpuCfgState cpucfg; | ||
95 | AwH3SysCtrlState sysctrl; | ||
96 | AwSidState sid; | ||
97 | + AwSdHostState mmc0; | ||
98 | GICState gic; | ||
99 | MemoryRegion sram_a1; | ||
100 | MemoryRegion sram_a2; | ||
101 | diff --git a/include/hw/sd/allwinner-sdhost.h b/include/hw/sd/allwinner-sdhost.h | ||
102 | new file mode 100644 | ||
103 | index XXXXXXX..XXXXXXX | ||
104 | --- /dev/null | ||
105 | +++ b/include/hw/sd/allwinner-sdhost.h | ||
106 | @@ -XXX,XX +XXX,XX @@ | ||
107 | +/* | ||
108 | + * Allwinner (sun4i and above) SD Host Controller emulation | ||
109 | + * | ||
110 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
111 | + * | ||
112 | + * This program is free software: you can redistribute it and/or modify | ||
113 | + * it under the terms of the GNU General Public License as published by | ||
114 | + * the Free Software Foundation, either version 2 of the License, or | ||
115 | + * (at your option) any later version. | ||
116 | + * | ||
117 | + * This program is distributed in the hope that it will be useful, | ||
118 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
119 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
120 | + * GNU General Public License for more details. | ||
121 | + * | ||
122 | + * You should have received a copy of the GNU General Public License | ||
123 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
124 | + */ | ||
125 | + | ||
126 | +#ifndef HW_SD_ALLWINNER_SDHOST_H | ||
127 | +#define HW_SD_ALLWINNER_SDHOST_H | ||
128 | + | ||
129 | +#include "qom/object.h" | ||
130 | +#include "hw/sysbus.h" | ||
131 | +#include "hw/sd/sd.h" | ||
132 | + | ||
133 | +/** | ||
134 | + * Object model types | ||
135 | + * @{ | ||
136 | + */ | ||
137 | + | ||
138 | +/** Generic Allwinner SD Host Controller (abstract) */ | ||
139 | +#define TYPE_AW_SDHOST "allwinner-sdhost" | ||
140 | + | ||
141 | +/** Allwinner sun4i family (A10, A12) */ | ||
142 | +#define TYPE_AW_SDHOST_SUN4I TYPE_AW_SDHOST "-sun4i" | ||
143 | + | ||
144 | +/** Allwinner sun5i family and newer (A13, H2+, H3, etc) */ | ||
145 | +#define TYPE_AW_SDHOST_SUN5I TYPE_AW_SDHOST "-sun5i" | ||
146 | + | ||
147 | +/** @} */ | ||
148 | + | ||
149 | +/** | ||
150 | + * Object model macros | ||
151 | + * @{ | ||
152 | + */ | ||
153 | + | ||
154 | +#define AW_SDHOST(obj) \ | ||
155 | + OBJECT_CHECK(AwSdHostState, (obj), TYPE_AW_SDHOST) | ||
156 | +#define AW_SDHOST_CLASS(klass) \ | ||
157 | + OBJECT_CLASS_CHECK(AwSdHostClass, (klass), TYPE_AW_SDHOST) | ||
158 | +#define AW_SDHOST_GET_CLASS(obj) \ | ||
159 | + OBJECT_GET_CLASS(AwSdHostClass, (obj), TYPE_AW_SDHOST) | ||
160 | + | ||
161 | +/** @} */ | ||
162 | + | ||
163 | +/** | ||
164 | + * Allwinner SD Host Controller object instance state. | ||
165 | + */ | ||
166 | +typedef struct AwSdHostState { | ||
167 | + /*< private >*/ | ||
168 | + SysBusDevice busdev; | ||
169 | + /*< public >*/ | ||
170 | + | ||
171 | + /** Secure Digital (SD) bus, which connects to SD card (if present) */ | ||
172 | + SDBus sdbus; | ||
173 | + | ||
174 | + /** Maps I/O registers in physical memory */ | ||
175 | + MemoryRegion iomem; | ||
176 | + | ||
177 | + /** Interrupt output signal to notify CPU */ | ||
178 | + qemu_irq irq; | ||
179 | + | ||
180 | + /** Number of bytes left in current DMA transfer */ | ||
181 | + uint32_t transfer_cnt; | ||
182 | + | ||
183 | + /** | ||
184 | + * @name Hardware Registers | ||
185 | + * @{ | ||
186 | + */ | ||
187 | + | ||
188 | + uint32_t global_ctl; /**< Global Control */ | ||
189 | + uint32_t clock_ctl; /**< Clock Control */ | ||
190 | + uint32_t timeout; /**< Timeout */ | ||
191 | + uint32_t bus_width; /**< Bus Width */ | ||
192 | + uint32_t block_size; /**< Block Size */ | ||
193 | + uint32_t byte_count; /**< Byte Count */ | ||
194 | + | ||
195 | + uint32_t command; /**< Command */ | ||
196 | + uint32_t command_arg; /**< Command Argument */ | ||
197 | + uint32_t response[4]; /**< Command Response */ | ||
198 | + | ||
199 | + uint32_t irq_mask; /**< Interrupt Mask */ | ||
200 | + uint32_t irq_status; /**< Raw Interrupt Status */ | ||
201 | + uint32_t status; /**< Status */ | ||
202 | + | ||
203 | + uint32_t fifo_wlevel; /**< FIFO Water Level */ | ||
204 | + uint32_t fifo_func_sel; /**< FIFO Function Select */ | ||
205 | + uint32_t debug_enable; /**< Debug Enable */ | ||
206 | + uint32_t auto12_arg; /**< Auto Command 12 Argument */ | ||
207 | + uint32_t newtiming_set; /**< SD New Timing Set */ | ||
208 | + uint32_t newtiming_debug; /**< SD New Timing Debug */ | ||
209 | + uint32_t hardware_rst; /**< Hardware Reset */ | ||
210 | + uint32_t dmac; /**< Internal DMA Controller Control */ | ||
211 | + uint32_t desc_base; /**< Descriptor List Base Address */ | ||
212 | + uint32_t dmac_status; /**< Internal DMA Controller Status */ | ||
213 | + uint32_t dmac_irq; /**< Internal DMA Controller IRQ Enable */ | ||
214 | + uint32_t card_threshold; /**< Card Threshold Control */ | ||
215 | + uint32_t startbit_detect; /**< eMMC DDR Start Bit Detection Control */ | ||
216 | + uint32_t response_crc; /**< Response CRC */ | ||
217 | + uint32_t data_crc[8]; /**< Data CRC */ | ||
218 | + uint32_t status_crc; /**< Status CRC */ | ||
219 | + | ||
220 | + /** @} */ | ||
221 | + | ||
222 | +} AwSdHostState; | ||
223 | + | ||
224 | +/** | ||
225 | + * Allwinner SD Host Controller class-level struct. | ||
226 | + * | ||
227 | + * This struct is filled by each sunxi device specific code | ||
228 | + * such that the generic code can use this struct to support | ||
229 | + * all devices. | ||
230 | + */ | ||
231 | +typedef struct AwSdHostClass { | ||
232 | + /*< private >*/ | ||
233 | + SysBusDeviceClass parent_class; | ||
234 | + /*< public >*/ | ||
235 | + | ||
236 | + /** Maximum buffer size in bytes per DMA descriptor */ | ||
237 | + size_t max_desc_size; | ||
238 | + | ||
239 | +} AwSdHostClass; | ||
240 | + | ||
241 | +#endif /* HW_SD_ALLWINNER_SDHOST_H */ | ||
242 | diff --git a/hw/arm/allwinner-a10.c b/hw/arm/allwinner-a10.c | ||
243 | index XXXXXXX..XXXXXXX 100644 | ||
244 | --- a/hw/arm/allwinner-a10.c | ||
245 | +++ b/hw/arm/allwinner-a10.c | ||
246 | @@ -XXX,XX +XXX,XX @@ | ||
247 | #include "hw/boards.h" | ||
248 | #include "hw/usb/hcd-ohci.h" | ||
249 | |||
250 | +#define AW_A10_MMC0_BASE 0x01c0f000 | ||
251 | #define AW_A10_PIC_REG_BASE 0x01c20400 | ||
252 | #define AW_A10_PIT_REG_BASE 0x01c20c00 | ||
253 | #define AW_A10_UART0_REG_BASE 0x01c28000 | ||
254 | @@ -XXX,XX +XXX,XX @@ static void aw_a10_init(Object *obj) | ||
255 | sizeof(s->ohci[i]), TYPE_SYSBUS_OHCI); | ||
256 | } | ||
257 | } | ||
258 | + | ||
259 | + sysbus_init_child_obj(obj, "mmc0", &s->mmc0, sizeof(s->mmc0), | ||
260 | + TYPE_AW_SDHOST_SUN4I); | ||
261 | } | 37 | } |
262 | 38 | ||
263 | static void aw_a10_realize(DeviceState *dev, Error **errp) | 39 | +static uint16_t float16_acge(float16 op1, float16 op2, float_status *stat) |
264 | @@ -XXX,XX +XXX,XX @@ static void aw_a10_realize(DeviceState *dev, Error **errp) | ||
265 | qdev_get_gpio_in(dev, 64 + i)); | ||
266 | } | ||
267 | } | ||
268 | + | ||
269 | + /* SD/MMC */ | ||
270 | + qdev_init_nofail(DEVICE(&s->mmc0)); | ||
271 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->mmc0), 0, AW_A10_MMC0_BASE); | ||
272 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->mmc0), 0, qdev_get_gpio_in(dev, 32)); | ||
273 | + object_property_add_alias(OBJECT(s), "sd-bus", OBJECT(&s->mmc0), | ||
274 | + "sd-bus", &error_abort); | ||
275 | } | ||
276 | |||
277 | static void aw_a10_class_init(ObjectClass *oc, void *data) | ||
278 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
279 | index XXXXXXX..XXXXXXX 100644 | ||
280 | --- a/hw/arm/allwinner-h3.c | ||
281 | +++ b/hw/arm/allwinner-h3.c | ||
282 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
283 | [AW_H3_SRAM_A2] = 0x00044000, | ||
284 | [AW_H3_SRAM_C] = 0x00010000, | ||
285 | [AW_H3_SYSCTRL] = 0x01c00000, | ||
286 | + [AW_H3_MMC0] = 0x01c0f000, | ||
287 | [AW_H3_SID] = 0x01c14000, | ||
288 | [AW_H3_EHCI0] = 0x01c1a000, | ||
289 | [AW_H3_OHCI0] = 0x01c1a400, | ||
290 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
291 | { "lcd0", 0x01c0c000, 4 * KiB }, | ||
292 | { "lcd1", 0x01c0d000, 4 * KiB }, | ||
293 | { "ve", 0x01c0e000, 4 * KiB }, | ||
294 | - { "mmc0", 0x01c0f000, 4 * KiB }, | ||
295 | { "mmc1", 0x01c10000, 4 * KiB }, | ||
296 | { "mmc2", 0x01c11000, 4 * KiB }, | ||
297 | { "crypto", 0x01c15000, 4 * KiB }, | ||
298 | @@ -XXX,XX +XXX,XX @@ enum { | ||
299 | AW_H3_GIC_SPI_UART3 = 3, | ||
300 | AW_H3_GIC_SPI_TIMER0 = 18, | ||
301 | AW_H3_GIC_SPI_TIMER1 = 19, | ||
302 | + AW_H3_GIC_SPI_MMC0 = 60, | ||
303 | AW_H3_GIC_SPI_EHCI0 = 72, | ||
304 | AW_H3_GIC_SPI_OHCI0 = 73, | ||
305 | AW_H3_GIC_SPI_EHCI1 = 74, | ||
306 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
307 | TYPE_AW_SID); | ||
308 | object_property_add_alias(obj, "identifier", OBJECT(&s->sid), | ||
309 | "identifier", &error_abort); | ||
310 | + | ||
311 | + sysbus_init_child_obj(obj, "mmc0", &s->mmc0, sizeof(s->mmc0), | ||
312 | + TYPE_AW_SDHOST_SUN5I); | ||
313 | } | ||
314 | |||
315 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
316 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
317 | qdev_init_nofail(DEVICE(&s->sid)); | ||
318 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->sid), 0, s->memmap[AW_H3_SID]); | ||
319 | |||
320 | + /* SD/MMC */ | ||
321 | + qdev_init_nofail(DEVICE(&s->mmc0)); | ||
322 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->mmc0), 0, s->memmap[AW_H3_MMC0]); | ||
323 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->mmc0), 0, | ||
324 | + qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_MMC0)); | ||
325 | + | ||
326 | + object_property_add_alias(OBJECT(s), "sd-bus", OBJECT(&s->mmc0), | ||
327 | + "sd-bus", &error_abort); | ||
328 | + | ||
329 | /* Universal Serial Bus */ | ||
330 | sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
331 | qdev_get_gpio_in(DEVICE(&s->gic), | ||
332 | diff --git a/hw/arm/cubieboard.c b/hw/arm/cubieboard.c | ||
333 | index XXXXXXX..XXXXXXX 100644 | ||
334 | --- a/hw/arm/cubieboard.c | ||
335 | +++ b/hw/arm/cubieboard.c | ||
336 | @@ -XXX,XX +XXX,XX @@ | ||
337 | #include "sysemu/sysemu.h" | ||
338 | #include "hw/sysbus.h" | ||
339 | #include "hw/boards.h" | ||
340 | +#include "hw/qdev-properties.h" | ||
341 | #include "hw/arm/allwinner-a10.h" | ||
342 | |||
343 | static struct arm_boot_info cubieboard_binfo = { | ||
344 | @@ -XXX,XX +XXX,XX @@ static void cubieboard_init(MachineState *machine) | ||
345 | { | ||
346 | AwA10State *a10; | ||
347 | Error *err = NULL; | ||
348 | + DriveInfo *di; | ||
349 | + BlockBackend *blk; | ||
350 | + BusState *bus; | ||
351 | + DeviceState *carddev; | ||
352 | |||
353 | /* BIOS is not supported by this board */ | ||
354 | if (bios_name) { | ||
355 | @@ -XXX,XX +XXX,XX @@ static void cubieboard_init(MachineState *machine) | ||
356 | exit(1); | ||
357 | } | ||
358 | |||
359 | + /* Retrieve SD bus */ | ||
360 | + di = drive_get_next(IF_SD); | ||
361 | + blk = di ? blk_by_legacy_dinfo(di) : NULL; | ||
362 | + bus = qdev_get_child_bus(DEVICE(a10), "sd-bus"); | ||
363 | + | ||
364 | + /* Plug in SD card */ | ||
365 | + carddev = qdev_create(bus, TYPE_SD_CARD); | ||
366 | + qdev_prop_set_drive(carddev, "drive", blk, &error_fatal); | ||
367 | + object_property_set_bool(OBJECT(carddev), true, "realized", &error_fatal); | ||
368 | + | ||
369 | memory_region_add_subregion(get_system_memory(), AW_A10_SDRAM_BASE, | ||
370 | machine->ram); | ||
371 | |||
372 | diff --git a/hw/arm/orangepi.c b/hw/arm/orangepi.c | ||
373 | index XXXXXXX..XXXXXXX 100644 | ||
374 | --- a/hw/arm/orangepi.c | ||
375 | +++ b/hw/arm/orangepi.c | ||
376 | @@ -XXX,XX +XXX,XX @@ static struct arm_boot_info orangepi_binfo = { | ||
377 | static void orangepi_init(MachineState *machine) | ||
378 | { | ||
379 | AwH3State *h3; | ||
380 | + DriveInfo *di; | ||
381 | + BlockBackend *blk; | ||
382 | + BusState *bus; | ||
383 | + DeviceState *carddev; | ||
384 | |||
385 | /* BIOS is not supported by this board */ | ||
386 | if (bios_name) { | ||
387 | @@ -XXX,XX +XXX,XX @@ static void orangepi_init(MachineState *machine) | ||
388 | /* Mark H3 object realized */ | ||
389 | object_property_set_bool(OBJECT(h3), true, "realized", &error_abort); | ||
390 | |||
391 | + /* Retrieve SD bus */ | ||
392 | + di = drive_get_next(IF_SD); | ||
393 | + blk = di ? blk_by_legacy_dinfo(di) : NULL; | ||
394 | + bus = qdev_get_child_bus(DEVICE(h3), "sd-bus"); | ||
395 | + | ||
396 | + /* Plug in SD card */ | ||
397 | + carddev = qdev_create(bus, TYPE_SD_CARD); | ||
398 | + qdev_prop_set_drive(carddev, "drive", blk, &error_fatal); | ||
399 | + object_property_set_bool(OBJECT(carddev), true, "realized", &error_fatal); | ||
400 | + | ||
401 | /* SDRAM */ | ||
402 | memory_region_add_subregion(get_system_memory(), h3->memmap[AW_H3_SDRAM], | ||
403 | machine->ram); | ||
404 | @@ -XXX,XX +XXX,XX @@ static void orangepi_machine_init(MachineClass *mc) | ||
405 | { | ||
406 | mc->desc = "Orange Pi PC"; | ||
407 | mc->init = orangepi_init; | ||
408 | + mc->block_default_type = IF_SD; | ||
409 | + mc->units_per_default_bus = 1; | ||
410 | mc->min_cpus = AW_H3_NUM_CPUS; | ||
411 | mc->max_cpus = AW_H3_NUM_CPUS; | ||
412 | mc->default_cpus = AW_H3_NUM_CPUS; | ||
413 | diff --git a/hw/sd/allwinner-sdhost.c b/hw/sd/allwinner-sdhost.c | ||
414 | new file mode 100644 | ||
415 | index XXXXXXX..XXXXXXX | ||
416 | --- /dev/null | ||
417 | +++ b/hw/sd/allwinner-sdhost.c | ||
418 | @@ -XXX,XX +XXX,XX @@ | ||
419 | +/* | ||
420 | + * Allwinner (sun4i and above) SD Host Controller emulation | ||
421 | + * | ||
422 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
423 | + * | ||
424 | + * This program is free software: you can redistribute it and/or modify | ||
425 | + * it under the terms of the GNU General Public License as published by | ||
426 | + * the Free Software Foundation, either version 2 of the License, or | ||
427 | + * (at your option) any later version. | ||
428 | + * | ||
429 | + * This program is distributed in the hope that it will be useful, | ||
430 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
431 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
432 | + * GNU General Public License for more details. | ||
433 | + * | ||
434 | + * You should have received a copy of the GNU General Public License | ||
435 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
436 | + */ | ||
437 | + | ||
438 | +#include "qemu/osdep.h" | ||
439 | +#include "qemu/log.h" | ||
440 | +#include "qemu/module.h" | ||
441 | +#include "qemu/units.h" | ||
442 | +#include "sysemu/blockdev.h" | ||
443 | +#include "hw/irq.h" | ||
444 | +#include "hw/sd/allwinner-sdhost.h" | ||
445 | +#include "migration/vmstate.h" | ||
446 | +#include "trace.h" | ||
447 | + | ||
448 | +#define TYPE_AW_SDHOST_BUS "allwinner-sdhost-bus" | ||
449 | +#define AW_SDHOST_BUS(obj) \ | ||
450 | + OBJECT_CHECK(SDBus, (obj), TYPE_AW_SDHOST_BUS) | ||
451 | + | ||
452 | +/* SD Host register offsets */ | ||
453 | +enum { | ||
454 | + REG_SD_GCTL = 0x00, /* Global Control */ | ||
455 | + REG_SD_CKCR = 0x04, /* Clock Control */ | ||
456 | + REG_SD_TMOR = 0x08, /* Timeout */ | ||
457 | + REG_SD_BWDR = 0x0C, /* Bus Width */ | ||
458 | + REG_SD_BKSR = 0x10, /* Block Size */ | ||
459 | + REG_SD_BYCR = 0x14, /* Byte Count */ | ||
460 | + REG_SD_CMDR = 0x18, /* Command */ | ||
461 | + REG_SD_CAGR = 0x1C, /* Command Argument */ | ||
462 | + REG_SD_RESP0 = 0x20, /* Response Zero */ | ||
463 | + REG_SD_RESP1 = 0x24, /* Response One */ | ||
464 | + REG_SD_RESP2 = 0x28, /* Response Two */ | ||
465 | + REG_SD_RESP3 = 0x2C, /* Response Three */ | ||
466 | + REG_SD_IMKR = 0x30, /* Interrupt Mask */ | ||
467 | + REG_SD_MISR = 0x34, /* Masked Interrupt Status */ | ||
468 | + REG_SD_RISR = 0x38, /* Raw Interrupt Status */ | ||
469 | + REG_SD_STAR = 0x3C, /* Status */ | ||
470 | + REG_SD_FWLR = 0x40, /* FIFO Water Level */ | ||
471 | + REG_SD_FUNS = 0x44, /* FIFO Function Select */ | ||
472 | + REG_SD_DBGC = 0x50, /* Debug Enable */ | ||
473 | + REG_SD_A12A = 0x58, /* Auto command 12 argument */ | ||
474 | + REG_SD_NTSR = 0x5C, /* SD NewTiming Set */ | ||
475 | + REG_SD_SDBG = 0x60, /* SD newTiming Set Debug */ | ||
476 | + REG_SD_HWRST = 0x78, /* Hardware Reset Register */ | ||
477 | + REG_SD_DMAC = 0x80, /* Internal DMA Controller Control */ | ||
478 | + REG_SD_DLBA = 0x84, /* Descriptor List Base Address */ | ||
479 | + REG_SD_IDST = 0x88, /* Internal DMA Controller Status */ | ||
480 | + REG_SD_IDIE = 0x8C, /* Internal DMA Controller IRQ Enable */ | ||
481 | + REG_SD_THLDC = 0x100, /* Card Threshold Control */ | ||
482 | + REG_SD_DSBD = 0x10C, /* eMMC DDR Start Bit Detection Control */ | ||
483 | + REG_SD_RES_CRC = 0x110, /* Response CRC from card/eMMC */ | ||
484 | + REG_SD_DATA7_CRC = 0x114, /* CRC Data 7 from card/eMMC */ | ||
485 | + REG_SD_DATA6_CRC = 0x118, /* CRC Data 6 from card/eMMC */ | ||
486 | + REG_SD_DATA5_CRC = 0x11C, /* CRC Data 5 from card/eMMC */ | ||
487 | + REG_SD_DATA4_CRC = 0x120, /* CRC Data 4 from card/eMMC */ | ||
488 | + REG_SD_DATA3_CRC = 0x124, /* CRC Data 3 from card/eMMC */ | ||
489 | + REG_SD_DATA2_CRC = 0x128, /* CRC Data 2 from card/eMMC */ | ||
490 | + REG_SD_DATA1_CRC = 0x12C, /* CRC Data 1 from card/eMMC */ | ||
491 | + REG_SD_DATA0_CRC = 0x130, /* CRC Data 0 from card/eMMC */ | ||
492 | + REG_SD_CRC_STA = 0x134, /* CRC status from card/eMMC during write */ | ||
493 | + REG_SD_FIFO = 0x200, /* Read/Write FIFO */ | ||
494 | +}; | ||
495 | + | ||
496 | +/* SD Host register flags */ | ||
497 | +enum { | ||
498 | + SD_GCTL_FIFO_AC_MOD = (1 << 31), | ||
499 | + SD_GCTL_DDR_MOD_SEL = (1 << 10), | ||
500 | + SD_GCTL_CD_DBC_ENB = (1 << 8), | ||
501 | + SD_GCTL_DMA_ENB = (1 << 5), | ||
502 | + SD_GCTL_INT_ENB = (1 << 4), | ||
503 | + SD_GCTL_DMA_RST = (1 << 2), | ||
504 | + SD_GCTL_FIFO_RST = (1 << 1), | ||
505 | + SD_GCTL_SOFT_RST = (1 << 0), | ||
506 | +}; | ||
507 | + | ||
508 | +enum { | ||
509 | + SD_CMDR_LOAD = (1 << 31), | ||
510 | + SD_CMDR_CLKCHANGE = (1 << 21), | ||
511 | + SD_CMDR_WRITE = (1 << 10), | ||
512 | + SD_CMDR_AUTOSTOP = (1 << 12), | ||
513 | + SD_CMDR_DATA = (1 << 9), | ||
514 | + SD_CMDR_RESPONSE_LONG = (1 << 7), | ||
515 | + SD_CMDR_RESPONSE = (1 << 6), | ||
516 | + SD_CMDR_CMDID_MASK = (0x3f), | ||
517 | +}; | ||
518 | + | ||
519 | +enum { | ||
520 | + SD_RISR_CARD_REMOVE = (1 << 31), | ||
521 | + SD_RISR_CARD_INSERT = (1 << 30), | ||
522 | + SD_RISR_SDIO_INTR = (1 << 16), | ||
523 | + SD_RISR_AUTOCMD_DONE = (1 << 14), | ||
524 | + SD_RISR_DATA_COMPLETE = (1 << 3), | ||
525 | + SD_RISR_CMD_COMPLETE = (1 << 2), | ||
526 | + SD_RISR_NO_RESPONSE = (1 << 1), | ||
527 | +}; | ||
528 | + | ||
529 | +enum { | ||
530 | + SD_STAR_CARD_PRESENT = (1 << 8), | ||
531 | +}; | ||
532 | + | ||
533 | +enum { | ||
534 | + SD_IDST_INT_SUMMARY = (1 << 8), | ||
535 | + SD_IDST_RECEIVE_IRQ = (1 << 1), | ||
536 | + SD_IDST_TRANSMIT_IRQ = (1 << 0), | ||
537 | + SD_IDST_IRQ_MASK = (1 << 1) | (1 << 0) | (1 << 8), | ||
538 | + SD_IDST_WR_MASK = (0x3ff), | ||
539 | +}; | ||
540 | + | ||
541 | +/* SD Host register reset values */ | ||
542 | +enum { | ||
543 | + REG_SD_GCTL_RST = 0x00000300, | ||
544 | + REG_SD_CKCR_RST = 0x0, | ||
545 | + REG_SD_TMOR_RST = 0xFFFFFF40, | ||
546 | + REG_SD_BWDR_RST = 0x0, | ||
547 | + REG_SD_BKSR_RST = 0x00000200, | ||
548 | + REG_SD_BYCR_RST = 0x00000200, | ||
549 | + REG_SD_CMDR_RST = 0x0, | ||
550 | + REG_SD_CAGR_RST = 0x0, | ||
551 | + REG_SD_RESP_RST = 0x0, | ||
552 | + REG_SD_IMKR_RST = 0x0, | ||
553 | + REG_SD_MISR_RST = 0x0, | ||
554 | + REG_SD_RISR_RST = 0x0, | ||
555 | + REG_SD_STAR_RST = 0x00000100, | ||
556 | + REG_SD_FWLR_RST = 0x000F0000, | ||
557 | + REG_SD_FUNS_RST = 0x0, | ||
558 | + REG_SD_DBGC_RST = 0x0, | ||
559 | + REG_SD_A12A_RST = 0x0000FFFF, | ||
560 | + REG_SD_NTSR_RST = 0x00000001, | ||
561 | + REG_SD_SDBG_RST = 0x0, | ||
562 | + REG_SD_HWRST_RST = 0x00000001, | ||
563 | + REG_SD_DMAC_RST = 0x0, | ||
564 | + REG_SD_DLBA_RST = 0x0, | ||
565 | + REG_SD_IDST_RST = 0x0, | ||
566 | + REG_SD_IDIE_RST = 0x0, | ||
567 | + REG_SD_THLDC_RST = 0x0, | ||
568 | + REG_SD_DSBD_RST = 0x0, | ||
569 | + REG_SD_RES_CRC_RST = 0x0, | ||
570 | + REG_SD_DATA_CRC_RST = 0x0, | ||
571 | + REG_SD_CRC_STA_RST = 0x0, | ||
572 | + REG_SD_FIFO_RST = 0x0, | ||
573 | +}; | ||
574 | + | ||
575 | +/* Data transfer descriptor for DMA */ | ||
576 | +typedef struct TransferDescriptor { | ||
577 | + uint32_t status; /* Status flags */ | ||
578 | + uint32_t size; /* Data buffer size */ | ||
579 | + uint32_t addr; /* Data buffer address */ | ||
580 | + uint32_t next; /* Physical address of next descriptor */ | ||
581 | +} TransferDescriptor; | ||
582 | + | ||
583 | +/* Data transfer descriptor flags */ | ||
584 | +enum { | ||
585 | + DESC_STATUS_HOLD = (1 << 31), /* Set when descriptor is in use by DMA */ | ||
586 | + DESC_STATUS_ERROR = (1 << 30), /* Set when DMA transfer error occurred */ | ||
587 | + DESC_STATUS_CHAIN = (1 << 4), /* Indicates chained descriptor. */ | ||
588 | + DESC_STATUS_FIRST = (1 << 3), /* Set on the first descriptor */ | ||
589 | + DESC_STATUS_LAST = (1 << 2), /* Set on the last descriptor */ | ||
590 | + DESC_STATUS_NOIRQ = (1 << 1), /* Skip raising interrupt after transfer */ | ||
591 | + DESC_SIZE_MASK = (0xfffffffc) | ||
592 | +}; | ||
593 | + | ||
594 | +static void allwinner_sdhost_update_irq(AwSdHostState *s) | ||
595 | +{ | 40 | +{ |
596 | + uint32_t irq; | 41 | + return -float16_le(float16_abs(op2), float16_abs(op1), stat); |
597 | + | ||
598 | + if (s->global_ctl & SD_GCTL_INT_ENB) { | ||
599 | + irq = s->irq_status & s->irq_mask; | ||
600 | + } else { | ||
601 | + irq = 0; | ||
602 | + } | ||
603 | + | ||
604 | + trace_allwinner_sdhost_update_irq(irq); | ||
605 | + qemu_set_irq(s->irq, irq); | ||
606 | +} | 42 | +} |
607 | + | 43 | + |
608 | +static void allwinner_sdhost_update_transfer_cnt(AwSdHostState *s, | 44 | +static uint32_t float32_acge(float32 op1, float32 op2, float_status *stat) |
609 | + uint32_t bytes) | ||
610 | +{ | 45 | +{ |
611 | + if (s->transfer_cnt > bytes) { | 46 | + return -float32_le(float32_abs(op2), float32_abs(op1), stat); |
612 | + s->transfer_cnt -= bytes; | ||
613 | + } else { | ||
614 | + s->transfer_cnt = 0; | ||
615 | + } | ||
616 | + | ||
617 | + if (!s->transfer_cnt) { | ||
618 | + s->irq_status |= SD_RISR_DATA_COMPLETE; | ||
619 | + } | ||
620 | +} | 47 | +} |
621 | + | 48 | + |
622 | +static void allwinner_sdhost_set_inserted(DeviceState *dev, bool inserted) | 49 | +static uint16_t float16_acgt(float16 op1, float16 op2, float_status *stat) |
623 | +{ | 50 | +{ |
624 | + AwSdHostState *s = AW_SDHOST(dev); | 51 | + return -float16_lt(float16_abs(op2), float16_abs(op1), stat); |
625 | + | ||
626 | + trace_allwinner_sdhost_set_inserted(inserted); | ||
627 | + | ||
628 | + if (inserted) { | ||
629 | + s->irq_status |= SD_RISR_CARD_INSERT; | ||
630 | + s->irq_status &= ~SD_RISR_CARD_REMOVE; | ||
631 | + s->status |= SD_STAR_CARD_PRESENT; | ||
632 | + } else { | ||
633 | + s->irq_status &= ~SD_RISR_CARD_INSERT; | ||
634 | + s->irq_status |= SD_RISR_CARD_REMOVE; | ||
635 | + s->status &= ~SD_STAR_CARD_PRESENT; | ||
636 | + } | ||
637 | + | ||
638 | + allwinner_sdhost_update_irq(s); | ||
639 | +} | 52 | +} |
640 | + | 53 | + |
641 | +static void allwinner_sdhost_send_command(AwSdHostState *s) | 54 | +static uint32_t float32_acgt(float32 op1, float32 op2, float_status *stat) |
642 | +{ | 55 | +{ |
643 | + SDRequest request; | 56 | + return -float32_lt(float32_abs(op2), float32_abs(op1), stat); |
644 | + uint8_t resp[16]; | ||
645 | + int rlen; | ||
646 | + | ||
647 | + /* Auto clear load flag */ | ||
648 | + s->command &= ~SD_CMDR_LOAD; | ||
649 | + | ||
650 | + /* Clock change does not actually interact with the SD bus */ | ||
651 | + if (!(s->command & SD_CMDR_CLKCHANGE)) { | ||
652 | + | ||
653 | + /* Prepare request */ | ||
654 | + request.cmd = s->command & SD_CMDR_CMDID_MASK; | ||
655 | + request.arg = s->command_arg; | ||
656 | + | ||
657 | + /* Send request to SD bus */ | ||
658 | + rlen = sdbus_do_command(&s->sdbus, &request, resp); | ||
659 | + if (rlen < 0) { | ||
660 | + goto error; | ||
661 | + } | ||
662 | + | ||
663 | + /* If the command has a response, store it in the response registers */ | ||
664 | + if ((s->command & SD_CMDR_RESPONSE)) { | ||
665 | + if (rlen == 4 && !(s->command & SD_CMDR_RESPONSE_LONG)) { | ||
666 | + s->response[0] = ldl_be_p(&resp[0]); | ||
667 | + s->response[1] = s->response[2] = s->response[3] = 0; | ||
668 | + | ||
669 | + } else if (rlen == 16 && (s->command & SD_CMDR_RESPONSE_LONG)) { | ||
670 | + s->response[0] = ldl_be_p(&resp[12]); | ||
671 | + s->response[1] = ldl_be_p(&resp[8]); | ||
672 | + s->response[2] = ldl_be_p(&resp[4]); | ||
673 | + s->response[3] = ldl_be_p(&resp[0]); | ||
674 | + } else { | ||
675 | + goto error; | ||
676 | + } | ||
677 | + } | ||
678 | + } | ||
679 | + | ||
680 | + /* Set interrupt status bits */ | ||
681 | + s->irq_status |= SD_RISR_CMD_COMPLETE; | ||
682 | + return; | ||
683 | + | ||
684 | +error: | ||
685 | + s->irq_status |= SD_RISR_NO_RESPONSE; | ||
686 | +} | 57 | +} |
687 | + | 58 | + |
688 | +static void allwinner_sdhost_auto_stop(AwSdHostState *s) | 59 | #define DO_2OP(NAME, FUNC, TYPE) \ |
689 | +{ | 60 | void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ |
690 | + /* | 61 | { \ |
691 | + * The stop command (CMD12) ensures the SD bus | 62 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_fcge_s, float32_cge, float32) |
692 | + * returns to the transfer state. | 63 | DO_3OP(gvec_fcgt_h, float16_cgt, float16) |
693 | + */ | 64 | DO_3OP(gvec_fcgt_s, float32_cgt, float32) |
694 | + if ((s->command & SD_CMDR_AUTOSTOP) && (s->transfer_cnt == 0)) { | 65 | |
695 | + /* First save current command registers */ | 66 | +DO_3OP(gvec_facge_h, float16_acge, float16) |
696 | + uint32_t saved_cmd = s->command; | 67 | +DO_3OP(gvec_facge_s, float32_acge, float32) |
697 | + uint32_t saved_arg = s->command_arg; | ||
698 | + | 68 | + |
699 | + /* Prepare stop command (CMD12) */ | 69 | +DO_3OP(gvec_facgt_h, float16_acgt, float16) |
700 | + s->command &= ~SD_CMDR_CMDID_MASK; | 70 | +DO_3OP(gvec_facgt_s, float32_acgt, float32) |
701 | + s->command |= 12; /* CMD12 */ | ||
702 | + s->command_arg = 0; | ||
703 | + | 71 | + |
704 | + /* Put the command on SD bus */ | 72 | #ifdef TARGET_AARCH64 |
705 | + allwinner_sdhost_send_command(s); | 73 | |
706 | + | 74 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) |
707 | + /* Restore command values */ | 75 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
708 | + s->command = saved_cmd; | ||
709 | + s->command_arg = saved_arg; | ||
710 | + | ||
711 | + /* Set IRQ status bit for automatic stop done */ | ||
712 | + s->irq_status |= SD_RISR_AUTOCMD_DONE; | ||
713 | + } | ||
714 | +} | ||
715 | + | ||
716 | +static uint32_t allwinner_sdhost_process_desc(AwSdHostState *s, | ||
717 | + hwaddr desc_addr, | ||
718 | + TransferDescriptor *desc, | ||
719 | + bool is_write, uint32_t max_bytes) | ||
720 | +{ | ||
721 | + AwSdHostClass *klass = AW_SDHOST_GET_CLASS(s); | ||
722 | + uint32_t num_done = 0; | ||
723 | + uint32_t num_bytes = max_bytes; | ||
724 | + uint8_t buf[1024]; | ||
725 | + | ||
726 | + /* Read descriptor */ | ||
727 | + cpu_physical_memory_read(desc_addr, desc, sizeof(*desc)); | ||
728 | + if (desc->size == 0) { | ||
729 | + desc->size = klass->max_desc_size; | ||
730 | + } else if (desc->size > klass->max_desc_size) { | ||
731 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: DMA descriptor buffer size " | ||
732 | + " is out-of-bounds: %" PRIu32 " > %zu", | ||
733 | + __func__, desc->size, klass->max_desc_size); | ||
734 | + desc->size = klass->max_desc_size; | ||
735 | + } | ||
736 | + if (desc->size < num_bytes) { | ||
737 | + num_bytes = desc->size; | ||
738 | + } | ||
739 | + | ||
740 | + trace_allwinner_sdhost_process_desc(desc_addr, desc->size, | ||
741 | + is_write, max_bytes); | ||
742 | + | ||
743 | + while (num_done < num_bytes) { | ||
744 | + /* Try to completely fill the local buffer */ | ||
745 | + uint32_t buf_bytes = num_bytes - num_done; | ||
746 | + if (buf_bytes > sizeof(buf)) { | ||
747 | + buf_bytes = sizeof(buf); | ||
748 | + } | ||
749 | + | ||
750 | + /* Write to SD bus */ | ||
751 | + if (is_write) { | ||
752 | + cpu_physical_memory_read((desc->addr & DESC_SIZE_MASK) + num_done, | ||
753 | + buf, buf_bytes); | ||
754 | + | ||
755 | + for (uint32_t i = 0; i < buf_bytes; i++) { | ||
756 | + sdbus_write_data(&s->sdbus, buf[i]); | ||
757 | + } | ||
758 | + | ||
759 | + /* Read from SD bus */ | ||
760 | + } else { | ||
761 | + for (uint32_t i = 0; i < buf_bytes; i++) { | ||
762 | + buf[i] = sdbus_read_data(&s->sdbus); | ||
763 | + } | ||
764 | + cpu_physical_memory_write((desc->addr & DESC_SIZE_MASK) + num_done, | ||
765 | + buf, buf_bytes); | ||
766 | + } | ||
767 | + num_done += buf_bytes; | ||
768 | + } | ||
769 | + | ||
770 | + /* Clear hold flag and flush descriptor */ | ||
771 | + desc->status &= ~DESC_STATUS_HOLD; | ||
772 | + cpu_physical_memory_write(desc_addr, desc, sizeof(*desc)); | ||
773 | + | ||
774 | + return num_done; | ||
775 | +} | ||
776 | + | ||
777 | +static void allwinner_sdhost_dma(AwSdHostState *s) | ||
778 | +{ | ||
779 | + TransferDescriptor desc; | ||
780 | + hwaddr desc_addr = s->desc_base; | ||
781 | + bool is_write = (s->command & SD_CMDR_WRITE); | ||
782 | + uint32_t bytes_done = 0; | ||
783 | + | ||
784 | + /* Check if DMA can be performed */ | ||
785 | + if (s->byte_count == 0 || s->block_size == 0 || | ||
786 | + !(s->global_ctl & SD_GCTL_DMA_ENB)) { | ||
787 | + return; | ||
788 | + } | ||
789 | + | ||
790 | + /* | ||
791 | + * For read operations, data must be available on the SD bus | ||
792 | + * If not, it is an error and we should not act at all | ||
793 | + */ | ||
794 | + if (!is_write && !sdbus_data_ready(&s->sdbus)) { | ||
795 | + return; | ||
796 | + } | ||
797 | + | ||
798 | + /* Process the DMA descriptors until all data is copied */ | ||
799 | + while (s->byte_count > 0) { | ||
800 | + bytes_done = allwinner_sdhost_process_desc(s, desc_addr, &desc, | ||
801 | + is_write, s->byte_count); | ||
802 | + allwinner_sdhost_update_transfer_cnt(s, bytes_done); | ||
803 | + | ||
804 | + if (bytes_done <= s->byte_count) { | ||
805 | + s->byte_count -= bytes_done; | ||
806 | + } else { | ||
807 | + s->byte_count = 0; | ||
808 | + } | ||
809 | + | ||
810 | + if (desc.status & DESC_STATUS_LAST) { | ||
811 | + break; | ||
812 | + } else { | ||
813 | + desc_addr = desc.next; | ||
814 | + } | ||
815 | + } | ||
816 | + | ||
817 | + /* Raise IRQ to signal DMA is completed */ | ||
818 | + s->irq_status |= SD_RISR_DATA_COMPLETE | SD_RISR_SDIO_INTR; | ||
819 | + | ||
820 | + /* Update DMAC bits */ | ||
821 | + s->dmac_status |= SD_IDST_INT_SUMMARY; | ||
822 | + | ||
823 | + if (is_write) { | ||
824 | + s->dmac_status |= SD_IDST_TRANSMIT_IRQ; | ||
825 | + } else { | ||
826 | + s->dmac_status |= SD_IDST_RECEIVE_IRQ; | ||
827 | + } | ||
828 | +} | ||
829 | + | ||
830 | +static uint64_t allwinner_sdhost_read(void *opaque, hwaddr offset, | ||
831 | + unsigned size) | ||
832 | +{ | ||
833 | + AwSdHostState *s = AW_SDHOST(opaque); | ||
834 | + uint32_t res = 0; | ||
835 | + | ||
836 | + switch (offset) { | ||
837 | + case REG_SD_GCTL: /* Global Control */ | ||
838 | + res = s->global_ctl; | ||
839 | + break; | ||
840 | + case REG_SD_CKCR: /* Clock Control */ | ||
841 | + res = s->clock_ctl; | ||
842 | + break; | ||
843 | + case REG_SD_TMOR: /* Timeout */ | ||
844 | + res = s->timeout; | ||
845 | + break; | ||
846 | + case REG_SD_BWDR: /* Bus Width */ | ||
847 | + res = s->bus_width; | ||
848 | + break; | ||
849 | + case REG_SD_BKSR: /* Block Size */ | ||
850 | + res = s->block_size; | ||
851 | + break; | ||
852 | + case REG_SD_BYCR: /* Byte Count */ | ||
853 | + res = s->byte_count; | ||
854 | + break; | ||
855 | + case REG_SD_CMDR: /* Command */ | ||
856 | + res = s->command; | ||
857 | + break; | ||
858 | + case REG_SD_CAGR: /* Command Argument */ | ||
859 | + res = s->command_arg; | ||
860 | + break; | ||
861 | + case REG_SD_RESP0: /* Response Zero */ | ||
862 | + res = s->response[0]; | ||
863 | + break; | ||
864 | + case REG_SD_RESP1: /* Response One */ | ||
865 | + res = s->response[1]; | ||
866 | + break; | ||
867 | + case REG_SD_RESP2: /* Response Two */ | ||
868 | + res = s->response[2]; | ||
869 | + break; | ||
870 | + case REG_SD_RESP3: /* Response Three */ | ||
871 | + res = s->response[3]; | ||
872 | + break; | ||
873 | + case REG_SD_IMKR: /* Interrupt Mask */ | ||
874 | + res = s->irq_mask; | ||
875 | + break; | ||
876 | + case REG_SD_MISR: /* Masked Interrupt Status */ | ||
877 | + res = s->irq_status & s->irq_mask; | ||
878 | + break; | ||
879 | + case REG_SD_RISR: /* Raw Interrupt Status */ | ||
880 | + res = s->irq_status; | ||
881 | + break; | ||
882 | + case REG_SD_STAR: /* Status */ | ||
883 | + res = s->status; | ||
884 | + break; | ||
885 | + case REG_SD_FWLR: /* FIFO Water Level */ | ||
886 | + res = s->fifo_wlevel; | ||
887 | + break; | ||
888 | + case REG_SD_FUNS: /* FIFO Function Select */ | ||
889 | + res = s->fifo_func_sel; | ||
890 | + break; | ||
891 | + case REG_SD_DBGC: /* Debug Enable */ | ||
892 | + res = s->debug_enable; | ||
893 | + break; | ||
894 | + case REG_SD_A12A: /* Auto command 12 argument */ | ||
895 | + res = s->auto12_arg; | ||
896 | + break; | ||
897 | + case REG_SD_NTSR: /* SD NewTiming Set */ | ||
898 | + res = s->newtiming_set; | ||
899 | + break; | ||
900 | + case REG_SD_SDBG: /* SD newTiming Set Debug */ | ||
901 | + res = s->newtiming_debug; | ||
902 | + break; | ||
903 | + case REG_SD_HWRST: /* Hardware Reset Register */ | ||
904 | + res = s->hardware_rst; | ||
905 | + break; | ||
906 | + case REG_SD_DMAC: /* Internal DMA Controller Control */ | ||
907 | + res = s->dmac; | ||
908 | + break; | ||
909 | + case REG_SD_DLBA: /* Descriptor List Base Address */ | ||
910 | + res = s->desc_base; | ||
911 | + break; | ||
912 | + case REG_SD_IDST: /* Internal DMA Controller Status */ | ||
913 | + res = s->dmac_status; | ||
914 | + break; | ||
915 | + case REG_SD_IDIE: /* Internal DMA Controller Interrupt Enable */ | ||
916 | + res = s->dmac_irq; | ||
917 | + break; | ||
918 | + case REG_SD_THLDC: /* Card Threshold Control */ | ||
919 | + res = s->card_threshold; | ||
920 | + break; | ||
921 | + case REG_SD_DSBD: /* eMMC DDR Start Bit Detection Control */ | ||
922 | + res = s->startbit_detect; | ||
923 | + break; | ||
924 | + case REG_SD_RES_CRC: /* Response CRC from card/eMMC */ | ||
925 | + res = s->response_crc; | ||
926 | + break; | ||
927 | + case REG_SD_DATA7_CRC: /* CRC Data 7 from card/eMMC */ | ||
928 | + case REG_SD_DATA6_CRC: /* CRC Data 6 from card/eMMC */ | ||
929 | + case REG_SD_DATA5_CRC: /* CRC Data 5 from card/eMMC */ | ||
930 | + case REG_SD_DATA4_CRC: /* CRC Data 4 from card/eMMC */ | ||
931 | + case REG_SD_DATA3_CRC: /* CRC Data 3 from card/eMMC */ | ||
932 | + case REG_SD_DATA2_CRC: /* CRC Data 2 from card/eMMC */ | ||
933 | + case REG_SD_DATA1_CRC: /* CRC Data 1 from card/eMMC */ | ||
934 | + case REG_SD_DATA0_CRC: /* CRC Data 0 from card/eMMC */ | ||
935 | + res = s->data_crc[((offset - REG_SD_DATA7_CRC) / sizeof(uint32_t))]; | ||
936 | + break; | ||
937 | + case REG_SD_CRC_STA: /* CRC status from card/eMMC in write operation */ | ||
938 | + res = s->status_crc; | ||
939 | + break; | ||
940 | + case REG_SD_FIFO: /* Read/Write FIFO */ | ||
941 | + if (sdbus_data_ready(&s->sdbus)) { | ||
942 | + res = sdbus_read_data(&s->sdbus); | ||
943 | + res |= sdbus_read_data(&s->sdbus) << 8; | ||
944 | + res |= sdbus_read_data(&s->sdbus) << 16; | ||
945 | + res |= sdbus_read_data(&s->sdbus) << 24; | ||
946 | + allwinner_sdhost_update_transfer_cnt(s, sizeof(uint32_t)); | ||
947 | + allwinner_sdhost_auto_stop(s); | ||
948 | + allwinner_sdhost_update_irq(s); | ||
949 | + } else { | ||
950 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: no data ready on SD bus\n", | ||
951 | + __func__); | ||
952 | + } | ||
953 | + break; | ||
954 | + default: | ||
955 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset %" | ||
956 | + HWADDR_PRIx"\n", __func__, offset); | ||
957 | + res = 0; | ||
958 | + break; | ||
959 | + } | ||
960 | + | ||
961 | + trace_allwinner_sdhost_read(offset, res, size); | ||
962 | + return res; | ||
963 | +} | ||
964 | + | ||
965 | +static void allwinner_sdhost_write(void *opaque, hwaddr offset, | ||
966 | + uint64_t value, unsigned size) | ||
967 | +{ | ||
968 | + AwSdHostState *s = AW_SDHOST(opaque); | ||
969 | + | ||
970 | + trace_allwinner_sdhost_write(offset, value, size); | ||
971 | + | ||
972 | + switch (offset) { | ||
973 | + case REG_SD_GCTL: /* Global Control */ | ||
974 | + s->global_ctl = value; | ||
975 | + s->global_ctl &= ~(SD_GCTL_DMA_RST | SD_GCTL_FIFO_RST | | ||
976 | + SD_GCTL_SOFT_RST); | ||
977 | + allwinner_sdhost_update_irq(s); | ||
978 | + break; | ||
979 | + case REG_SD_CKCR: /* Clock Control */ | ||
980 | + s->clock_ctl = value; | ||
981 | + break; | ||
982 | + case REG_SD_TMOR: /* Timeout */ | ||
983 | + s->timeout = value; | ||
984 | + break; | ||
985 | + case REG_SD_BWDR: /* Bus Width */ | ||
986 | + s->bus_width = value; | ||
987 | + break; | ||
988 | + case REG_SD_BKSR: /* Block Size */ | ||
989 | + s->block_size = value; | ||
990 | + break; | ||
991 | + case REG_SD_BYCR: /* Byte Count */ | ||
992 | + s->byte_count = value; | ||
993 | + s->transfer_cnt = value; | ||
994 | + break; | ||
995 | + case REG_SD_CMDR: /* Command */ | ||
996 | + s->command = value; | ||
997 | + if (value & SD_CMDR_LOAD) { | ||
998 | + allwinner_sdhost_send_command(s); | ||
999 | + allwinner_sdhost_dma(s); | ||
1000 | + allwinner_sdhost_auto_stop(s); | ||
1001 | + } | ||
1002 | + allwinner_sdhost_update_irq(s); | ||
1003 | + break; | ||
1004 | + case REG_SD_CAGR: /* Command Argument */ | ||
1005 | + s->command_arg = value; | ||
1006 | + break; | ||
1007 | + case REG_SD_RESP0: /* Response Zero */ | ||
1008 | + s->response[0] = value; | ||
1009 | + break; | ||
1010 | + case REG_SD_RESP1: /* Response One */ | ||
1011 | + s->response[1] = value; | ||
1012 | + break; | ||
1013 | + case REG_SD_RESP2: /* Response Two */ | ||
1014 | + s->response[2] = value; | ||
1015 | + break; | ||
1016 | + case REG_SD_RESP3: /* Response Three */ | ||
1017 | + s->response[3] = value; | ||
1018 | + break; | ||
1019 | + case REG_SD_IMKR: /* Interrupt Mask */ | ||
1020 | + s->irq_mask = value; | ||
1021 | + allwinner_sdhost_update_irq(s); | ||
1022 | + break; | ||
1023 | + case REG_SD_MISR: /* Masked Interrupt Status */ | ||
1024 | + case REG_SD_RISR: /* Raw Interrupt Status */ | ||
1025 | + s->irq_status &= ~value; | ||
1026 | + allwinner_sdhost_update_irq(s); | ||
1027 | + break; | ||
1028 | + case REG_SD_STAR: /* Status */ | ||
1029 | + s->status &= ~value; | ||
1030 | + allwinner_sdhost_update_irq(s); | ||
1031 | + break; | ||
1032 | + case REG_SD_FWLR: /* FIFO Water Level */ | ||
1033 | + s->fifo_wlevel = value; | ||
1034 | + break; | ||
1035 | + case REG_SD_FUNS: /* FIFO Function Select */ | ||
1036 | + s->fifo_func_sel = value; | ||
1037 | + break; | ||
1038 | + case REG_SD_DBGC: /* Debug Enable */ | ||
1039 | + s->debug_enable = value; | ||
1040 | + break; | ||
1041 | + case REG_SD_A12A: /* Auto command 12 argument */ | ||
1042 | + s->auto12_arg = value; | ||
1043 | + break; | ||
1044 | + case REG_SD_NTSR: /* SD NewTiming Set */ | ||
1045 | + s->newtiming_set = value; | ||
1046 | + break; | ||
1047 | + case REG_SD_SDBG: /* SD newTiming Set Debug */ | ||
1048 | + s->newtiming_debug = value; | ||
1049 | + break; | ||
1050 | + case REG_SD_HWRST: /* Hardware Reset Register */ | ||
1051 | + s->hardware_rst = value; | ||
1052 | + break; | ||
1053 | + case REG_SD_DMAC: /* Internal DMA Controller Control */ | ||
1054 | + s->dmac = value; | ||
1055 | + allwinner_sdhost_update_irq(s); | ||
1056 | + break; | ||
1057 | + case REG_SD_DLBA: /* Descriptor List Base Address */ | ||
1058 | + s->desc_base = value; | ||
1059 | + break; | ||
1060 | + case REG_SD_IDST: /* Internal DMA Controller Status */ | ||
1061 | + s->dmac_status &= (~SD_IDST_WR_MASK) | (~value & SD_IDST_WR_MASK); | ||
1062 | + allwinner_sdhost_update_irq(s); | ||
1063 | + break; | ||
1064 | + case REG_SD_IDIE: /* Internal DMA Controller Interrupt Enable */ | ||
1065 | + s->dmac_irq = value; | ||
1066 | + allwinner_sdhost_update_irq(s); | ||
1067 | + break; | ||
1068 | + case REG_SD_THLDC: /* Card Threshold Control */ | ||
1069 | + s->card_threshold = value; | ||
1070 | + break; | ||
1071 | + case REG_SD_DSBD: /* eMMC DDR Start Bit Detection Control */ | ||
1072 | + s->startbit_detect = value; | ||
1073 | + break; | ||
1074 | + case REG_SD_FIFO: /* Read/Write FIFO */ | ||
1075 | + sdbus_write_data(&s->sdbus, value & 0xff); | ||
1076 | + sdbus_write_data(&s->sdbus, (value >> 8) & 0xff); | ||
1077 | + sdbus_write_data(&s->sdbus, (value >> 16) & 0xff); | ||
1078 | + sdbus_write_data(&s->sdbus, (value >> 24) & 0xff); | ||
1079 | + allwinner_sdhost_update_transfer_cnt(s, sizeof(uint32_t)); | ||
1080 | + allwinner_sdhost_auto_stop(s); | ||
1081 | + allwinner_sdhost_update_irq(s); | ||
1082 | + break; | ||
1083 | + case REG_SD_RES_CRC: /* Response CRC from card/eMMC */ | ||
1084 | + case REG_SD_DATA7_CRC: /* CRC Data 7 from card/eMMC */ | ||
1085 | + case REG_SD_DATA6_CRC: /* CRC Data 6 from card/eMMC */ | ||
1086 | + case REG_SD_DATA5_CRC: /* CRC Data 5 from card/eMMC */ | ||
1087 | + case REG_SD_DATA4_CRC: /* CRC Data 4 from card/eMMC */ | ||
1088 | + case REG_SD_DATA3_CRC: /* CRC Data 3 from card/eMMC */ | ||
1089 | + case REG_SD_DATA2_CRC: /* CRC Data 2 from card/eMMC */ | ||
1090 | + case REG_SD_DATA1_CRC: /* CRC Data 1 from card/eMMC */ | ||
1091 | + case REG_SD_DATA0_CRC: /* CRC Data 0 from card/eMMC */ | ||
1092 | + case REG_SD_CRC_STA: /* CRC status from card/eMMC in write operation */ | ||
1093 | + break; | ||
1094 | + default: | ||
1095 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset %" | ||
1096 | + HWADDR_PRIx"\n", __func__, offset); | ||
1097 | + break; | ||
1098 | + } | ||
1099 | +} | ||
1100 | + | ||
1101 | +static const MemoryRegionOps allwinner_sdhost_ops = { | ||
1102 | + .read = allwinner_sdhost_read, | ||
1103 | + .write = allwinner_sdhost_write, | ||
1104 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
1105 | + .valid = { | ||
1106 | + .min_access_size = 4, | ||
1107 | + .max_access_size = 4, | ||
1108 | + }, | ||
1109 | + .impl.min_access_size = 4, | ||
1110 | +}; | ||
1111 | + | ||
1112 | +static const VMStateDescription vmstate_allwinner_sdhost = { | ||
1113 | + .name = "allwinner-sdhost", | ||
1114 | + .version_id = 1, | ||
1115 | + .minimum_version_id = 1, | ||
1116 | + .fields = (VMStateField[]) { | ||
1117 | + VMSTATE_UINT32(global_ctl, AwSdHostState), | ||
1118 | + VMSTATE_UINT32(clock_ctl, AwSdHostState), | ||
1119 | + VMSTATE_UINT32(timeout, AwSdHostState), | ||
1120 | + VMSTATE_UINT32(bus_width, AwSdHostState), | ||
1121 | + VMSTATE_UINT32(block_size, AwSdHostState), | ||
1122 | + VMSTATE_UINT32(byte_count, AwSdHostState), | ||
1123 | + VMSTATE_UINT32(transfer_cnt, AwSdHostState), | ||
1124 | + VMSTATE_UINT32(command, AwSdHostState), | ||
1125 | + VMSTATE_UINT32(command_arg, AwSdHostState), | ||
1126 | + VMSTATE_UINT32_ARRAY(response, AwSdHostState, 4), | ||
1127 | + VMSTATE_UINT32(irq_mask, AwSdHostState), | ||
1128 | + VMSTATE_UINT32(irq_status, AwSdHostState), | ||
1129 | + VMSTATE_UINT32(status, AwSdHostState), | ||
1130 | + VMSTATE_UINT32(fifo_wlevel, AwSdHostState), | ||
1131 | + VMSTATE_UINT32(fifo_func_sel, AwSdHostState), | ||
1132 | + VMSTATE_UINT32(debug_enable, AwSdHostState), | ||
1133 | + VMSTATE_UINT32(auto12_arg, AwSdHostState), | ||
1134 | + VMSTATE_UINT32(newtiming_set, AwSdHostState), | ||
1135 | + VMSTATE_UINT32(newtiming_debug, AwSdHostState), | ||
1136 | + VMSTATE_UINT32(hardware_rst, AwSdHostState), | ||
1137 | + VMSTATE_UINT32(dmac, AwSdHostState), | ||
1138 | + VMSTATE_UINT32(desc_base, AwSdHostState), | ||
1139 | + VMSTATE_UINT32(dmac_status, AwSdHostState), | ||
1140 | + VMSTATE_UINT32(dmac_irq, AwSdHostState), | ||
1141 | + VMSTATE_UINT32(card_threshold, AwSdHostState), | ||
1142 | + VMSTATE_UINT32(startbit_detect, AwSdHostState), | ||
1143 | + VMSTATE_UINT32(response_crc, AwSdHostState), | ||
1144 | + VMSTATE_UINT32_ARRAY(data_crc, AwSdHostState, 8), | ||
1145 | + VMSTATE_UINT32(status_crc, AwSdHostState), | ||
1146 | + VMSTATE_END_OF_LIST() | ||
1147 | + } | ||
1148 | +}; | ||
1149 | + | ||
1150 | +static void allwinner_sdhost_init(Object *obj) | ||
1151 | +{ | ||
1152 | + AwSdHostState *s = AW_SDHOST(obj); | ||
1153 | + | ||
1154 | + qbus_create_inplace(&s->sdbus, sizeof(s->sdbus), | ||
1155 | + TYPE_AW_SDHOST_BUS, DEVICE(s), "sd-bus"); | ||
1156 | + | ||
1157 | + memory_region_init_io(&s->iomem, obj, &allwinner_sdhost_ops, s, | ||
1158 | + TYPE_AW_SDHOST, 4 * KiB); | ||
1159 | + sysbus_init_mmio(SYS_BUS_DEVICE(s), &s->iomem); | ||
1160 | + sysbus_init_irq(SYS_BUS_DEVICE(s), &s->irq); | ||
1161 | +} | ||
1162 | + | ||
1163 | +static void allwinner_sdhost_reset(DeviceState *dev) | ||
1164 | +{ | ||
1165 | + AwSdHostState *s = AW_SDHOST(dev); | ||
1166 | + | ||
1167 | + s->global_ctl = REG_SD_GCTL_RST; | ||
1168 | + s->clock_ctl = REG_SD_CKCR_RST; | ||
1169 | + s->timeout = REG_SD_TMOR_RST; | ||
1170 | + s->bus_width = REG_SD_BWDR_RST; | ||
1171 | + s->block_size = REG_SD_BKSR_RST; | ||
1172 | + s->byte_count = REG_SD_BYCR_RST; | ||
1173 | + s->transfer_cnt = 0; | ||
1174 | + | ||
1175 | + s->command = REG_SD_CMDR_RST; | ||
1176 | + s->command_arg = REG_SD_CAGR_RST; | ||
1177 | + | ||
1178 | + for (int i = 0; i < ARRAY_SIZE(s->response); i++) { | ||
1179 | + s->response[i] = REG_SD_RESP_RST; | ||
1180 | + } | ||
1181 | + | ||
1182 | + s->irq_mask = REG_SD_IMKR_RST; | ||
1183 | + s->irq_status = REG_SD_RISR_RST; | ||
1184 | + s->status = REG_SD_STAR_RST; | ||
1185 | + | ||
1186 | + s->fifo_wlevel = REG_SD_FWLR_RST; | ||
1187 | + s->fifo_func_sel = REG_SD_FUNS_RST; | ||
1188 | + s->debug_enable = REG_SD_DBGC_RST; | ||
1189 | + s->auto12_arg = REG_SD_A12A_RST; | ||
1190 | + s->newtiming_set = REG_SD_NTSR_RST; | ||
1191 | + s->newtiming_debug = REG_SD_SDBG_RST; | ||
1192 | + s->hardware_rst = REG_SD_HWRST_RST; | ||
1193 | + s->dmac = REG_SD_DMAC_RST; | ||
1194 | + s->desc_base = REG_SD_DLBA_RST; | ||
1195 | + s->dmac_status = REG_SD_IDST_RST; | ||
1196 | + s->dmac_irq = REG_SD_IDIE_RST; | ||
1197 | + s->card_threshold = REG_SD_THLDC_RST; | ||
1198 | + s->startbit_detect = REG_SD_DSBD_RST; | ||
1199 | + s->response_crc = REG_SD_RES_CRC_RST; | ||
1200 | + | ||
1201 | + for (int i = 0; i < ARRAY_SIZE(s->data_crc); i++) { | ||
1202 | + s->data_crc[i] = REG_SD_DATA_CRC_RST; | ||
1203 | + } | ||
1204 | + | ||
1205 | + s->status_crc = REG_SD_CRC_STA_RST; | ||
1206 | +} | ||
1207 | + | ||
1208 | +static void allwinner_sdhost_bus_class_init(ObjectClass *klass, void *data) | ||
1209 | +{ | ||
1210 | + SDBusClass *sbc = SD_BUS_CLASS(klass); | ||
1211 | + | ||
1212 | + sbc->set_inserted = allwinner_sdhost_set_inserted; | ||
1213 | +} | ||
1214 | + | ||
1215 | +static void allwinner_sdhost_class_init(ObjectClass *klass, void *data) | ||
1216 | +{ | ||
1217 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
1218 | + | ||
1219 | + dc->reset = allwinner_sdhost_reset; | ||
1220 | + dc->vmsd = &vmstate_allwinner_sdhost; | ||
1221 | +} | ||
1222 | + | ||
1223 | +static void allwinner_sdhost_sun4i_class_init(ObjectClass *klass, void *data) | ||
1224 | +{ | ||
1225 | + AwSdHostClass *sc = AW_SDHOST_CLASS(klass); | ||
1226 | + sc->max_desc_size = 8 * KiB; | ||
1227 | +} | ||
1228 | + | ||
1229 | +static void allwinner_sdhost_sun5i_class_init(ObjectClass *klass, void *data) | ||
1230 | +{ | ||
1231 | + AwSdHostClass *sc = AW_SDHOST_CLASS(klass); | ||
1232 | + sc->max_desc_size = 64 * KiB; | ||
1233 | +} | ||
1234 | + | ||
1235 | +static TypeInfo allwinner_sdhost_info = { | ||
1236 | + .name = TYPE_AW_SDHOST, | ||
1237 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
1238 | + .instance_init = allwinner_sdhost_init, | ||
1239 | + .instance_size = sizeof(AwSdHostState), | ||
1240 | + .class_init = allwinner_sdhost_class_init, | ||
1241 | + .class_size = sizeof(AwSdHostClass), | ||
1242 | + .abstract = true, | ||
1243 | +}; | ||
1244 | + | ||
1245 | +static const TypeInfo allwinner_sdhost_sun4i_info = { | ||
1246 | + .name = TYPE_AW_SDHOST_SUN4I, | ||
1247 | + .parent = TYPE_AW_SDHOST, | ||
1248 | + .class_init = allwinner_sdhost_sun4i_class_init, | ||
1249 | +}; | ||
1250 | + | ||
1251 | +static const TypeInfo allwinner_sdhost_sun5i_info = { | ||
1252 | + .name = TYPE_AW_SDHOST_SUN5I, | ||
1253 | + .parent = TYPE_AW_SDHOST, | ||
1254 | + .class_init = allwinner_sdhost_sun5i_class_init, | ||
1255 | +}; | ||
1256 | + | ||
1257 | +static const TypeInfo allwinner_sdhost_bus_info = { | ||
1258 | + .name = TYPE_AW_SDHOST_BUS, | ||
1259 | + .parent = TYPE_SD_BUS, | ||
1260 | + .instance_size = sizeof(SDBus), | ||
1261 | + .class_init = allwinner_sdhost_bus_class_init, | ||
1262 | +}; | ||
1263 | + | ||
1264 | +static void allwinner_sdhost_register_types(void) | ||
1265 | +{ | ||
1266 | + type_register_static(&allwinner_sdhost_info); | ||
1267 | + type_register_static(&allwinner_sdhost_sun4i_info); | ||
1268 | + type_register_static(&allwinner_sdhost_sun5i_info); | ||
1269 | + type_register_static(&allwinner_sdhost_bus_info); | ||
1270 | +} | ||
1271 | + | ||
1272 | +type_init(allwinner_sdhost_register_types) | ||
1273 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
1274 | index XXXXXXX..XXXXXXX 100644 | 76 | index XXXXXXX..XXXXXXX 100644 |
1275 | --- a/hw/arm/Kconfig | 77 | --- a/target/arm/translate-neon.c.inc |
1276 | +++ b/hw/arm/Kconfig | 78 | +++ b/target/arm/translate-neon.c.inc |
1277 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_H3 | 79 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VMUL, gen_helper_gvec_fmul_s, gen_helper_gvec_fmul_h) |
1278 | select UNIMP | 80 | DO_3S_FP_GVEC(VCEQ, gen_helper_gvec_fceq_s, gen_helper_gvec_fceq_h) |
1279 | select USB_OHCI | 81 | DO_3S_FP_GVEC(VCGE, gen_helper_gvec_fcge_s, gen_helper_gvec_fcge_h) |
1280 | select USB_EHCI_SYSBUS | 82 | DO_3S_FP_GVEC(VCGT, gen_helper_gvec_fcgt_s, gen_helper_gvec_fcgt_h) |
1281 | + select SD | 83 | +DO_3S_FP_GVEC(VACGE, gen_helper_gvec_facge_s, gen_helper_gvec_facge_h) |
1282 | 84 | +DO_3S_FP_GVEC(VACGT, gen_helper_gvec_facgt_s, gen_helper_gvec_facgt_h) | |
1283 | config RASPI | 85 | |
1284 | bool | 86 | /* |
1285 | diff --git a/hw/sd/trace-events b/hw/sd/trace-events | 87 | * For all the functions using this macro, size == 1 means fp16, |
1286 | index XXXXXXX..XXXXXXX 100644 | 88 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VCGT, gen_helper_gvec_fcgt_s, gen_helper_gvec_fcgt_h) |
1287 | --- a/hw/sd/trace-events | 89 | return do_3same_fp(s, a, FUNC, READS_VD); \ |
1288 | +++ b/hw/sd/trace-events | 90 | } |
1289 | @@ -XXX,XX +XXX,XX @@ | 91 | |
1290 | # See docs/devel/tracing.txt for syntax documentation. | 92 | -DO_3S_FP(VACGE, gen_helper_neon_acge_f32, false) |
1291 | 93 | -DO_3S_FP(VACGT, gen_helper_neon_acgt_f32, false) | |
1292 | +# allwinner-sdhost.c | 94 | DO_3S_FP(VMAX, gen_helper_vfp_maxs, false) |
1293 | +allwinner_sdhost_set_inserted(bool inserted) "inserted %u" | 95 | DO_3S_FP(VMIN, gen_helper_vfp_mins, false) |
1294 | +allwinner_sdhost_process_desc(uint64_t desc_addr, uint32_t desc_size, bool is_write, uint32_t max_bytes) "desc_addr 0x%" PRIx64 " desc_size %" PRIu32 " is_write %u max_bytes %" PRIu32 | 96 | |
1295 | +allwinner_sdhost_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
1296 | +allwinner_sdhost_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | ||
1297 | +allwinner_sdhost_update_irq(uint32_t irq) "IRQ bits 0x%" PRIx32 | ||
1298 | + | ||
1299 | # bcm2835_sdhost.c | ||
1300 | bcm2835_sdhost_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" | ||
1301 | bcm2835_sdhost_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" | ||
1302 | -- | 97 | -- |
1303 | 2.20.1 | 98 | 2.20.1 |
1304 | 99 | ||
1305 | 100 | diff view generated by jsdifflib |
1 | Fix a couple of comment typos. | 1 | Convert the Neon float-point VMAX and VMIN insns over to using |
---|---|---|---|
2 | a gvec helper, and use this to implement the fp16 case. | ||
2 | 3 | ||
3 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20200303174950.3298-5-peter.maydell@linaro.org | 6 | Message-id: 20200828183354.27913-29-peter.maydell@linaro.org |
6 | --- | 7 | --- |
7 | target/arm/helper.c | 2 +- | 8 | target/arm/helper.h | 6 ++++++ |
8 | target/arm/translate.c | 2 +- | 9 | target/arm/vec_helper.c | 6 ++++++ |
9 | 2 files changed, 2 insertions(+), 2 deletions(-) | 10 | target/arm/translate-neon.c.inc | 5 ++--- |
11 | 3 files changed, 14 insertions(+), 3 deletions(-) | ||
10 | 12 | ||
11 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
12 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/target/arm/helper.c | 15 | --- a/target/arm/helper.h |
14 | +++ b/target/arm/helper.c | 16 | +++ b/target/arm/helper.h |
15 | @@ -XXX,XX +XXX,XX @@ void HELPER(rebuild_hflags_m32)(CPUARMState *env, int el) | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_facge_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
18 | DEF_HELPER_FLAGS_5(gvec_facgt_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
19 | DEF_HELPER_FLAGS_5(gvec_facgt_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
20 | |||
21 | +DEF_HELPER_FLAGS_5(gvec_fmax_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
22 | +DEF_HELPER_FLAGS_5(gvec_fmax_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
23 | + | ||
24 | +DEF_HELPER_FLAGS_5(gvec_fmin_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
25 | +DEF_HELPER_FLAGS_5(gvec_fmin_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
26 | + | ||
27 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, | ||
28 | void, ptr, ptr, ptr, ptr, i32) | ||
29 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, | ||
30 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
31 | index XXXXXXX..XXXXXXX 100644 | ||
32 | --- a/target/arm/vec_helper.c | ||
33 | +++ b/target/arm/vec_helper.c | ||
34 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_facge_s, float32_acge, float32) | ||
35 | DO_3OP(gvec_facgt_h, float16_acgt, float16) | ||
36 | DO_3OP(gvec_facgt_s, float32_acgt, float32) | ||
37 | |||
38 | +DO_3OP(gvec_fmax_h, float16_max, float16) | ||
39 | +DO_3OP(gvec_fmax_s, float32_max, float32) | ||
40 | + | ||
41 | +DO_3OP(gvec_fmin_h, float16_min, float16) | ||
42 | +DO_3OP(gvec_fmin_s, float32_min, float32) | ||
43 | + | ||
44 | #ifdef TARGET_AARCH64 | ||
45 | |||
46 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) | ||
47 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
48 | index XXXXXXX..XXXXXXX 100644 | ||
49 | --- a/target/arm/translate-neon.c.inc | ||
50 | +++ b/target/arm/translate-neon.c.inc | ||
51 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VCGE, gen_helper_gvec_fcge_s, gen_helper_gvec_fcge_h) | ||
52 | DO_3S_FP_GVEC(VCGT, gen_helper_gvec_fcgt_s, gen_helper_gvec_fcgt_h) | ||
53 | DO_3S_FP_GVEC(VACGE, gen_helper_gvec_facge_s, gen_helper_gvec_facge_h) | ||
54 | DO_3S_FP_GVEC(VACGT, gen_helper_gvec_facgt_s, gen_helper_gvec_facgt_h) | ||
55 | +DO_3S_FP_GVEC(VMAX, gen_helper_gvec_fmax_s, gen_helper_gvec_fmax_h) | ||
56 | +DO_3S_FP_GVEC(VMIN, gen_helper_gvec_fmin_s, gen_helper_gvec_fmin_h) | ||
16 | 57 | ||
17 | /* | 58 | /* |
18 | * If we have triggered a EL state change we can't rely on the | 59 | * For all the functions using this macro, size == 1 means fp16, |
19 | - * translator having passed it too us, we need to recompute. | 60 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VACGT, gen_helper_gvec_facgt_s, gen_helper_gvec_facgt_h) |
20 | + * translator having passed it to us, we need to recompute. | 61 | return do_3same_fp(s, a, FUNC, READS_VD); \ |
21 | */ | 62 | } |
22 | void HELPER(rebuild_hflags_a32_newel)(CPUARMState *env) | 63 | |
64 | -DO_3S_FP(VMAX, gen_helper_vfp_maxs, false) | ||
65 | -DO_3S_FP(VMIN, gen_helper_vfp_mins, false) | ||
66 | - | ||
67 | static void gen_VMLA_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
68 | TCGv_ptr fpstatus) | ||
23 | { | 69 | { |
24 | diff --git a/target/arm/translate.c b/target/arm/translate.c | ||
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/target/arm/translate.c | ||
27 | +++ b/target/arm/translate.c | ||
28 | @@ -XXX,XX +XXX,XX @@ static int disas_coproc_insn(DisasContext *s, uint32_t insn) | ||
29 | |||
30 | if (!isread && !(ri->type & ARM_CP_SUPPRESS_TB_END)) { | ||
31 | /* | ||
32 | - * A write to any coprocessor regiser that ends a TB | ||
33 | + * A write to any coprocessor register that ends a TB | ||
34 | * must rebuild the hflags for the next TB. | ||
35 | */ | ||
36 | TCGv_i32 tcg_el = tcg_const_i32(s->current_el); | ||
37 | -- | 70 | -- |
38 | 2.20.1 | 71 | 2.20.1 |
39 | 72 | ||
40 | 73 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | Convert the Neon floating point VMAXNM and VMINNM insns to |
---|---|---|---|
2 | using a gvec helper and use this to implement the fp16 case. | ||
2 | 3 | ||
3 | We plan to introduce yet another value for the gic version (nosel). | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | As we already use exotic values such as 0 and -1, let's introduce | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | a dedicated enum type and let vms->gic_version take this | 6 | Message-id: 20200828183354.27913-30-peter.maydell@linaro.org |
6 | type. | 7 | --- |
8 | target/arm/helper.h | 6 ++++++ | ||
9 | target/arm/vec_helper.c | 6 ++++++ | ||
10 | target/arm/translate-neon.c.inc | 23 +++++++++++++++-------- | ||
11 | 3 files changed, 27 insertions(+), 8 deletions(-) | ||
7 | 12 | ||
8 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
11 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
12 | Message-id: 20200311131618.7187-3-eric.auger@redhat.com | ||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
14 | --- | ||
15 | include/hw/arm/virt.h | 11 +++++++++-- | ||
16 | hw/arm/virt.c | 30 +++++++++++++++--------------- | ||
17 | 2 files changed, 24 insertions(+), 17 deletions(-) | ||
18 | |||
19 | diff --git a/include/hw/arm/virt.h b/include/hw/arm/virt.h | ||
20 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
21 | --- a/include/hw/arm/virt.h | 15 | --- a/target/arm/helper.h |
22 | +++ b/include/hw/arm/virt.h | 16 | +++ b/target/arm/helper.h |
23 | @@ -XXX,XX +XXX,XX @@ typedef enum VirtIOMMUType { | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmax_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
24 | VIRT_IOMMU_VIRTIO, | 18 | DEF_HELPER_FLAGS_5(gvec_fmin_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
25 | } VirtIOMMUType; | 19 | DEF_HELPER_FLAGS_5(gvec_fmin_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
26 | 20 | ||
27 | +typedef enum VirtGICType { | 21 | +DEF_HELPER_FLAGS_5(gvec_fmaxnum_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
28 | + VIRT_GIC_VERSION_MAX, | 22 | +DEF_HELPER_FLAGS_5(gvec_fmaxnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
29 | + VIRT_GIC_VERSION_HOST, | ||
30 | + VIRT_GIC_VERSION_2, | ||
31 | + VIRT_GIC_VERSION_3, | ||
32 | +} VirtGICType; | ||
33 | + | 23 | + |
34 | typedef struct MemMapEntry { | 24 | +DEF_HELPER_FLAGS_5(gvec_fminnum_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
35 | hwaddr base; | 25 | +DEF_HELPER_FLAGS_5(gvec_fminnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
36 | hwaddr size; | 26 | + |
37 | @@ -XXX,XX +XXX,XX @@ typedef struct { | 27 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, |
38 | bool highmem_ecam; | 28 | void, ptr, ptr, ptr, ptr, i32) |
39 | bool its; | 29 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, |
40 | bool virt; | 30 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
41 | - int32_t gic_version; | 31 | index XXXXXXX..XXXXXXX 100644 |
42 | + VirtGICType gic_version; | 32 | --- a/target/arm/vec_helper.c |
43 | VirtIOMMUType iommu; | 33 | +++ b/target/arm/vec_helper.c |
44 | uint16_t virtio_iommu_bdf; | 34 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_fmax_s, float32_max, float32) |
45 | struct arm_boot_info bootinfo; | 35 | DO_3OP(gvec_fmin_h, float16_min, float16) |
46 | @@ -XXX,XX +XXX,XX @@ static inline int virt_gicv3_redist_region_count(VirtMachineState *vms) | 36 | DO_3OP(gvec_fmin_s, float32_min, float32) |
47 | uint32_t redist0_capacity = | 37 | |
48 | vms->memmap[VIRT_GIC_REDIST].size / GICV3_REDIST_SIZE; | 38 | +DO_3OP(gvec_fmaxnum_h, float16_maxnum, float16) |
49 | 39 | +DO_3OP(gvec_fmaxnum_s, float32_maxnum, float32) | |
50 | - assert(vms->gic_version == 3); | 40 | + |
51 | + assert(vms->gic_version == VIRT_GIC_VERSION_3); | 41 | +DO_3OP(gvec_fminnum_h, float16_minnum, float16) |
52 | 42 | +DO_3OP(gvec_fminnum_s, float32_minnum, float32) | |
53 | return vms->smp_cpus > redist0_capacity ? 2 : 1; | 43 | + |
44 | #ifdef TARGET_AARCH64 | ||
45 | |||
46 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) | ||
47 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
48 | index XXXXXXX..XXXXXXX 100644 | ||
49 | --- a/target/arm/translate-neon.c.inc | ||
50 | +++ b/target/arm/translate-neon.c.inc | ||
51 | @@ -XXX,XX +XXX,XX @@ static void gen_VMLS_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
52 | DO_3S_FP(VMLA, gen_VMLA_fp_3s, true) | ||
53 | DO_3S_FP(VMLS, gen_VMLS_fp_3s, true) | ||
54 | |||
55 | +WRAP_FP_GVEC(gen_VMAXNM_fp32_3s, FPST_STD, gen_helper_gvec_fmaxnum_s) | ||
56 | +WRAP_FP_GVEC(gen_VMAXNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fmaxnum_h) | ||
57 | +WRAP_FP_GVEC(gen_VMINNM_fp32_3s, FPST_STD, gen_helper_gvec_fminnum_s) | ||
58 | +WRAP_FP_GVEC(gen_VMINNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fminnum_h) | ||
59 | + | ||
60 | static bool trans_VMAXNM_fp_3s(DisasContext *s, arg_3same *a) | ||
61 | { | ||
62 | if (!arm_dc_feature(s, ARM_FEATURE_V8)) { | ||
63 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMAXNM_fp_3s(DisasContext *s, arg_3same *a) | ||
64 | } | ||
65 | |||
66 | if (a->size != 0) { | ||
67 | - /* TODO fp16 support */ | ||
68 | - return false; | ||
69 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { | ||
70 | + return false; | ||
71 | + } | ||
72 | + return do_3same(s, a, gen_VMAXNM_fp16_3s); | ||
73 | } | ||
74 | - | ||
75 | - return do_3same_fp(s, a, gen_helper_vfp_maxnums, false); | ||
76 | + return do_3same(s, a, gen_VMAXNM_fp32_3s); | ||
54 | } | 77 | } |
55 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | 78 | |
56 | index XXXXXXX..XXXXXXX 100644 | 79 | static bool trans_VMINNM_fp_3s(DisasContext *s, arg_3same *a) |
57 | --- a/hw/arm/virt.c | 80 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMINNM_fp_3s(DisasContext *s, arg_3same *a) |
58 | +++ b/hw/arm/virt.c | ||
59 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_timer_nodes(const VirtMachineState *vms) | ||
60 | irqflags = GIC_FDT_IRQ_FLAGS_EDGE_LO_HI; | ||
61 | } | 81 | } |
62 | 82 | ||
63 | - if (vms->gic_version == 2) { | 83 | if (a->size != 0) { |
64 | + if (vms->gic_version == VIRT_GIC_VERSION_2) { | 84 | - /* TODO fp16 support */ |
65 | irqflags = deposit32(irqflags, GIC_FDT_IRQ_PPI_CPU_START, | 85 | - return false; |
66 | GIC_FDT_IRQ_PPI_CPU_WIDTH, | 86 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
67 | (1 << vms->smp_cpus) - 1); | 87 | + return false; |
68 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_gic_node(VirtMachineState *vms) | 88 | + } |
69 | qemu_fdt_setprop_cell(vms->fdt, nodename, "#address-cells", 0x2); | 89 | + return do_3same(s, a, gen_VMINNM_fp16_3s); |
70 | qemu_fdt_setprop_cell(vms->fdt, nodename, "#size-cells", 0x2); | ||
71 | qemu_fdt_setprop(vms->fdt, nodename, "ranges", NULL, 0); | ||
72 | - if (vms->gic_version == 3) { | ||
73 | + if (vms->gic_version == VIRT_GIC_VERSION_3) { | ||
74 | int nb_redist_regions = virt_gicv3_redist_region_count(vms); | ||
75 | |||
76 | qemu_fdt_setprop_string(vms->fdt, nodename, "compatible", | ||
77 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_pmu_nodes(const VirtMachineState *vms) | ||
78 | } | ||
79 | } | 90 | } |
80 | 91 | - | |
81 | - if (vms->gic_version == 2) { | 92 | - return do_3same_fp(s, a, gen_helper_vfp_minnums, false); |
82 | + if (vms->gic_version == VIRT_GIC_VERSION_2) { | 93 | + return do_3same(s, a, gen_VMINNM_fp32_3s); |
83 | irqflags = deposit32(irqflags, GIC_FDT_IRQ_PPI_CPU_START, | ||
84 | GIC_FDT_IRQ_PPI_CPU_WIDTH, | ||
85 | (1 << vms->smp_cpus) - 1); | ||
86 | @@ -XXX,XX +XXX,XX @@ static uint64_t virt_cpu_mp_affinity(VirtMachineState *vms, int idx) | ||
87 | * purposes are to make TCG consistent (with 64-bit KVM hosts) | ||
88 | * and to improve SGI efficiency. | ||
89 | */ | ||
90 | - if (vms->gic_version == 3) { | ||
91 | + if (vms->gic_version == VIRT_GIC_VERSION_3) { | ||
92 | clustersz = GICV3_TARGETLIST_BITS; | ||
93 | } else { | ||
94 | clustersz = GIC_TARGETLIST_BITS; | ||
95 | @@ -XXX,XX +XXX,XX @@ static void machvirt_init(MachineState *machine) | ||
96 | /* We can probe only here because during property set | ||
97 | * KVM is not available yet | ||
98 | */ | ||
99 | - if (vms->gic_version <= 0) { | ||
100 | - /* "host" or "max" */ | ||
101 | + if (vms->gic_version == VIRT_GIC_VERSION_HOST || | ||
102 | + vms->gic_version == VIRT_GIC_VERSION_MAX) { | ||
103 | if (!kvm_enabled()) { | ||
104 | - if (vms->gic_version == 0) { | ||
105 | + if (vms->gic_version == VIRT_GIC_VERSION_HOST) { | ||
106 | error_report("gic-version=host requires KVM"); | ||
107 | exit(1); | ||
108 | } else { | ||
109 | /* "max": currently means 3 for TCG */ | ||
110 | - vms->gic_version = 3; | ||
111 | + vms->gic_version = VIRT_GIC_VERSION_3; | ||
112 | } | ||
113 | } else { | ||
114 | vms->gic_version = kvm_arm_vgic_probe(); | ||
115 | @@ -XXX,XX +XXX,XX @@ static void machvirt_init(MachineState *machine) | ||
116 | /* The maximum number of CPUs depends on the GIC version, or on how | ||
117 | * many redistributors we can fit into the memory map. | ||
118 | */ | ||
119 | - if (vms->gic_version == 3) { | ||
120 | + if (vms->gic_version == VIRT_GIC_VERSION_3) { | ||
121 | virt_max_cpus = | ||
122 | vms->memmap[VIRT_GIC_REDIST].size / GICV3_REDIST_SIZE; | ||
123 | virt_max_cpus += | ||
124 | @@ -XXX,XX +XXX,XX @@ static void virt_set_its(Object *obj, bool value, Error **errp) | ||
125 | static char *virt_get_gic_version(Object *obj, Error **errp) | ||
126 | { | ||
127 | VirtMachineState *vms = VIRT_MACHINE(obj); | ||
128 | - const char *val = vms->gic_version == 3 ? "3" : "2"; | ||
129 | + const char *val = vms->gic_version == VIRT_GIC_VERSION_3 ? "3" : "2"; | ||
130 | |||
131 | return g_strdup(val); | ||
132 | } | 94 | } |
133 | @@ -XXX,XX +XXX,XX @@ static void virt_set_gic_version(Object *obj, const char *value, Error **errp) | 95 | |
134 | VirtMachineState *vms = VIRT_MACHINE(obj); | 96 | WRAP_ENV_FN(gen_VRECPS_tramp, gen_helper_recps_f32) |
135 | |||
136 | if (!strcmp(value, "3")) { | ||
137 | - vms->gic_version = 3; | ||
138 | + vms->gic_version = VIRT_GIC_VERSION_3; | ||
139 | } else if (!strcmp(value, "2")) { | ||
140 | - vms->gic_version = 2; | ||
141 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
142 | } else if (!strcmp(value, "host")) { | ||
143 | - vms->gic_version = 0; /* Will probe later */ | ||
144 | + vms->gic_version = VIRT_GIC_VERSION_HOST; /* Will probe later */ | ||
145 | } else if (!strcmp(value, "max")) { | ||
146 | - vms->gic_version = -1; /* Will probe later */ | ||
147 | + vms->gic_version = VIRT_GIC_VERSION_MAX; /* Will probe later */ | ||
148 | } else { | ||
149 | error_setg(errp, "Invalid gic-version value"); | ||
150 | error_append_hint(errp, "Valid values are 3, 2, host, max.\n"); | ||
151 | @@ -XXX,XX +XXX,XX @@ static void virt_instance_init(Object *obj) | ||
152 | "physical address space above 32 bits", | ||
153 | NULL); | ||
154 | /* Default GIC type is v2 */ | ||
155 | - vms->gic_version = 2; | ||
156 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
157 | object_property_add_str(obj, "gic-version", virt_get_gic_version, | ||
158 | virt_set_gic_version, NULL); | ||
159 | object_property_set_description(obj, "gic-version", | ||
160 | -- | 97 | -- |
161 | 2.20.1 | 98 | 2.20.1 |
162 | 99 | ||
163 | 100 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Convert the Neon floating-point VMLA and VMLS insns over to using a |
---|---|---|---|
2 | gvec helper, and use this to implement the fp16 case. | ||
2 | 3 | ||
3 | Various Allwinner System on Chip designs contain multiple processors | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | that can be configured and reset using the generic CPU Configuration | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | module interface. This commit adds support for the Allwinner CPU | 6 | Message-id: 20200828183354.27913-31-peter.maydell@linaro.org |
6 | configuration interface which emulates the following features: | 7 | --- |
8 | target/arm/helper.h | 6 +++++ | ||
9 | target/arm/vec_helper.c | 42 +++++++++++++++++++++++++++++++++ | ||
10 | target/arm/translate-neon.c.inc | 33 ++------------------------ | ||
11 | 3 files changed, 50 insertions(+), 31 deletions(-) | ||
7 | 12 | ||
8 | * CPU reset | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
9 | * CPU status | ||
10 | |||
11 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
12 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
13 | Message-id: 20200311221854.30370-7-nieklinnenbank@gmail.com | ||
14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
15 | --- | ||
16 | hw/misc/Makefile.objs | 1 + | ||
17 | include/hw/arm/allwinner-h3.h | 3 + | ||
18 | include/hw/misc/allwinner-cpucfg.h | 52 ++++++ | ||
19 | hw/arm/allwinner-h3.c | 9 +- | ||
20 | hw/misc/allwinner-cpucfg.c | 282 +++++++++++++++++++++++++++++ | ||
21 | hw/misc/trace-events | 5 + | ||
22 | 6 files changed, 351 insertions(+), 1 deletion(-) | ||
23 | create mode 100644 include/hw/misc/allwinner-cpucfg.h | ||
24 | create mode 100644 hw/misc/allwinner-cpucfg.c | ||
25 | |||
26 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | ||
27 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
28 | --- a/hw/misc/Makefile.objs | 15 | --- a/target/arm/helper.h |
29 | +++ b/hw/misc/Makefile.objs | 16 | +++ b/target/arm/helper.h |
30 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_MACIO) += macio/ | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmaxnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i3 |
31 | common-obj-$(CONFIG_IVSHMEM_DEVICE) += ivshmem.o | 18 | DEF_HELPER_FLAGS_5(gvec_fminnum_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
32 | 19 | DEF_HELPER_FLAGS_5(gvec_fminnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | |
33 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-ccu.o | 20 | |
34 | +obj-$(CONFIG_ALLWINNER_H3) += allwinner-cpucfg.o | 21 | +DEF_HELPER_FLAGS_5(gvec_fmla_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
35 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-sysctrl.o | 22 | +DEF_HELPER_FLAGS_5(gvec_fmla_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
36 | common-obj-$(CONFIG_REALVIEW) += arm_sysctl.o | 23 | + |
37 | common-obj-$(CONFIG_NSERIES) += cbus.o | 24 | +DEF_HELPER_FLAGS_5(gvec_fmls_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
38 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 25 | +DEF_HELPER_FLAGS_5(gvec_fmls_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
26 | + | ||
27 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, | ||
28 | void, ptr, ptr, ptr, ptr, i32) | ||
29 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, | ||
30 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
39 | index XXXXXXX..XXXXXXX 100644 | 31 | index XXXXXXX..XXXXXXX 100644 |
40 | --- a/include/hw/arm/allwinner-h3.h | 32 | --- a/target/arm/vec_helper.c |
41 | +++ b/include/hw/arm/allwinner-h3.h | 33 | +++ b/target/arm/vec_helper.c |
42 | @@ -XXX,XX +XXX,XX @@ | 34 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_rsqrts_d, helper_rsqrtsf_f64, float64) |
43 | #include "hw/timer/allwinner-a10-pit.h" | 35 | #endif |
44 | #include "hw/intc/arm_gic.h" | 36 | #undef DO_3OP |
45 | #include "hw/misc/allwinner-h3-ccu.h" | 37 | |
46 | +#include "hw/misc/allwinner-cpucfg.h" | 38 | +/* Non-fused multiply-add (unlike float16_muladd etc, which are fused) */ |
47 | #include "hw/misc/allwinner-h3-sysctrl.h" | 39 | +static float16 float16_muladd_nf(float16 dest, float16 op1, float16 op2, |
48 | #include "target/arm/cpu.h" | 40 | + float_status *stat) |
49 | |||
50 | @@ -XXX,XX +XXX,XX @@ enum { | ||
51 | AW_H3_GIC_CPU, | ||
52 | AW_H3_GIC_HYP, | ||
53 | AW_H3_GIC_VCPU, | ||
54 | + AW_H3_CPUCFG, | ||
55 | AW_H3_SDRAM | ||
56 | }; | ||
57 | |||
58 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
59 | const hwaddr *memmap; | ||
60 | AwA10PITState timer; | ||
61 | AwH3ClockCtlState ccu; | ||
62 | + AwCpuCfgState cpucfg; | ||
63 | AwH3SysCtrlState sysctrl; | ||
64 | GICState gic; | ||
65 | MemoryRegion sram_a1; | ||
66 | diff --git a/include/hw/misc/allwinner-cpucfg.h b/include/hw/misc/allwinner-cpucfg.h | ||
67 | new file mode 100644 | ||
68 | index XXXXXXX..XXXXXXX | ||
69 | --- /dev/null | ||
70 | +++ b/include/hw/misc/allwinner-cpucfg.h | ||
71 | @@ -XXX,XX +XXX,XX @@ | ||
72 | +/* | ||
73 | + * Allwinner CPU Configuration Module emulation | ||
74 | + * | ||
75 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
76 | + * | ||
77 | + * This program is free software: you can redistribute it and/or modify | ||
78 | + * it under the terms of the GNU General Public License as published by | ||
79 | + * the Free Software Foundation, either version 2 of the License, or | ||
80 | + * (at your option) any later version. | ||
81 | + * | ||
82 | + * This program is distributed in the hope that it will be useful, | ||
83 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
84 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
85 | + * GNU General Public License for more details. | ||
86 | + * | ||
87 | + * You should have received a copy of the GNU General Public License | ||
88 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
89 | + */ | ||
90 | + | ||
91 | +#ifndef HW_MISC_ALLWINNER_CPUCFG_H | ||
92 | +#define HW_MISC_ALLWINNER_CPUCFG_H | ||
93 | + | ||
94 | +#include "qom/object.h" | ||
95 | +#include "hw/sysbus.h" | ||
96 | + | ||
97 | +/** | ||
98 | + * Object model | ||
99 | + * @{ | ||
100 | + */ | ||
101 | + | ||
102 | +#define TYPE_AW_CPUCFG "allwinner-cpucfg" | ||
103 | +#define AW_CPUCFG(obj) \ | ||
104 | + OBJECT_CHECK(AwCpuCfgState, (obj), TYPE_AW_CPUCFG) | ||
105 | + | ||
106 | +/** @} */ | ||
107 | + | ||
108 | +/** | ||
109 | + * Allwinner CPU Configuration Module instance state | ||
110 | + */ | ||
111 | +typedef struct AwCpuCfgState { | ||
112 | + /*< private >*/ | ||
113 | + SysBusDevice parent_obj; | ||
114 | + /*< public >*/ | ||
115 | + | ||
116 | + MemoryRegion iomem; | ||
117 | + uint32_t gen_ctrl; | ||
118 | + uint32_t super_standby; | ||
119 | + uint32_t entry_addr; | ||
120 | + | ||
121 | +} AwCpuCfgState; | ||
122 | + | ||
123 | +#endif /* HW_MISC_ALLWINNER_CPUCFG_H */ | ||
124 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
125 | index XXXXXXX..XXXXXXX 100644 | ||
126 | --- a/hw/arm/allwinner-h3.c | ||
127 | +++ b/hw/arm/allwinner-h3.c | ||
128 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
129 | [AW_H3_GIC_CPU] = 0x01c82000, | ||
130 | [AW_H3_GIC_HYP] = 0x01c84000, | ||
131 | [AW_H3_GIC_VCPU] = 0x01c86000, | ||
132 | + [AW_H3_CPUCFG] = 0x01f01c00, | ||
133 | [AW_H3_SDRAM] = 0x40000000 | ||
134 | }; | ||
135 | |||
136 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
137 | { "r_wdog", 0x01f01000, 1 * KiB }, | ||
138 | { "r_prcm", 0x01f01400, 1 * KiB }, | ||
139 | { "r_twd", 0x01f01800, 1 * KiB }, | ||
140 | - { "r_cpucfg", 0x01f01c00, 1 * KiB }, | ||
141 | { "r_cir-rx", 0x01f02000, 1 * KiB }, | ||
142 | { "r_twi", 0x01f02400, 1 * KiB }, | ||
143 | { "r_uart", 0x01f02800, 1 * KiB }, | ||
144 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
145 | |||
146 | sysbus_init_child_obj(obj, "sysctrl", &s->sysctrl, sizeof(s->sysctrl), | ||
147 | TYPE_AW_H3_SYSCTRL); | ||
148 | + | ||
149 | + sysbus_init_child_obj(obj, "cpucfg", &s->cpucfg, sizeof(s->cpucfg), | ||
150 | + TYPE_AW_CPUCFG); | ||
151 | } | ||
152 | |||
153 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
154 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
155 | qdev_init_nofail(DEVICE(&s->sysctrl)); | ||
156 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->sysctrl), 0, s->memmap[AW_H3_SYSCTRL]); | ||
157 | |||
158 | + /* CPU Configuration */ | ||
159 | + qdev_init_nofail(DEVICE(&s->cpucfg)); | ||
160 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->cpucfg), 0, s->memmap[AW_H3_CPUCFG]); | ||
161 | + | ||
162 | /* Universal Serial Bus */ | ||
163 | sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
164 | qdev_get_gpio_in(DEVICE(&s->gic), | ||
165 | diff --git a/hw/misc/allwinner-cpucfg.c b/hw/misc/allwinner-cpucfg.c | ||
166 | new file mode 100644 | ||
167 | index XXXXXXX..XXXXXXX | ||
168 | --- /dev/null | ||
169 | +++ b/hw/misc/allwinner-cpucfg.c | ||
170 | @@ -XXX,XX +XXX,XX @@ | ||
171 | +/* | ||
172 | + * Allwinner CPU Configuration Module emulation | ||
173 | + * | ||
174 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
175 | + * | ||
176 | + * This program is free software: you can redistribute it and/or modify | ||
177 | + * it under the terms of the GNU General Public License as published by | ||
178 | + * the Free Software Foundation, either version 2 of the License, or | ||
179 | + * (at your option) any later version. | ||
180 | + * | ||
181 | + * This program is distributed in the hope that it will be useful, | ||
182 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
183 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
184 | + * GNU General Public License for more details. | ||
185 | + * | ||
186 | + * You should have received a copy of the GNU General Public License | ||
187 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
188 | + */ | ||
189 | + | ||
190 | +#include "qemu/osdep.h" | ||
191 | +#include "qemu/units.h" | ||
192 | +#include "hw/sysbus.h" | ||
193 | +#include "migration/vmstate.h" | ||
194 | +#include "qemu/log.h" | ||
195 | +#include "qemu/module.h" | ||
196 | +#include "qemu/error-report.h" | ||
197 | +#include "qemu/timer.h" | ||
198 | +#include "hw/core/cpu.h" | ||
199 | +#include "target/arm/arm-powerctl.h" | ||
200 | +#include "target/arm/cpu.h" | ||
201 | +#include "hw/misc/allwinner-cpucfg.h" | ||
202 | +#include "trace.h" | ||
203 | + | ||
204 | +/* CPUCFG register offsets */ | ||
205 | +enum { | ||
206 | + REG_CPUS_RST_CTRL = 0x0000, /* CPUs Reset Control */ | ||
207 | + REG_CPU0_RST_CTRL = 0x0040, /* CPU#0 Reset Control */ | ||
208 | + REG_CPU0_CTRL = 0x0044, /* CPU#0 Control */ | ||
209 | + REG_CPU0_STATUS = 0x0048, /* CPU#0 Status */ | ||
210 | + REG_CPU1_RST_CTRL = 0x0080, /* CPU#1 Reset Control */ | ||
211 | + REG_CPU1_CTRL = 0x0084, /* CPU#1 Control */ | ||
212 | + REG_CPU1_STATUS = 0x0088, /* CPU#1 Status */ | ||
213 | + REG_CPU2_RST_CTRL = 0x00C0, /* CPU#2 Reset Control */ | ||
214 | + REG_CPU2_CTRL = 0x00C4, /* CPU#2 Control */ | ||
215 | + REG_CPU2_STATUS = 0x00C8, /* CPU#2 Status */ | ||
216 | + REG_CPU3_RST_CTRL = 0x0100, /* CPU#3 Reset Control */ | ||
217 | + REG_CPU3_CTRL = 0x0104, /* CPU#3 Control */ | ||
218 | + REG_CPU3_STATUS = 0x0108, /* CPU#3 Status */ | ||
219 | + REG_CPU_SYS_RST = 0x0140, /* CPU System Reset */ | ||
220 | + REG_CLK_GATING = 0x0144, /* CPU Clock Gating */ | ||
221 | + REG_GEN_CTRL = 0x0184, /* General Control */ | ||
222 | + REG_SUPER_STANDBY = 0x01A0, /* Super Standby Flag */ | ||
223 | + REG_ENTRY_ADDR = 0x01A4, /* Reset Entry Address */ | ||
224 | + REG_DBG_EXTERN = 0x01E4, /* Debug External */ | ||
225 | + REG_CNT64_CTRL = 0x0280, /* 64-bit Counter Control */ | ||
226 | + REG_CNT64_LOW = 0x0284, /* 64-bit Counter Low */ | ||
227 | + REG_CNT64_HIGH = 0x0288, /* 64-bit Counter High */ | ||
228 | +}; | ||
229 | + | ||
230 | +/* CPUCFG register flags */ | ||
231 | +enum { | ||
232 | + CPUX_RESET_RELEASED = ((1 << 1) | (1 << 0)), | ||
233 | + CPUX_STATUS_SMP = (1 << 0), | ||
234 | + CPU_SYS_RESET_RELEASED = (1 << 0), | ||
235 | + CLK_GATING_ENABLE = ((1 << 8) | 0xF), | ||
236 | +}; | ||
237 | + | ||
238 | +/* CPUCFG register reset values */ | ||
239 | +enum { | ||
240 | + REG_CLK_GATING_RST = 0x0000010F, | ||
241 | + REG_GEN_CTRL_RST = 0x00000020, | ||
242 | + REG_SUPER_STANDBY_RST = 0x0, | ||
243 | + REG_CNT64_CTRL_RST = 0x0, | ||
244 | +}; | ||
245 | + | ||
246 | +/* CPUCFG constants */ | ||
247 | +enum { | ||
248 | + CPU_EXCEPTION_LEVEL_ON_RESET = 3, /* EL3 */ | ||
249 | +}; | ||
250 | + | ||
251 | +static void allwinner_cpucfg_cpu_reset(AwCpuCfgState *s, uint8_t cpu_id) | ||
252 | +{ | 41 | +{ |
253 | + int ret; | 42 | + return float16_add(dest, float16_mul(op1, op2, stat), stat); |
254 | + | ||
255 | + trace_allwinner_cpucfg_cpu_reset(cpu_id, s->entry_addr); | ||
256 | + | ||
257 | + ARMCPU *target_cpu = ARM_CPU(arm_get_cpu_by_id(cpu_id)); | ||
258 | + if (!target_cpu) { | ||
259 | + /* | ||
260 | + * Called with a bogus value for cpu_id. Guest error will | ||
261 | + * already have been logged, we can simply return here. | ||
262 | + */ | ||
263 | + return; | ||
264 | + } | ||
265 | + bool target_aa64 = arm_feature(&target_cpu->env, ARM_FEATURE_AARCH64); | ||
266 | + | ||
267 | + ret = arm_set_cpu_on(cpu_id, s->entry_addr, 0, | ||
268 | + CPU_EXCEPTION_LEVEL_ON_RESET, target_aa64); | ||
269 | + if (ret != QEMU_ARM_POWERCTL_RET_SUCCESS) { | ||
270 | + error_report("%s: failed to bring up CPU %d: err %d", | ||
271 | + __func__, cpu_id, ret); | ||
272 | + return; | ||
273 | + } | ||
274 | +} | 43 | +} |
275 | + | 44 | + |
276 | +static uint64_t allwinner_cpucfg_read(void *opaque, hwaddr offset, | 45 | +static float32 float32_muladd_nf(float32 dest, float32 op1, float32 op2, |
277 | + unsigned size) | 46 | + float_status *stat) |
278 | +{ | 47 | +{ |
279 | + const AwCpuCfgState *s = AW_CPUCFG(opaque); | 48 | + return float32_add(dest, float32_mul(op1, op2, stat), stat); |
280 | + uint64_t val = 0; | ||
281 | + | ||
282 | + switch (offset) { | ||
283 | + case REG_CPUS_RST_CTRL: /* CPUs Reset Control */ | ||
284 | + case REG_CPU_SYS_RST: /* CPU System Reset */ | ||
285 | + val = CPU_SYS_RESET_RELEASED; | ||
286 | + break; | ||
287 | + case REG_CPU0_RST_CTRL: /* CPU#0 Reset Control */ | ||
288 | + case REG_CPU1_RST_CTRL: /* CPU#1 Reset Control */ | ||
289 | + case REG_CPU2_RST_CTRL: /* CPU#2 Reset Control */ | ||
290 | + case REG_CPU3_RST_CTRL: /* CPU#3 Reset Control */ | ||
291 | + val = CPUX_RESET_RELEASED; | ||
292 | + break; | ||
293 | + case REG_CPU0_CTRL: /* CPU#0 Control */ | ||
294 | + case REG_CPU1_CTRL: /* CPU#1 Control */ | ||
295 | + case REG_CPU2_CTRL: /* CPU#2 Control */ | ||
296 | + case REG_CPU3_CTRL: /* CPU#3 Control */ | ||
297 | + val = 0; | ||
298 | + break; | ||
299 | + case REG_CPU0_STATUS: /* CPU#0 Status */ | ||
300 | + case REG_CPU1_STATUS: /* CPU#1 Status */ | ||
301 | + case REG_CPU2_STATUS: /* CPU#2 Status */ | ||
302 | + case REG_CPU3_STATUS: /* CPU#3 Status */ | ||
303 | + val = CPUX_STATUS_SMP; | ||
304 | + break; | ||
305 | + case REG_CLK_GATING: /* CPU Clock Gating */ | ||
306 | + val = CLK_GATING_ENABLE; | ||
307 | + break; | ||
308 | + case REG_GEN_CTRL: /* General Control */ | ||
309 | + val = s->gen_ctrl; | ||
310 | + break; | ||
311 | + case REG_SUPER_STANDBY: /* Super Standby Flag */ | ||
312 | + val = s->super_standby; | ||
313 | + break; | ||
314 | + case REG_ENTRY_ADDR: /* Reset Entry Address */ | ||
315 | + val = s->entry_addr; | ||
316 | + break; | ||
317 | + case REG_DBG_EXTERN: /* Debug External */ | ||
318 | + case REG_CNT64_CTRL: /* 64-bit Counter Control */ | ||
319 | + case REG_CNT64_LOW: /* 64-bit Counter Low */ | ||
320 | + case REG_CNT64_HIGH: /* 64-bit Counter High */ | ||
321 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented register at 0x%04x\n", | ||
322 | + __func__, (uint32_t)offset); | ||
323 | + break; | ||
324 | + default: | ||
325 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
326 | + __func__, (uint32_t)offset); | ||
327 | + break; | ||
328 | + } | ||
329 | + | ||
330 | + trace_allwinner_cpucfg_read(offset, val, size); | ||
331 | + | ||
332 | + return val; | ||
333 | +} | 49 | +} |
334 | + | 50 | + |
335 | +static void allwinner_cpucfg_write(void *opaque, hwaddr offset, | 51 | +static float16 float16_mulsub_nf(float16 dest, float16 op1, float16 op2, |
336 | + uint64_t val, unsigned size) | 52 | + float_status *stat) |
337 | +{ | 53 | +{ |
338 | + AwCpuCfgState *s = AW_CPUCFG(opaque); | 54 | + return float16_sub(dest, float16_mul(op1, op2, stat), stat); |
339 | + | ||
340 | + trace_allwinner_cpucfg_write(offset, val, size); | ||
341 | + | ||
342 | + switch (offset) { | ||
343 | + case REG_CPUS_RST_CTRL: /* CPUs Reset Control */ | ||
344 | + case REG_CPU_SYS_RST: /* CPU System Reset */ | ||
345 | + break; | ||
346 | + case REG_CPU0_RST_CTRL: /* CPU#0 Reset Control */ | ||
347 | + case REG_CPU1_RST_CTRL: /* CPU#1 Reset Control */ | ||
348 | + case REG_CPU2_RST_CTRL: /* CPU#2 Reset Control */ | ||
349 | + case REG_CPU3_RST_CTRL: /* CPU#3 Reset Control */ | ||
350 | + if (val) { | ||
351 | + allwinner_cpucfg_cpu_reset(s, (offset - REG_CPU0_RST_CTRL) >> 6); | ||
352 | + } | ||
353 | + break; | ||
354 | + case REG_CPU0_CTRL: /* CPU#0 Control */ | ||
355 | + case REG_CPU1_CTRL: /* CPU#1 Control */ | ||
356 | + case REG_CPU2_CTRL: /* CPU#2 Control */ | ||
357 | + case REG_CPU3_CTRL: /* CPU#3 Control */ | ||
358 | + case REG_CPU0_STATUS: /* CPU#0 Status */ | ||
359 | + case REG_CPU1_STATUS: /* CPU#1 Status */ | ||
360 | + case REG_CPU2_STATUS: /* CPU#2 Status */ | ||
361 | + case REG_CPU3_STATUS: /* CPU#3 Status */ | ||
362 | + case REG_CLK_GATING: /* CPU Clock Gating */ | ||
363 | + break; | ||
364 | + case REG_GEN_CTRL: /* General Control */ | ||
365 | + s->gen_ctrl = val; | ||
366 | + break; | ||
367 | + case REG_SUPER_STANDBY: /* Super Standby Flag */ | ||
368 | + s->super_standby = val; | ||
369 | + break; | ||
370 | + case REG_ENTRY_ADDR: /* Reset Entry Address */ | ||
371 | + s->entry_addr = val; | ||
372 | + break; | ||
373 | + case REG_DBG_EXTERN: /* Debug External */ | ||
374 | + case REG_CNT64_CTRL: /* 64-bit Counter Control */ | ||
375 | + case REG_CNT64_LOW: /* 64-bit Counter Low */ | ||
376 | + case REG_CNT64_HIGH: /* 64-bit Counter High */ | ||
377 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented register at 0x%04x\n", | ||
378 | + __func__, (uint32_t)offset); | ||
379 | + break; | ||
380 | + default: | ||
381 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
382 | + __func__, (uint32_t)offset); | ||
383 | + break; | ||
384 | + } | ||
385 | +} | 55 | +} |
386 | + | 56 | + |
387 | +static const MemoryRegionOps allwinner_cpucfg_ops = { | 57 | +static float32 float32_mulsub_nf(float32 dest, float32 op1, float32 op2, |
388 | + .read = allwinner_cpucfg_read, | 58 | + float_status *stat) |
389 | + .write = allwinner_cpucfg_write, | ||
390 | + .endianness = DEVICE_NATIVE_ENDIAN, | ||
391 | + .valid = { | ||
392 | + .min_access_size = 4, | ||
393 | + .max_access_size = 4, | ||
394 | + }, | ||
395 | + .impl.min_access_size = 4, | ||
396 | +}; | ||
397 | + | ||
398 | +static void allwinner_cpucfg_reset(DeviceState *dev) | ||
399 | +{ | 59 | +{ |
400 | + AwCpuCfgState *s = AW_CPUCFG(dev); | 60 | + return float32_sub(dest, float32_mul(op1, op2, stat), stat); |
401 | + | ||
402 | + /* Set default values for registers */ | ||
403 | + s->gen_ctrl = REG_GEN_CTRL_RST; | ||
404 | + s->super_standby = REG_SUPER_STANDBY_RST; | ||
405 | + s->entry_addr = 0; | ||
406 | +} | 61 | +} |
407 | + | 62 | + |
408 | +static void allwinner_cpucfg_init(Object *obj) | 63 | +#define DO_MULADD(NAME, FUNC, TYPE) \ |
409 | +{ | 64 | +void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ |
410 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | 65 | +{ \ |
411 | + AwCpuCfgState *s = AW_CPUCFG(obj); | 66 | + intptr_t i, oprsz = simd_oprsz(desc); \ |
412 | + | 67 | + TYPE *d = vd, *n = vn, *m = vm; \ |
413 | + /* Memory mapping */ | 68 | + for (i = 0; i < oprsz / sizeof(TYPE); i++) { \ |
414 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_cpucfg_ops, s, | 69 | + d[i] = FUNC(d[i], n[i], m[i], stat); \ |
415 | + TYPE_AW_CPUCFG, 1 * KiB); | 70 | + } \ |
416 | + sysbus_init_mmio(sbd, &s->iomem); | 71 | + clear_tail(d, oprsz, simd_maxsz(desc)); \ |
417 | +} | 72 | +} |
418 | + | 73 | + |
419 | +static const VMStateDescription allwinner_cpucfg_vmstate = { | 74 | +DO_MULADD(gvec_fmla_h, float16_muladd_nf, float16) |
420 | + .name = "allwinner-cpucfg", | 75 | +DO_MULADD(gvec_fmla_s, float32_muladd_nf, float32) |
421 | + .version_id = 1, | ||
422 | + .minimum_version_id = 1, | ||
423 | + .fields = (VMStateField[]) { | ||
424 | + VMSTATE_UINT32(gen_ctrl, AwCpuCfgState), | ||
425 | + VMSTATE_UINT32(super_standby, AwCpuCfgState), | ||
426 | + VMSTATE_UINT32(entry_addr, AwCpuCfgState), | ||
427 | + VMSTATE_END_OF_LIST() | ||
428 | + } | ||
429 | +}; | ||
430 | + | 76 | + |
431 | +static void allwinner_cpucfg_class_init(ObjectClass *klass, void *data) | 77 | +DO_MULADD(gvec_fmls_h, float16_mulsub_nf, float16) |
432 | +{ | 78 | +DO_MULADD(gvec_fmls_s, float32_mulsub_nf, float32) |
433 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
434 | + | 79 | + |
435 | + dc->reset = allwinner_cpucfg_reset; | 80 | /* For the indexed ops, SVE applies the index per 128-bit vector segment. |
436 | + dc->vmsd = &allwinner_cpucfg_vmstate; | 81 | * For AdvSIMD, there is of course only one such vector segment. |
437 | +} | 82 | */ |
438 | + | 83 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
439 | +static const TypeInfo allwinner_cpucfg_info = { | ||
440 | + .name = TYPE_AW_CPUCFG, | ||
441 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
442 | + .instance_init = allwinner_cpucfg_init, | ||
443 | + .instance_size = sizeof(AwCpuCfgState), | ||
444 | + .class_init = allwinner_cpucfg_class_init, | ||
445 | +}; | ||
446 | + | ||
447 | +static void allwinner_cpucfg_register(void) | ||
448 | +{ | ||
449 | + type_register_static(&allwinner_cpucfg_info); | ||
450 | +} | ||
451 | + | ||
452 | +type_init(allwinner_cpucfg_register) | ||
453 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events | ||
454 | index XXXXXXX..XXXXXXX 100644 | 84 | index XXXXXXX..XXXXXXX 100644 |
455 | --- a/hw/misc/trace-events | 85 | --- a/target/arm/translate-neon.c.inc |
456 | +++ b/hw/misc/trace-events | 86 | +++ b/target/arm/translate-neon.c.inc |
457 | @@ -XXX,XX +XXX,XX @@ | 87 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VACGE, gen_helper_gvec_facge_s, gen_helper_gvec_facge_h) |
458 | # See docs/devel/tracing.txt for syntax documentation. | 88 | DO_3S_FP_GVEC(VACGT, gen_helper_gvec_facgt_s, gen_helper_gvec_facgt_h) |
459 | 89 | DO_3S_FP_GVEC(VMAX, gen_helper_gvec_fmax_s, gen_helper_gvec_fmax_h) | |
460 | +# allwinner-cpucfg.c | 90 | DO_3S_FP_GVEC(VMIN, gen_helper_gvec_fmin_s, gen_helper_gvec_fmin_h) |
461 | +allwinner_cpucfg_cpu_reset(uint8_t cpu_id, uint32_t reset_addr) "id %u, reset_addr 0x%" PRIu32 | 91 | - |
462 | +allwinner_cpucfg_read(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | 92 | -/* |
463 | +allwinner_cpucfg_write(uint64_t offset, uint64_t data, unsigned size) "offset 0x%" PRIx64 " data 0x%" PRIx64 " size %" PRIu32 | 93 | - * For all the functions using this macro, size == 1 means fp16, |
464 | + | 94 | - * which is an architecture extension we don't implement yet. |
465 | # eccmemctl.c | 95 | - */ |
466 | ecc_mem_writel_mer(uint32_t val) "Write memory enable 0x%08x" | 96 | -#define DO_3S_FP(INSN,FUNC,READS_VD) \ |
467 | ecc_mem_writel_mdr(uint32_t val) "Write memory delay 0x%08x" | 97 | - static bool trans_##INSN##_fp_3s(DisasContext *s, arg_3same *a) \ |
98 | - { \ | ||
99 | - if (a->size != 0) { \ | ||
100 | - /* TODO fp16 support */ \ | ||
101 | - return false; \ | ||
102 | - } \ | ||
103 | - return do_3same_fp(s, a, FUNC, READS_VD); \ | ||
104 | - } | ||
105 | - | ||
106 | -static void gen_VMLA_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
107 | - TCGv_ptr fpstatus) | ||
108 | -{ | ||
109 | - gen_helper_vfp_muls(vn, vn, vm, fpstatus); | ||
110 | - gen_helper_vfp_adds(vd, vd, vn, fpstatus); | ||
111 | -} | ||
112 | - | ||
113 | -static void gen_VMLS_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
114 | - TCGv_ptr fpstatus) | ||
115 | -{ | ||
116 | - gen_helper_vfp_muls(vn, vn, vm, fpstatus); | ||
117 | - gen_helper_vfp_subs(vd, vd, vn, fpstatus); | ||
118 | -} | ||
119 | - | ||
120 | -DO_3S_FP(VMLA, gen_VMLA_fp_3s, true) | ||
121 | -DO_3S_FP(VMLS, gen_VMLS_fp_3s, true) | ||
122 | +DO_3S_FP_GVEC(VMLA, gen_helper_gvec_fmla_s, gen_helper_gvec_fmla_h) | ||
123 | +DO_3S_FP_GVEC(VMLS, gen_helper_gvec_fmls_s, gen_helper_gvec_fmls_h) | ||
124 | |||
125 | WRAP_FP_GVEC(gen_VMAXNM_fp32_3s, FPST_STD, gen_helper_gvec_fmaxnum_s) | ||
126 | WRAP_FP_GVEC(gen_VMAXNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fmaxnum_h) | ||
468 | -- | 127 | -- |
469 | 2.20.1 | 128 | 2.20.1 |
470 | 129 | ||
471 | 130 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Convert the neon floating-point vector operations VFMA and VFMS |
---|---|---|---|
2 | 2 | to use a gvec helper, and use this to implement the fp16 case. | |
3 | The Xunlong Orange Pi PC machine is a functional ARM machine | 3 | |
4 | based on the Allwinner H3 System-on-Chip. It supports mainline | 4 | This is the last use of do_3same_fp() so we can now delete |
5 | Linux, U-Boot, NetBSD and is covered by acceptance tests. | 5 | that function. |
6 | 6 | ||
7 | This commit adds a documentation text file with a description | ||
8 | of the machine and instructions for the user. | ||
9 | |||
10 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
11 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
12 | Message-id: 20200311221854.30370-19-nieklinnenbank@gmail.com | ||
13 | [PMM: moved file into docs/system/arm to match the reorg | ||
14 | of the arm target part of the docs; tweaked heading to | ||
15 | match other boards] | ||
16 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20200828183354.27913-32-peter.maydell@linaro.org | ||
17 | --- | 10 | --- |
18 | MAINTAINERS | 1 + | 11 | target/arm/helper.h | 6 +++ |
19 | docs/system/arm/orangepi.rst | 253 +++++++++++++++++++++++++++++++++++ | 12 | target/arm/vec_helper.c | 33 +++++++++++- |
20 | docs/system/target-arm.rst | 2 + | 13 | target/arm/translate-neon.c.inc | 92 +-------------------------------- |
21 | 3 files changed, 256 insertions(+) | 14 | 3 files changed, 40 insertions(+), 91 deletions(-) |
22 | create mode 100644 docs/system/arm/orangepi.rst | 15 | |
23 | 16 | diff --git a/target/arm/helper.h b/target/arm/helper.h | |
24 | diff --git a/MAINTAINERS b/MAINTAINERS | ||
25 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/MAINTAINERS | 18 | --- a/target/arm/helper.h |
27 | +++ b/MAINTAINERS | 19 | +++ b/target/arm/helper.h |
28 | @@ -XXX,XX +XXX,XX @@ S: Maintained | 20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmla_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
29 | F: hw/*/allwinner-h3* | 21 | DEF_HELPER_FLAGS_5(gvec_fmls_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
30 | F: include/hw/*/allwinner-h3* | 22 | DEF_HELPER_FLAGS_5(gvec_fmls_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
31 | F: hw/arm/orangepi.c | 23 | |
32 | +F: docs/system/orangepi.rst | 24 | +DEF_HELPER_FLAGS_5(gvec_vfma_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
33 | 25 | +DEF_HELPER_FLAGS_5(gvec_vfma_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | |
34 | ARM PrimeCell and CMSDK devices | 26 | + |
35 | M: Peter Maydell <peter.maydell@linaro.org> | 27 | +DEF_HELPER_FLAGS_5(gvec_vfms_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
36 | diff --git a/docs/system/arm/orangepi.rst b/docs/system/arm/orangepi.rst | 28 | +DEF_HELPER_FLAGS_5(gvec_vfms_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
37 | new file mode 100644 | 29 | + |
38 | index XXXXXXX..XXXXXXX | 30 | DEF_HELPER_FLAGS_5(gvec_ftsmul_h, TCG_CALL_NO_RWG, |
39 | --- /dev/null | 31 | void, ptr, ptr, ptr, ptr, i32) |
40 | +++ b/docs/system/arm/orangepi.rst | 32 | DEF_HELPER_FLAGS_5(gvec_ftsmul_s, TCG_CALL_NO_RWG, |
41 | @@ -XXX,XX +XXX,XX @@ | 33 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
42 | +Orange Pi PC (``orangepi-pc``) | ||
43 | +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ | ||
44 | + | ||
45 | +The Xunlong Orange Pi PC is an Allwinner H3 System on Chip | ||
46 | +based embedded computer with mainline support in both U-Boot | ||
47 | +and Linux. The board comes with a Quad Core Cortex-A7 @ 1.3GHz, | ||
48 | +1GiB RAM, 100Mbit ethernet, USB, SD/MMC, USB, HDMI and | ||
49 | +various other I/O. | ||
50 | + | ||
51 | +Supported devices | ||
52 | +""""""""""""""""" | ||
53 | + | ||
54 | +The Orange Pi PC machine supports the following devices: | ||
55 | + | ||
56 | + * SMP (Quad Core Cortex-A7) | ||
57 | + * Generic Interrupt Controller configuration | ||
58 | + * SRAM mappings | ||
59 | + * SDRAM controller | ||
60 | + * Real Time Clock | ||
61 | + * Timer device (re-used from Allwinner A10) | ||
62 | + * UART | ||
63 | + * SD/MMC storage controller | ||
64 | + * EMAC ethernet | ||
65 | + * USB 2.0 interfaces | ||
66 | + * Clock Control Unit | ||
67 | + * System Control module | ||
68 | + * Security Identifier device | ||
69 | + | ||
70 | +Limitations | ||
71 | +""""""""""" | ||
72 | + | ||
73 | +Currently, Orange Pi PC does *not* support the following features: | ||
74 | + | ||
75 | +- Graphical output via HDMI, GPU and/or the Display Engine | ||
76 | +- Audio output | ||
77 | +- Hardware Watchdog | ||
78 | + | ||
79 | +Also see the 'unimplemented' array in the Allwinner H3 SoC module | ||
80 | +for a complete list of unimplemented I/O devices: ``./hw/arm/allwinner-h3.c`` | ||
81 | + | ||
82 | +Boot options | ||
83 | +"""""""""""" | ||
84 | + | ||
85 | +The Orange Pi PC machine can start using the standard -kernel functionality | ||
86 | +for loading a Linux kernel or ELF executable. Additionally, the Orange Pi PC | ||
87 | +machine can also emulate the BootROM which is present on an actual Allwinner H3 | ||
88 | +based SoC, which loads the bootloader from a SD card, specified via the -sd argument | ||
89 | +to qemu-system-arm. | ||
90 | + | ||
91 | +Machine-specific options | ||
92 | +"""""""""""""""""""""""" | ||
93 | + | ||
94 | +The following machine-specific options are supported: | ||
95 | + | ||
96 | +- allwinner-rtc.base-year=YYYY | ||
97 | + | ||
98 | + The Allwinner RTC device is automatically created by the Orange Pi PC machine | ||
99 | + and uses a default base year value which can be overridden using the 'base-year' property. | ||
100 | + The base year is the actual represented year when the RTC year value is zero. | ||
101 | + This option can be used in case the target operating system driver uses a different | ||
102 | + base year value. The minimum value for the base year is 1900. | ||
103 | + | ||
104 | +- allwinner-sid.identifier=abcd1122-a000-b000-c000-12345678ffff | ||
105 | + | ||
106 | + The Security Identifier value can be read by the guest. | ||
107 | + For example, U-Boot uses it to determine a unique MAC address. | ||
108 | + | ||
109 | +The above machine-specific options can be specified in qemu-system-arm | ||
110 | +via the '-global' argument, for example: | ||
111 | + | ||
112 | +.. code-block:: bash | ||
113 | + | ||
114 | + $ qemu-system-arm -M orangepi-pc -sd mycard.img \ | ||
115 | + -global allwinner-rtc.base-year=2000 | ||
116 | + | ||
117 | +Running mainline Linux | ||
118 | +"""""""""""""""""""""" | ||
119 | + | ||
120 | +Mainline Linux kernels from 4.19 up to latest master are known to work. | ||
121 | +To build a Linux mainline kernel that can be booted by the Orange Pi PC machine, | ||
122 | +simply configure the kernel using the sunxi_defconfig configuration: | ||
123 | + | ||
124 | +.. code-block:: bash | ||
125 | + | ||
126 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make mrproper | ||
127 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make sunxi_defconfig | ||
128 | + | ||
129 | +To be able to use USB storage, you need to manually enable the corresponding | ||
130 | +configuration item. Start the kconfig configuration tool: | ||
131 | + | ||
132 | +.. code-block:: bash | ||
133 | + | ||
134 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make menuconfig | ||
135 | + | ||
136 | +Navigate to the following item, enable it and save your configuration: | ||
137 | + | ||
138 | + Device Drivers > USB support > USB Mass Storage support | ||
139 | + | ||
140 | +Build the Linux kernel with: | ||
141 | + | ||
142 | +.. code-block:: bash | ||
143 | + | ||
144 | + $ ARCH=arm CROSS_COMPILE=arm-linux-gnueabi- make | ||
145 | + | ||
146 | +To boot the newly build linux kernel in QEMU with the Orange Pi PC machine, use: | ||
147 | + | ||
148 | +.. code-block:: bash | ||
149 | + | ||
150 | + $ qemu-system-arm -M orangepi-pc -nic user -nographic \ | ||
151 | + -kernel /path/to/linux/arch/arm/boot/zImage \ | ||
152 | + -append 'console=ttyS0,115200' \ | ||
153 | + -dtb /path/to/linux/arch/arm/boot/dts/sun8i-h3-orangepi-pc.dtb | ||
154 | + | ||
155 | +Orange Pi PC images | ||
156 | +""""""""""""""""""" | ||
157 | + | ||
158 | +Note that the mainline kernel does not have a root filesystem. You may provide it | ||
159 | +with an official Orange Pi PC image from the official website: | ||
160 | + | ||
161 | + http://www.orangepi.org/downloadresources/ | ||
162 | + | ||
163 | +Another possibility is to run an Armbian image for Orange Pi PC which | ||
164 | +can be downloaded from: | ||
165 | + | ||
166 | + https://www.armbian.com/orange-pi-pc/ | ||
167 | + | ||
168 | +Alternatively, you can also choose to build you own image with buildroot | ||
169 | +using the orangepi_pc_defconfig. Also see https://buildroot.org for more information. | ||
170 | + | ||
171 | +You can choose to attach the selected image either as an SD card or as USB mass storage. | ||
172 | +For example, to boot using the Orange Pi PC Debian image on SD card, simply add the -sd | ||
173 | +argument and provide the proper root= kernel parameter: | ||
174 | + | ||
175 | +.. code-block:: bash | ||
176 | + | ||
177 | + $ qemu-system-arm -M orangepi-pc -nic user -nographic \ | ||
178 | + -kernel /path/to/linux/arch/arm/boot/zImage \ | ||
179 | + -append 'console=ttyS0,115200 root=/dev/mmcblk0p2' \ | ||
180 | + -dtb /path/to/linux/arch/arm/boot/dts/sun8i-h3-orangepi-pc.dtb \ | ||
181 | + -sd OrangePi_pc_debian_stretch_server_linux5.3.5_v1.0.img | ||
182 | + | ||
183 | +To attach the image as an USB mass storage device to the machine, | ||
184 | +simply append to the command: | ||
185 | + | ||
186 | +.. code-block:: bash | ||
187 | + | ||
188 | + -drive if=none,id=stick,file=myimage.img \ | ||
189 | + -device usb-storage,bus=usb-bus.0,drive=stick | ||
190 | + | ||
191 | +Instead of providing a custom Linux kernel via the -kernel command you may also | ||
192 | +choose to let the Orange Pi PC machine load the bootloader from SD card, just like | ||
193 | +a real board would do using the BootROM. Simply pass the selected image via the -sd | ||
194 | +argument and remove the -kernel, -append, -dbt and -initrd arguments: | ||
195 | + | ||
196 | +.. code-block:: bash | ||
197 | + | ||
198 | + $ qemu-system-arm -M orangepi-pc -nic user -nographic \ | ||
199 | + -sd Armbian_19.11.3_Orangepipc_buster_current_5.3.9.img | ||
200 | + | ||
201 | +Note that both the official Orange Pi PC images and Armbian images start | ||
202 | +a lot of userland programs via systemd. Depending on the host hardware and OS, | ||
203 | +they may be slow to emulate, especially due to emulating the 4 cores. | ||
204 | +To help reduce the performance slow down due to emulating the 4 cores, you can | ||
205 | +give the following kernel parameters via U-Boot (or via -append): | ||
206 | + | ||
207 | +.. code-block:: bash | ||
208 | + | ||
209 | + => setenv extraargs 'systemd.default_timeout_start_sec=9000 loglevel=7 nosmp console=ttyS0,115200' | ||
210 | + | ||
211 | +Running U-Boot | ||
212 | +"""""""""""""" | ||
213 | + | ||
214 | +U-Boot mainline can be build and configured using the orangepi_pc_defconfig | ||
215 | +using similar commands as describe above for Linux. Note that it is recommended | ||
216 | +for development/testing to select the following configuration setting in U-Boot: | ||
217 | + | ||
218 | + Device Tree Control > Provider for DTB for DT Control > Embedded DTB | ||
219 | + | ||
220 | +To start U-Boot using the Orange Pi PC machine, provide the | ||
221 | +u-boot binary to the -kernel argument: | ||
222 | + | ||
223 | +.. code-block:: bash | ||
224 | + | ||
225 | + $ qemu-system-arm -M orangepi-pc -nic user -nographic \ | ||
226 | + -kernel /path/to/uboot/u-boot -sd disk.img | ||
227 | + | ||
228 | +Use the following U-boot commands to load and boot a Linux kernel from SD card: | ||
229 | + | ||
230 | +.. code-block:: bash | ||
231 | + | ||
232 | + => setenv bootargs console=ttyS0,115200 | ||
233 | + => ext2load mmc 0 0x42000000 zImage | ||
234 | + => ext2load mmc 0 0x43000000 sun8i-h3-orangepi-pc.dtb | ||
235 | + => bootz 0x42000000 - 0x43000000 | ||
236 | + | ||
237 | +Running NetBSD | ||
238 | +"""""""""""""" | ||
239 | + | ||
240 | +The NetBSD operating system also includes support for Allwinner H3 based boards, | ||
241 | +including the Orange Pi PC. NetBSD 9.0 is known to work best for the Orange Pi PC | ||
242 | +board and provides a fully working system with serial console, networking and storage. | ||
243 | +For the Orange Pi PC machine, get the 'evbarm-earmv7hf' based image from: | ||
244 | + | ||
245 | + https://cdn.netbsd.org/pub/NetBSD/NetBSD-9.0/evbarm-earmv7hf/binary/gzimg/armv7.img.gz | ||
246 | + | ||
247 | +The image requires manually installing U-Boot in the image. Build U-Boot with | ||
248 | +the orangepi_pc_defconfig configuration as described in the previous section. | ||
249 | +Next, unzip the NetBSD image and write the U-Boot binary including SPL using: | ||
250 | + | ||
251 | +.. code-block:: bash | ||
252 | + | ||
253 | + $ gunzip armv7.img.gz | ||
254 | + $ dd if=/path/to/u-boot-sunxi-with-spl.bin of=armv7.img bs=1024 seek=8 conv=notrunc | ||
255 | + | ||
256 | +Finally, before starting the machine the SD image must be extended such | ||
257 | +that the NetBSD kernel will not conclude the NetBSD partition is larger than | ||
258 | +the emulated SD card: | ||
259 | + | ||
260 | +.. code-block:: bash | ||
261 | + | ||
262 | + $ dd if=/dev/zero bs=1M count=64 >> armv7.img | ||
263 | + | ||
264 | +Start the machine using the following command: | ||
265 | + | ||
266 | +.. code-block:: bash | ||
267 | + | ||
268 | + $ qemu-system-arm -M orangepi-pc -nic user -nographic \ | ||
269 | + -sd armv7.img -global allwinner-rtc.base-year=2000 | ||
270 | + | ||
271 | +At the U-Boot stage, interrupt the automatic boot process by pressing a key | ||
272 | +and set the following environment variables before booting: | ||
273 | + | ||
274 | +.. code-block:: bash | ||
275 | + | ||
276 | + => setenv bootargs root=ld0a | ||
277 | + => setenv kernel netbsd-GENERIC.ub | ||
278 | + => setenv fdtfile dtb/sun8i-h3-orangepi-pc.dtb | ||
279 | + => setenv bootcmd 'fatload mmc 0:1 ${kernel_addr_r} ${kernel}; fatload mmc 0:1 ${fdt_addr_r} ${fdtfile}; fdt addr ${fdt_addr_r}; bootm ${kernel_addr_r} - ${fdt_addr_r}' | ||
280 | + | ||
281 | +Optionally you may save the environment variables to SD card with 'saveenv'. | ||
282 | +To continue booting simply give the 'boot' command and NetBSD boots. | ||
283 | + | ||
284 | +Orange Pi PC acceptance tests | ||
285 | +""""""""""""""""""""""""""""" | ||
286 | + | ||
287 | +The Orange Pi PC machine has several acceptance tests included. | ||
288 | +To run the whole set of tests, build QEMU from source and simply | ||
289 | +provide the following command: | ||
290 | + | ||
291 | +.. code-block:: bash | ||
292 | + | ||
293 | + $ AVOCADO_ALLOW_LARGE_STORAGE=yes avocado --show=app,console run \ | ||
294 | + -t machine:orangepi-pc tests/acceptance/boot_linux_console.py | ||
295 | diff --git a/docs/system/target-arm.rst b/docs/system/target-arm.rst | ||
296 | index XXXXXXX..XXXXXXX 100644 | 34 | index XXXXXXX..XXXXXXX 100644 |
297 | --- a/docs/system/target-arm.rst | 35 | --- a/target/arm/vec_helper.c |
298 | +++ b/docs/system/target-arm.rst | 36 | +++ b/target/arm/vec_helper.c |
299 | @@ -XXX,XX +XXX,XX @@ undocumented; you can get a complete list by running | 37 | @@ -XXX,XX +XXX,XX @@ static float32 float32_mulsub_nf(float32 dest, float32 op1, float32 op2, |
300 | ``qemu-system-aarch64 --machine help``. | 38 | return float32_sub(dest, float32_mul(op1, op2, stat), stat); |
301 | 39 | } | |
302 | .. toctree:: | 40 | |
303 | + :maxdepth: 1 | 41 | -#define DO_MULADD(NAME, FUNC, TYPE) \ |
304 | 42 | +/* Fused versions; these have the semantics Neon VFMA/VFMS want */ | |
305 | arm/integratorcp | 43 | +static float16 float16_muladd_f(float16 dest, float16 op1, float16 op2, |
306 | arm/versatile | 44 | + float_status *stat) |
307 | @@ -XXX,XX +XXX,XX @@ undocumented; you can get a complete list by running | 45 | +{ |
308 | arm/stellaris | 46 | + return float16_muladd(op1, op2, dest, 0, stat); |
309 | arm/musicpal | 47 | +} |
310 | arm/sx1 | 48 | + |
311 | + arm/orangepi | 49 | +static float32 float32_muladd_f(float32 dest, float32 op1, float32 op2, |
312 | 50 | + float_status *stat) | |
313 | Arm CPU features | 51 | +{ |
314 | ================ | 52 | + return float32_muladd(op1, op2, dest, 0, stat); |
53 | +} | ||
54 | + | ||
55 | +static float16 float16_mulsub_f(float16 dest, float16 op1, float16 op2, | ||
56 | + float_status *stat) | ||
57 | +{ | ||
58 | + return float16_muladd(float16_chs(op1), op2, dest, 0, stat); | ||
59 | +} | ||
60 | + | ||
61 | +static float32 float32_mulsub_f(float32 dest, float32 op1, float32 op2, | ||
62 | + float_status *stat) | ||
63 | +{ | ||
64 | + return float32_muladd(float32_chs(op1), op2, dest, 0, stat); | ||
65 | +} | ||
66 | + | ||
67 | +#define DO_MULADD(NAME, FUNC, TYPE) \ | ||
68 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ | ||
69 | { \ | ||
70 | intptr_t i, oprsz = simd_oprsz(desc); \ | ||
71 | @@ -XXX,XX +XXX,XX @@ DO_MULADD(gvec_fmla_s, float32_muladd_nf, float32) | ||
72 | DO_MULADD(gvec_fmls_h, float16_mulsub_nf, float16) | ||
73 | DO_MULADD(gvec_fmls_s, float32_mulsub_nf, float32) | ||
74 | |||
75 | +DO_MULADD(gvec_vfma_h, float16_muladd_f, float16) | ||
76 | +DO_MULADD(gvec_vfma_s, float32_muladd_f, float32) | ||
77 | + | ||
78 | +DO_MULADD(gvec_vfms_h, float16_mulsub_f, float16) | ||
79 | +DO_MULADD(gvec_vfms_s, float32_mulsub_f, float32) | ||
80 | + | ||
81 | /* For the indexed ops, SVE applies the index per 128-bit vector segment. | ||
82 | * For AdvSIMD, there is of course only one such vector segment. | ||
83 | */ | ||
84 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
85 | index XXXXXXX..XXXXXXX 100644 | ||
86 | --- a/target/arm/translate-neon.c.inc | ||
87 | +++ b/target/arm/translate-neon.c.inc | ||
88 | @@ -XXX,XX +XXX,XX @@ DO_3SAME_PAIR(VPADD, padd_u) | ||
89 | DO_3SAME_VQDMULH(VQDMULH, qdmulh) | ||
90 | DO_3SAME_VQDMULH(VQRDMULH, qrdmulh) | ||
91 | |||
92 | -static bool do_3same_fp(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn, | ||
93 | - bool reads_vd) | ||
94 | -{ | ||
95 | - /* | ||
96 | - * FP operations handled elementwise 32 bits at a time. | ||
97 | - * If reads_vd is true then the old value of Vd will be | ||
98 | - * loaded before calling the callback function. This is | ||
99 | - * used for multiply-accumulate type operations. | ||
100 | - */ | ||
101 | - TCGv_i32 tmp, tmp2; | ||
102 | - int pass; | ||
103 | - | ||
104 | - if (!arm_dc_feature(s, ARM_FEATURE_NEON)) { | ||
105 | - return false; | ||
106 | - } | ||
107 | - | ||
108 | - /* UNDEF accesses to D16-D31 if they don't exist. */ | ||
109 | - if (!dc_isar_feature(aa32_simd_r32, s) && | ||
110 | - ((a->vd | a->vn | a->vm) & 0x10)) { | ||
111 | - return false; | ||
112 | - } | ||
113 | - | ||
114 | - if ((a->vn | a->vm | a->vd) & a->q) { | ||
115 | - return false; | ||
116 | - } | ||
117 | - | ||
118 | - if (!vfp_access_check(s)) { | ||
119 | - return true; | ||
120 | - } | ||
121 | - | ||
122 | - TCGv_ptr fpstatus = fpstatus_ptr(FPST_STD); | ||
123 | - for (pass = 0; pass < (a->q ? 4 : 2); pass++) { | ||
124 | - tmp = neon_load_reg(a->vn, pass); | ||
125 | - tmp2 = neon_load_reg(a->vm, pass); | ||
126 | - if (reads_vd) { | ||
127 | - TCGv_i32 tmp_rd = neon_load_reg(a->vd, pass); | ||
128 | - fn(tmp_rd, tmp, tmp2, fpstatus); | ||
129 | - neon_store_reg(a->vd, pass, tmp_rd); | ||
130 | - tcg_temp_free_i32(tmp); | ||
131 | - } else { | ||
132 | - fn(tmp, tmp, tmp2, fpstatus); | ||
133 | - neon_store_reg(a->vd, pass, tmp); | ||
134 | - } | ||
135 | - tcg_temp_free_i32(tmp2); | ||
136 | - } | ||
137 | - tcg_temp_free_ptr(fpstatus); | ||
138 | - return true; | ||
139 | -} | ||
140 | - | ||
141 | #define WRAP_FP_GVEC(WRAPNAME, FPST, FUNC) \ | ||
142 | static void WRAPNAME(unsigned vece, uint32_t rd_ofs, \ | ||
143 | uint32_t rn_ofs, uint32_t rm_ofs, \ | ||
144 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VMAX, gen_helper_gvec_fmax_s, gen_helper_gvec_fmax_h) | ||
145 | DO_3S_FP_GVEC(VMIN, gen_helper_gvec_fmin_s, gen_helper_gvec_fmin_h) | ||
146 | DO_3S_FP_GVEC(VMLA, gen_helper_gvec_fmla_s, gen_helper_gvec_fmla_h) | ||
147 | DO_3S_FP_GVEC(VMLS, gen_helper_gvec_fmls_s, gen_helper_gvec_fmls_h) | ||
148 | +DO_3S_FP_GVEC(VFMA, gen_helper_gvec_vfma_s, gen_helper_gvec_vfma_h) | ||
149 | +DO_3S_FP_GVEC(VFMS, gen_helper_gvec_vfms_s, gen_helper_gvec_vfms_h) | ||
150 | |||
151 | WRAP_FP_GVEC(gen_VMAXNM_fp32_3s, FPST_STD, gen_helper_gvec_fmaxnum_s) | ||
152 | WRAP_FP_GVEC(gen_VMAXNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fmaxnum_h) | ||
153 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRSQRTS_fp_3s(DisasContext *s, arg_3same *a) | ||
154 | return do_3same(s, a, gen_VRSQRTS_fp_3s); | ||
155 | } | ||
156 | |||
157 | -static void gen_VFMA_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
158 | - TCGv_ptr fpstatus) | ||
159 | -{ | ||
160 | - gen_helper_vfp_muladds(vd, vn, vm, vd, fpstatus); | ||
161 | -} | ||
162 | - | ||
163 | -static bool trans_VFMA_fp_3s(DisasContext *s, arg_3same *a) | ||
164 | -{ | ||
165 | - if (!dc_isar_feature(aa32_simdfmac, s)) { | ||
166 | - return false; | ||
167 | - } | ||
168 | - | ||
169 | - if (a->size != 0) { | ||
170 | - /* TODO fp16 support */ | ||
171 | - return false; | ||
172 | - } | ||
173 | - | ||
174 | - return do_3same_fp(s, a, gen_VFMA_fp_3s, true); | ||
175 | -} | ||
176 | - | ||
177 | -static void gen_VFMS_fp_3s(TCGv_i32 vd, TCGv_i32 vn, TCGv_i32 vm, | ||
178 | - TCGv_ptr fpstatus) | ||
179 | -{ | ||
180 | - gen_helper_vfp_negs(vn, vn); | ||
181 | - gen_helper_vfp_muladds(vd, vn, vm, vd, fpstatus); | ||
182 | -} | ||
183 | - | ||
184 | -static bool trans_VFMS_fp_3s(DisasContext *s, arg_3same *a) | ||
185 | -{ | ||
186 | - if (!dc_isar_feature(aa32_simdfmac, s)) { | ||
187 | - return false; | ||
188 | - } | ||
189 | - | ||
190 | - if (a->size != 0) { | ||
191 | - /* TODO fp16 support */ | ||
192 | - return false; | ||
193 | - } | ||
194 | - | ||
195 | - return do_3same_fp(s, a, gen_VFMS_fp_3s, true); | ||
196 | -} | ||
197 | - | ||
198 | static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn) | ||
199 | { | ||
200 | /* FP operations handled pairwise 32 bits at a time */ | ||
315 | -- | 201 | -- |
316 | 2.20.1 | 202 | 2.20.1 |
317 | 203 | ||
318 | 204 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | Convert the neon floating-point vector compare-vs-0 insns VCEQ0, |
---|---|---|---|
2 | VCGT0, VCLE0, VCGE0 and VCLT0 to use a gvec helper, and use this to | ||
3 | implement the fp16 case. | ||
2 | 4 | ||
3 | Restructure the finalize_gic_version with switch cases and | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | clearly separate the following cases: | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
7 | Message-id: 20200828183354.27913-33-peter.maydell@linaro.org | ||
8 | --- | ||
9 | target/arm/helper.h | 15 +++++++++++++++ | ||
10 | target/arm/vec_helper.c | 25 +++++++++++++++++++++++++ | ||
11 | target/arm/translate-neon.c.inc | 33 +++++---------------------------- | ||
12 | 3 files changed, 45 insertions(+), 28 deletions(-) | ||
5 | 13 | ||
6 | - KVM mode / in-kernel irqchip | 14 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
7 | - KVM mode / userspace irqchip | ||
8 | - TCG mode | ||
9 | |||
10 | In KVM mode / in-kernel irqchip , we explictly check whether | ||
11 | the chosen version is supported by the host. If the end-user | ||
12 | explicitly sets v2/v3 and this is not supported by the host, | ||
13 | then the user gets an explicit error message. Note that for | ||
14 | old kernels where the CREATE_DEVICE ioctl doesn't exist then | ||
15 | we will now fail if the user specifically asked for gicv2, | ||
16 | where previously we (probably) would have succeeded. | ||
17 | |||
18 | In KVM mode / userspace irqchip we immediatly output an error | ||
19 | in case the end-user explicitly selected v3. Also we warn the | ||
20 | end-user about the unexpected usage of gic-version=host in | ||
21 | that case as only userspace GICv2 is supported. | ||
22 | |||
23 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | ||
24 | Reviewed-by: Andrew Jones <drjones@redhat.com> | ||
25 | Message-id: 20200311131618.7187-6-eric.auger@redhat.com | ||
26 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
27 | --- | ||
28 | hw/arm/virt.c | 88 +++++++++++++++++++++++++++++++++++++++------------ | ||
29 | 1 file changed, 67 insertions(+), 21 deletions(-) | ||
30 | |||
31 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | ||
32 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
33 | --- a/hw/arm/virt.c | 16 | --- a/target/arm/helper.h |
34 | +++ b/hw/arm/virt.c | 17 | +++ b/target/arm/helper.h |
35 | @@ -XXX,XX +XXX,XX @@ static void virt_set_memmap(VirtMachineState *vms) | 18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_frsqrte_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
36 | */ | 19 | DEF_HELPER_FLAGS_4(gvec_frsqrte_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
37 | static void finalize_gic_version(VirtMachineState *vms) | 20 | DEF_HELPER_FLAGS_4(gvec_frsqrte_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
38 | { | 21 | |
39 | - if (vms->gic_version == VIRT_GIC_VERSION_HOST || | 22 | +DEF_HELPER_FLAGS_4(gvec_fcgt0_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
40 | - vms->gic_version == VIRT_GIC_VERSION_MAX) { | 23 | +DEF_HELPER_FLAGS_4(gvec_fcgt0_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
41 | - if (!kvm_enabled()) { | ||
42 | - if (vms->gic_version == VIRT_GIC_VERSION_HOST) { | ||
43 | - error_report("gic-version=host requires KVM"); | ||
44 | - exit(1); | ||
45 | - } else { | ||
46 | - /* "max": currently means 3 for TCG */ | ||
47 | - vms->gic_version = VIRT_GIC_VERSION_3; | ||
48 | - } | ||
49 | - } else { | ||
50 | - int probe_bitmap = kvm_arm_vgic_probe(); | ||
51 | + if (kvm_enabled()) { | ||
52 | + int probe_bitmap; | ||
53 | |||
54 | - if (!probe_bitmap) { | ||
55 | + if (!kvm_irqchip_in_kernel()) { | ||
56 | + switch (vms->gic_version) { | ||
57 | + case VIRT_GIC_VERSION_HOST: | ||
58 | + warn_report( | ||
59 | + "gic-version=host not relevant with kernel-irqchip=off " | ||
60 | + "as only userspace GICv2 is supported. Using v2 ..."); | ||
61 | + return; | ||
62 | + case VIRT_GIC_VERSION_MAX: | ||
63 | + case VIRT_GIC_VERSION_NOSEL: | ||
64 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
65 | + return; | ||
66 | + case VIRT_GIC_VERSION_2: | ||
67 | + return; | ||
68 | + case VIRT_GIC_VERSION_3: | ||
69 | error_report( | ||
70 | - "Unable to determine GIC version supported by host"); | ||
71 | + "gic-version=3 is not supported with kernel-irqchip=off"); | ||
72 | exit(1); | ||
73 | - } else { | ||
74 | - if (probe_bitmap & KVM_ARM_VGIC_V3) { | ||
75 | - vms->gic_version = VIRT_GIC_VERSION_3; | ||
76 | - } else { | ||
77 | - vms->gic_version = VIRT_GIC_VERSION_2; | ||
78 | - } | ||
79 | } | ||
80 | } | ||
81 | - } else if (vms->gic_version == VIRT_GIC_VERSION_NOSEL) { | ||
82 | + | 24 | + |
83 | + probe_bitmap = kvm_arm_vgic_probe(); | 25 | +DEF_HELPER_FLAGS_4(gvec_fcge0_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
84 | + if (!probe_bitmap) { | 26 | +DEF_HELPER_FLAGS_4(gvec_fcge0_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
85 | + error_report("Unable to determine GIC version supported by host"); | ||
86 | + exit(1); | ||
87 | + } | ||
88 | + | 27 | + |
89 | + switch (vms->gic_version) { | 28 | +DEF_HELPER_FLAGS_4(gvec_fceq0_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
90 | + case VIRT_GIC_VERSION_HOST: | 29 | +DEF_HELPER_FLAGS_4(gvec_fceq0_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
91 | + case VIRT_GIC_VERSION_MAX: | ||
92 | + if (probe_bitmap & KVM_ARM_VGIC_V3) { | ||
93 | + vms->gic_version = VIRT_GIC_VERSION_3; | ||
94 | + } else { | ||
95 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
96 | + } | ||
97 | + return; | ||
98 | + case VIRT_GIC_VERSION_NOSEL: | ||
99 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
100 | + break; | ||
101 | + case VIRT_GIC_VERSION_2: | ||
102 | + case VIRT_GIC_VERSION_3: | ||
103 | + break; | ||
104 | + } | ||
105 | + | 30 | + |
106 | + /* Check chosen version is effectively supported by the host */ | 31 | +DEF_HELPER_FLAGS_4(gvec_fcle0_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
107 | + if (vms->gic_version == VIRT_GIC_VERSION_2 && | 32 | +DEF_HELPER_FLAGS_4(gvec_fcle0_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
108 | + !(probe_bitmap & KVM_ARM_VGIC_V2)) { | 33 | + |
109 | + error_report("host does not support in-kernel GICv2 emulation"); | 34 | +DEF_HELPER_FLAGS_4(gvec_fclt0_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
110 | + exit(1); | 35 | +DEF_HELPER_FLAGS_4(gvec_fclt0_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
111 | + } else if (vms->gic_version == VIRT_GIC_VERSION_3 && | 36 | + |
112 | + !(probe_bitmap & KVM_ARM_VGIC_V3)) { | 37 | DEF_HELPER_FLAGS_5(gvec_fadd_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
113 | + error_report("host does not support in-kernel GICv3 emulation"); | 38 | DEF_HELPER_FLAGS_5(gvec_fadd_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
114 | + exit(1); | 39 | DEF_HELPER_FLAGS_5(gvec_fadd_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
115 | + } | 40 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
116 | + return; | 41 | index XXXXXXX..XXXXXXX 100644 |
42 | --- a/target/arm/vec_helper.c | ||
43 | +++ b/target/arm/vec_helper.c | ||
44 | @@ -XXX,XX +XXX,XX @@ DO_2OP(gvec_frsqrte_h, helper_rsqrte_f16, float16) | ||
45 | DO_2OP(gvec_frsqrte_s, helper_rsqrte_f32, float32) | ||
46 | DO_2OP(gvec_frsqrte_d, helper_rsqrte_f64, float64) | ||
47 | |||
48 | +#define WRAP_CMP0_FWD(FN, CMPOP, TYPE) \ | ||
49 | + static TYPE TYPE##_##FN##0(TYPE op, float_status *stat) \ | ||
50 | + { \ | ||
51 | + return TYPE##_##CMPOP(op, TYPE##_zero, stat); \ | ||
117 | + } | 52 | + } |
118 | + | 53 | + |
119 | + /* TCG mode */ | 54 | +#define WRAP_CMP0_REV(FN, CMPOP, TYPE) \ |
120 | + switch (vms->gic_version) { | 55 | + static TYPE TYPE##_##FN##0(TYPE op, float_status *stat) \ |
121 | + case VIRT_GIC_VERSION_NOSEL: | 56 | + { \ |
122 | vms->gic_version = VIRT_GIC_VERSION_2; | 57 | + return TYPE##_##CMPOP(TYPE##_zero, op, stat); \ |
123 | + break; | 58 | + } |
124 | + case VIRT_GIC_VERSION_MAX: | 59 | + |
125 | + vms->gic_version = VIRT_GIC_VERSION_3; | 60 | +#define DO_2OP_CMP0(FN, CMPOP, DIRN) \ |
126 | + break; | 61 | + WRAP_CMP0_##DIRN(FN, CMPOP, float16) \ |
127 | + case VIRT_GIC_VERSION_HOST: | 62 | + WRAP_CMP0_##DIRN(FN, CMPOP, float32) \ |
128 | + error_report("gic-version=host requires KVM"); | 63 | + DO_2OP(gvec_f##FN##0_h, float16_##FN##0, float16) \ |
129 | + exit(1); | 64 | + DO_2OP(gvec_f##FN##0_s, float32_##FN##0, float32) |
130 | + case VIRT_GIC_VERSION_2: | 65 | + |
131 | + case VIRT_GIC_VERSION_3: | 66 | +DO_2OP_CMP0(cgt, cgt, FWD) |
132 | + break; | 67 | +DO_2OP_CMP0(cge, cge, FWD) |
133 | } | 68 | +DO_2OP_CMP0(ceq, ceq, FWD) |
69 | +DO_2OP_CMP0(clt, cgt, REV) | ||
70 | +DO_2OP_CMP0(cle, cge, REV) | ||
71 | + | ||
72 | #undef DO_2OP | ||
73 | +#undef DO_2OP_CMP0 | ||
74 | |||
75 | /* Floating-point trigonometric starting value. | ||
76 | * See the ARM ARM pseudocode function FPTrigSMul. | ||
77 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
78 | index XXXXXXX..XXXXXXX 100644 | ||
79 | --- a/target/arm/translate-neon.c.inc | ||
80 | +++ b/target/arm/translate-neon.c.inc | ||
81 | @@ -XXX,XX +XXX,XX @@ DO_2MISC_FP(VCVT_UF, gen_helper_vfp_touizs) | ||
82 | |||
83 | DO_2MISC_FP_VEC(VRECPE_F, gen_helper_gvec_frecpe_h, gen_helper_gvec_frecpe_s) | ||
84 | DO_2MISC_FP_VEC(VRSQRTE_F, gen_helper_gvec_frsqrte_h, gen_helper_gvec_frsqrte_s) | ||
85 | +DO_2MISC_FP_VEC(VCGT0_F, gen_helper_gvec_fcgt0_h, gen_helper_gvec_fcgt0_s) | ||
86 | +DO_2MISC_FP_VEC(VCGE0_F, gen_helper_gvec_fcge0_h, gen_helper_gvec_fcge0_s) | ||
87 | +DO_2MISC_FP_VEC(VCEQ0_F, gen_helper_gvec_fceq0_h, gen_helper_gvec_fceq0_s) | ||
88 | +DO_2MISC_FP_VEC(VCLT0_F, gen_helper_gvec_fclt0_h, gen_helper_gvec_fclt0_s) | ||
89 | +DO_2MISC_FP_VEC(VCLE0_F, gen_helper_gvec_fcle0_h, gen_helper_gvec_fcle0_s) | ||
90 | |||
91 | static bool trans_VRINTX(DisasContext *s, arg_2misc *a) | ||
92 | { | ||
93 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINTX(DisasContext *s, arg_2misc *a) | ||
94 | return do_2misc_fp(s, a, gen_helper_rints_exact); | ||
134 | } | 95 | } |
135 | 96 | ||
97 | -#define WRAP_FP_CMP0_FWD(WRAPNAME, FUNC) \ | ||
98 | - static void WRAPNAME(TCGv_i32 d, TCGv_i32 m, TCGv_ptr fpst) \ | ||
99 | - { \ | ||
100 | - TCGv_i32 zero = tcg_const_i32(0); \ | ||
101 | - FUNC(d, m, zero, fpst); \ | ||
102 | - tcg_temp_free_i32(zero); \ | ||
103 | - } | ||
104 | -#define WRAP_FP_CMP0_REV(WRAPNAME, FUNC) \ | ||
105 | - static void WRAPNAME(TCGv_i32 d, TCGv_i32 m, TCGv_ptr fpst) \ | ||
106 | - { \ | ||
107 | - TCGv_i32 zero = tcg_const_i32(0); \ | ||
108 | - FUNC(d, zero, m, fpst); \ | ||
109 | - tcg_temp_free_i32(zero); \ | ||
110 | - } | ||
111 | - | ||
112 | -#define DO_FP_CMP0(INSN, FUNC, REV) \ | ||
113 | - WRAP_FP_CMP0_##REV(gen_##INSN, FUNC) \ | ||
114 | - static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ | ||
115 | - { \ | ||
116 | - return do_2misc_fp(s, a, gen_##INSN); \ | ||
117 | - } | ||
118 | - | ||
119 | -DO_FP_CMP0(VCGT0_F, gen_helper_neon_cgt_f32, FWD) | ||
120 | -DO_FP_CMP0(VCGE0_F, gen_helper_neon_cge_f32, FWD) | ||
121 | -DO_FP_CMP0(VCEQ0_F, gen_helper_neon_ceq_f32, FWD) | ||
122 | -DO_FP_CMP0(VCLE0_F, gen_helper_neon_cge_f32, REV) | ||
123 | -DO_FP_CMP0(VCLT0_F, gen_helper_neon_cgt_f32, REV) | ||
124 | - | ||
125 | static bool do_vrint(DisasContext *s, arg_2misc *a, int rmode) | ||
126 | { | ||
127 | /* | ||
136 | -- | 128 | -- |
137 | 2.20.1 | 129 | 2.20.1 |
138 | 130 | ||
139 | 131 | diff view generated by jsdifflib |
1 | From: Eric Auger <eric.auger@redhat.com> | 1 | Convert the Neon VRECPS insn to using a gvec helper, and |
---|---|---|---|
2 | use this to implement the fp16 case. | ||
2 | 3 | ||
3 | Let's move the code which freezes which gic-version to | 4 | The phrasing of the new float32_recps_nf() is slightly different from |
4 | be applied in a dedicated function. We also now set by | 5 | the old recps_f32() so that it parallels the f16 version; for f16 we |
5 | default the VIRT_GIC_VERSION_NO_SET. This eventually | 6 | can't assume that flush-to-zero is always enabled. |
6 | turns into the legacy v2 choice in the finalize() function. | ||
7 | 7 | ||
8 | Signed-off-by: Eric Auger <eric.auger@redhat.com> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
10 | Reviewed-by: Andrew Jones <drjones@redhat.com> | 10 | Message-id: 20200828183354.27913-34-peter.maydell@linaro.org |
11 | Message-id: 20200311131618.7187-4-eric.auger@redhat.com | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | --- | 11 | --- |
14 | include/hw/arm/virt.h | 1 + | 12 | target/arm/helper.h | 4 +++- |
15 | hw/arm/virt.c | 54 ++++++++++++++++++++++++++----------------- | 13 | target/arm/vec_helper.c | 31 +++++++++++++++++++++++++++++++ |
16 | 2 files changed, 34 insertions(+), 21 deletions(-) | 14 | target/arm/vfp_helper.c | 13 ------------- |
15 | target/arm/translate-neon.c.inc | 21 +-------------------- | ||
16 | 4 files changed, 35 insertions(+), 34 deletions(-) | ||
17 | 17 | ||
18 | diff --git a/include/hw/arm/virt.h b/include/hw/arm/virt.h | 18 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
19 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/include/hw/arm/virt.h | 20 | --- a/target/arm/helper.h |
21 | +++ b/include/hw/arm/virt.h | 21 | +++ b/target/arm/helper.h |
22 | @@ -XXX,XX +XXX,XX @@ typedef enum VirtGICType { | 22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(vfp_muladdd, f64, f64, f64, f64, ptr) |
23 | VIRT_GIC_VERSION_HOST, | 23 | DEF_HELPER_4(vfp_muladds, f32, f32, f32, f32, ptr) |
24 | VIRT_GIC_VERSION_2, | 24 | DEF_HELPER_4(vfp_muladdh, f16, f16, f16, f16, ptr) |
25 | VIRT_GIC_VERSION_3, | 25 | |
26 | + VIRT_GIC_VERSION_NOSEL, | 26 | -DEF_HELPER_3(recps_f32, f32, env, f32, f32) |
27 | } VirtGICType; | 27 | DEF_HELPER_3(rsqrts_f32, f32, env, f32, f32) |
28 | 28 | DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr) | |
29 | typedef struct MemMapEntry { | 29 | DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr) |
30 | diff --git a/hw/arm/virt.c b/hw/arm/virt.c | 30 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmaxnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i3 |
31 | DEF_HELPER_FLAGS_5(gvec_fminnum_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
32 | DEF_HELPER_FLAGS_5(gvec_fminnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
33 | |||
34 | +DEF_HELPER_FLAGS_5(gvec_recps_nf_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
35 | +DEF_HELPER_FLAGS_5(gvec_recps_nf_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
36 | + | ||
37 | DEF_HELPER_FLAGS_5(gvec_fmla_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
38 | DEF_HELPER_FLAGS_5(gvec_fmla_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | ||
39 | |||
40 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
31 | index XXXXXXX..XXXXXXX 100644 | 41 | index XXXXXXX..XXXXXXX 100644 |
32 | --- a/hw/arm/virt.c | 42 | --- a/target/arm/vec_helper.c |
33 | +++ b/hw/arm/virt.c | 43 | +++ b/target/arm/vec_helper.c |
34 | @@ -XXX,XX +XXX,XX @@ static void virt_set_memmap(VirtMachineState *vms) | 44 | @@ -XXX,XX +XXX,XX @@ static float32 float32_abd(float32 op1, float32 op2, float_status *stat) |
35 | } | 45 | return float32_abs(float32_sub(op1, op2, stat)); |
36 | } | 46 | } |
37 | 47 | ||
38 | +/* | 48 | +/* |
39 | + * finalize_gic_version - Determines the final gic_version | 49 | + * Reciprocal step. These are the AArch32 version which uses a |
40 | + * according to the gic-version property | 50 | + * non-fused multiply-and-subtract. |
41 | + * | ||
42 | + * Default GIC type is v2 | ||
43 | + */ | 51 | + */ |
44 | +static void finalize_gic_version(VirtMachineState *vms) | 52 | +static float16 float16_recps_nf(float16 op1, float16 op2, float_status *stat) |
45 | +{ | 53 | +{ |
46 | + if (vms->gic_version == VIRT_GIC_VERSION_HOST || | 54 | + op1 = float16_squash_input_denormal(op1, stat); |
47 | + vms->gic_version == VIRT_GIC_VERSION_MAX) { | 55 | + op2 = float16_squash_input_denormal(op2, stat); |
48 | + if (!kvm_enabled()) { | 56 | + |
49 | + if (vms->gic_version == VIRT_GIC_VERSION_HOST) { | 57 | + if ((float16_is_infinity(op1) && float16_is_zero(op2)) || |
50 | + error_report("gic-version=host requires KVM"); | 58 | + (float16_is_infinity(op2) && float16_is_zero(op1))) { |
51 | + exit(1); | 59 | + return float16_two; |
52 | + } else { | ||
53 | + /* "max": currently means 3 for TCG */ | ||
54 | + vms->gic_version = VIRT_GIC_VERSION_3; | ||
55 | + } | ||
56 | + } else { | ||
57 | + vms->gic_version = kvm_arm_vgic_probe(); | ||
58 | + if (!vms->gic_version) { | ||
59 | + error_report( | ||
60 | + "Unable to determine GIC version supported by host"); | ||
61 | + exit(1); | ||
62 | + } | ||
63 | + } | ||
64 | + } else if (vms->gic_version == VIRT_GIC_VERSION_NOSEL) { | ||
65 | + vms->gic_version = VIRT_GIC_VERSION_2; | ||
66 | + } | 60 | + } |
61 | + return float16_sub(float16_two, float16_mul(op1, op2, stat), stat); | ||
67 | +} | 62 | +} |
68 | + | 63 | + |
69 | static void machvirt_init(MachineState *machine) | 64 | +static float32 float32_recps_nf(float32 op1, float32 op2, float_status *stat) |
65 | +{ | ||
66 | + op1 = float32_squash_input_denormal(op1, stat); | ||
67 | + op2 = float32_squash_input_denormal(op2, stat); | ||
68 | + | ||
69 | + if ((float32_is_infinity(op1) && float32_is_zero(op2)) || | ||
70 | + (float32_is_infinity(op2) && float32_is_zero(op1))) { | ||
71 | + return float32_two; | ||
72 | + } | ||
73 | + return float32_sub(float32_two, float32_mul(op1, op2, stat), stat); | ||
74 | +} | ||
75 | + | ||
76 | #define DO_3OP(NAME, FUNC, TYPE) \ | ||
77 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ | ||
78 | { \ | ||
79 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_fmaxnum_s, float32_maxnum, float32) | ||
80 | DO_3OP(gvec_fminnum_h, float16_minnum, float16) | ||
81 | DO_3OP(gvec_fminnum_s, float32_minnum, float32) | ||
82 | |||
83 | +DO_3OP(gvec_recps_nf_h, float16_recps_nf, float16) | ||
84 | +DO_3OP(gvec_recps_nf_s, float32_recps_nf, float32) | ||
85 | + | ||
86 | #ifdef TARGET_AARCH64 | ||
87 | |||
88 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) | ||
89 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
90 | index XXXXXXX..XXXXXXX 100644 | ||
91 | --- a/target/arm/vfp_helper.c | ||
92 | +++ b/target/arm/vfp_helper.c | ||
93 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(vfp_fcvt_f64_to_f16)(float64 a, void *fpstp, uint32_t ahp_mode) | ||
94 | return r; | ||
95 | } | ||
96 | |||
97 | -float32 HELPER(recps_f32)(CPUARMState *env, float32 a, float32 b) | ||
98 | -{ | ||
99 | - float_status *s = &env->vfp.standard_fp_status; | ||
100 | - if ((float32_is_infinity(a) && float32_is_zero_or_denormal(b)) || | ||
101 | - (float32_is_infinity(b) && float32_is_zero_or_denormal(a))) { | ||
102 | - if (!(float32_is_zero(a) || float32_is_zero(b))) { | ||
103 | - float_raise(float_flag_input_denormal, s); | ||
104 | - } | ||
105 | - return float32_two; | ||
106 | - } | ||
107 | - return float32_sub(float32_two, float32_mul(a, b, s), s); | ||
108 | -} | ||
109 | - | ||
110 | float32 HELPER(rsqrts_f32)(CPUARMState *env, float32 a, float32 b) | ||
70 | { | 111 | { |
71 | VirtMachineState *vms = VIRT_MACHINE(machine); | 112 | float_status *s = &env->vfp.standard_fp_status; |
72 | @@ -XXX,XX +XXX,XX @@ static void machvirt_init(MachineState *machine) | 113 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
73 | /* We can probe only here because during property set | 114 | index XXXXXXX..XXXXXXX 100644 |
74 | * KVM is not available yet | 115 | --- a/target/arm/translate-neon.c.inc |
75 | */ | 116 | +++ b/target/arm/translate-neon.c.inc |
76 | - if (vms->gic_version == VIRT_GIC_VERSION_HOST || | 117 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VMLA, gen_helper_gvec_fmla_s, gen_helper_gvec_fmla_h) |
77 | - vms->gic_version == VIRT_GIC_VERSION_MAX) { | 118 | DO_3S_FP_GVEC(VMLS, gen_helper_gvec_fmls_s, gen_helper_gvec_fmls_h) |
78 | - if (!kvm_enabled()) { | 119 | DO_3S_FP_GVEC(VFMA, gen_helper_gvec_vfma_s, gen_helper_gvec_vfma_h) |
79 | - if (vms->gic_version == VIRT_GIC_VERSION_HOST) { | 120 | DO_3S_FP_GVEC(VFMS, gen_helper_gvec_vfms_s, gen_helper_gvec_vfms_h) |
80 | - error_report("gic-version=host requires KVM"); | 121 | +DO_3S_FP_GVEC(VRECPS, gen_helper_gvec_recps_nf_s, gen_helper_gvec_recps_nf_h) |
81 | - exit(1); | 122 | |
82 | - } else { | 123 | WRAP_FP_GVEC(gen_VMAXNM_fp32_3s, FPST_STD, gen_helper_gvec_fmaxnum_s) |
83 | - /* "max": currently means 3 for TCG */ | 124 | WRAP_FP_GVEC(gen_VMAXNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fmaxnum_h) |
84 | - vms->gic_version = VIRT_GIC_VERSION_3; | 125 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMINNM_fp_3s(DisasContext *s, arg_3same *a) |
85 | - } | 126 | return do_3same(s, a, gen_VMINNM_fp32_3s); |
86 | - } else { | 127 | } |
87 | - vms->gic_version = kvm_arm_vgic_probe(); | 128 | |
88 | - if (!vms->gic_version) { | 129 | -WRAP_ENV_FN(gen_VRECPS_tramp, gen_helper_recps_f32) |
89 | - error_report( | 130 | - |
90 | - "Unable to determine GIC version supported by host"); | 131 | -static void gen_VRECPS_fp_3s(unsigned vece, uint32_t rd_ofs, |
91 | - exit(1); | 132 | - uint32_t rn_ofs, uint32_t rm_ofs, |
92 | - } | 133 | - uint32_t oprsz, uint32_t maxsz) |
93 | - } | 134 | -{ |
135 | - static const GVecGen3 ops = { .fni4 = gen_VRECPS_tramp }; | ||
136 | - tcg_gen_gvec_3(rd_ofs, rn_ofs, rm_ofs, oprsz, maxsz, &ops); | ||
137 | -} | ||
138 | - | ||
139 | -static bool trans_VRECPS_fp_3s(DisasContext *s, arg_3same *a) | ||
140 | -{ | ||
141 | - if (a->size != 0) { | ||
142 | - /* TODO fp16 support */ | ||
143 | - return false; | ||
94 | - } | 144 | - } |
95 | + finalize_gic_version(vms); | 145 | - |
96 | 146 | - return do_3same(s, a, gen_VRECPS_fp_3s); | |
97 | if (!cpu_type_valid(machine->cpu_type)) { | 147 | -} |
98 | error_report("mach-virt: CPU type %s not supported", machine->cpu_type); | 148 | - |
99 | @@ -XXX,XX +XXX,XX @@ static void virt_instance_init(Object *obj) | 149 | WRAP_ENV_FN(gen_VRSQRTS_tramp, gen_helper_rsqrts_f32) |
100 | "Set on/off to enable/disable using " | 150 | |
101 | "physical address space above 32 bits", | 151 | static void gen_VRSQRTS_fp_3s(unsigned vece, uint32_t rd_ofs, |
102 | NULL); | ||
103 | - /* Default GIC type is v2 */ | ||
104 | - vms->gic_version = VIRT_GIC_VERSION_2; | ||
105 | + vms->gic_version = VIRT_GIC_VERSION_NOSEL; | ||
106 | object_property_add_str(obj, "gic-version", virt_get_gic_version, | ||
107 | virt_set_gic_version, NULL); | ||
108 | object_property_set_description(obj, "gic-version", | ||
109 | -- | 152 | -- |
110 | 2.20.1 | 153 | 2.20.1 |
111 | 154 | ||
112 | 155 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | Convert the Neon VRSQRTS insn to using a gvec helper, |
---|---|---|---|
2 | and use this to implement the fp16 case. | ||
2 | 3 | ||
3 | This test boots U-Boot then NetBSD (stored on a SD card) on | 4 | As with VRECPS, we adjust the phrasing of the new implementation |
4 | a OrangePi PC board. | 5 | slightly so that the fp32 version parallels the fp16 one. |
5 | 6 | ||
6 | As it requires ~1.3GB of storage, it is disabled by default. | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20200828183354.27913-35-peter.maydell@linaro.org | ||
10 | --- | ||
11 | target/arm/helper.h | 4 +++- | ||
12 | target/arm/vec_helper.c | 30 ++++++++++++++++++++++++++++++ | ||
13 | target/arm/vfp_helper.c | 15 --------------- | ||
14 | target/arm/translate-neon.c.inc | 21 +-------------------- | ||
15 | 4 files changed, 34 insertions(+), 36 deletions(-) | ||
7 | 16 | ||
8 | U-Boot is built by the Debian project [1], and the SD card image | 17 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
9 | is provided by the NetBSD organization [2]. | ||
10 | |||
11 | Once the compressed SD card image is downloaded (304MB) and | ||
12 | extracted, this test is fast: | ||
13 | |||
14 | $ AVOCADO_ALLOW_LARGE_STORAGE=yes \ | ||
15 | avocado --show=app,console run -t machine:orangepi-pc \ | ||
16 | tests/acceptance/boot_linux_console.py | ||
17 | console: U-Boot SPL 2020.01+dfsg-1 (Jan 08 2020 - 08:19:44 +0000) | ||
18 | console: DRAM: 1024 MiB | ||
19 | console: U-Boot 2020.01+dfsg-1 (Jan 08 2020 - 08:19:44 +0000) Allwinner Technology | ||
20 | console: CPU: Allwinner H3 (SUN8I 0000) | ||
21 | console: scanning bus usb@1c1b000 for devices... 1 USB Device(s) found | ||
22 | console: scanning bus usb@1c1d000 for devices... 1 USB Device(s) found | ||
23 | console: scanning usb for storage devices... 0 Storage Device(s) found | ||
24 | console: Hit any key to stop autoboot: 0 | ||
25 | console: => setenv bootargs root=ld0a | ||
26 | console: => setenv kernel netbsd-GENERIC.ub | ||
27 | console: => setenv fdtfile dtb/sun8i-h3-orangepi-pc.dtb | ||
28 | console: => boot | ||
29 | console: ## Booting kernel from Legacy Image at 42000000 ... | ||
30 | console: Image Name: NetBSD/earmv7hf 9.0_RC1 | ||
31 | console: Image Type: ARM Linux Kernel Image (no loading done) (uncompressed) | ||
32 | console: XIP Kernel Image (no loading done) | ||
33 | console: Loading Device Tree to 49ff6000, end 49fffe01 ... OK | ||
34 | console: Starting kernel ... | ||
35 | console: [ 1.0000000] NetBSD/evbarm (fdt) booting ... | ||
36 | console: [ 1.0000000] NetBSD 9.0 (GENERIC) #0: Fri Feb 14 00:06:28 UTC 2020 | ||
37 | console: [ 1.0000000] mkrepro@mkrepro.NetBSD.org:/usr/src/sys/arch/evbarm/compile/GENERIC | ||
38 | console: [ 1.0000000] total memory = 1024 MB | ||
39 | console: [ 1.0000000] avail memory = 1003 MB | ||
40 | console: [ 1.0000000] armfdt0 (root) | ||
41 | console: [ 1.0000000] simplebus0 at armfdt0: Xunlong Orange Pi PC | ||
42 | console: [ 1.0000000] cpu0 at cpus0: Cortex-A7 r0p5 (Cortex V7A core) | ||
43 | console: [ 1.0000000] cpu0: DC enabled IC enabled WB enabled LABT branch prediction enabled | ||
44 | console: [ 1.0000000] cpu0: 32KB/64B 2-way L1 VIPT Instruction cache | ||
45 | console: [ 1.0000000] cpu0: 32KB/64B 2-way write-back-locking-C L1 PIPT Data cache | ||
46 | console: [ 1.0000000] cpu0: 2304KB/64B 16-way write-through L2 PIPT Unified cache | ||
47 | console: [ 1.0000000] vfp0 at cpu0: NEON MPE (VFP 3.0+), rounding, NaN propagation, denormals | ||
48 | ... | ||
49 | console: [ 2.3812082] sdmmc0: SD card status: 4-bit, C0 | ||
50 | console: [ 2.3812082] ld0 at sdmmc0: <0xaa:0x5859:QEMU!:0x01:0xdeadbeef:0x062> | ||
51 | console: [ 2.4012856] ld0: 1226 MB, 622 cyl, 64 head, 63 sec, 512 bytes/sect x 2511872 sectors | ||
52 | console: [ 2.5321222] ld0: 4-bit width, High-Speed/SDR25, 50.000 MHz | ||
53 | console: [ 3.1068718] WARNING: 4 errors while detecting hardware; check system log. | ||
54 | console: [ 3.1179868] boot device: ld0 | ||
55 | console: [ 3.1470623] root on ld0a dumps on ld0b | ||
56 | console: [ 3.2464436] root file system type: ffs | ||
57 | console: [ 3.2897123] kern.module.path=/stand/evbarm/9.0/modules | ||
58 | console: Mon Feb 17 20:33:35 UTC 2020 | ||
59 | console: Starting root file system check: | ||
60 | PASS (35.96 s) | ||
61 | RESULTS : PASS 1 | ERROR 0 | FAIL 0 | SKIP 0 | WARN 0 | INTERRUPT 0 | CANCEL 0 | ||
62 | JOB TIME : 36.09 s | ||
63 | |||
64 | Note, this test only took ~65 seconds to run on Travis-CI, see: [3]. | ||
65 | |||
66 | This test is based on a description from Niek Linnenbank from [4]. | ||
67 | |||
68 | [1] https://wiki.debian.org/InstallingDebianOn/Allwinner#Creating_a_bootable_SD_Card_with_u-boot | ||
69 | [2] https://wiki.netbsd.org/ports/evbarm/allwinner/ | ||
70 | [3] https://travis-ci.org/philmd/qemu/jobs/638823612#L3778 | ||
71 | [4] https://www.mail-archive.com/qemu-devel@nongnu.org/msg669347.html | ||
72 | |||
73 | Signed-off-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
74 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
75 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
76 | Tested-by: Alex Bennée <alex.bennee@linaro.org> | ||
77 | Message-id: 20200311221854.30370-18-nieklinnenbank@gmail.com | ||
78 | [NL: changed test to use NetBSD 9.0 final release and -global allwinner-rtc.base-year] | ||
79 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
80 | --- | ||
81 | tests/acceptance/boot_linux_console.py | 70 ++++++++++++++++++++++++++ | ||
82 | 1 file changed, 70 insertions(+) | ||
83 | |||
84 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | ||
85 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
86 | --- a/tests/acceptance/boot_linux_console.py | 19 | --- a/target/arm/helper.h |
87 | +++ b/tests/acceptance/boot_linux_console.py | 20 | +++ b/target/arm/helper.h |
88 | @@ -XXX,XX +XXX,XX @@ import shutil | 21 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(vfp_muladdd, f64, f64, f64, f64, ptr) |
89 | from avocado import skipUnless | 22 | DEF_HELPER_4(vfp_muladds, f32, f32, f32, f32, ptr) |
90 | from avocado_qemu import Test | 23 | DEF_HELPER_4(vfp_muladdh, f16, f16, f16, f16, ptr) |
91 | from avocado_qemu import exec_command_and_wait_for_pattern | 24 | |
92 | +from avocado_qemu import interrupt_interactive_console_until_pattern | 25 | -DEF_HELPER_3(rsqrts_f32, f32, env, f32, f32) |
93 | from avocado_qemu import wait_for_console_pattern | 26 | DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr) |
94 | from avocado.utils import process | 27 | DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr) |
95 | from avocado.utils import archive | 28 | DEF_HELPER_FLAGS_2(recpe_f64, TCG_CALL_NO_RWG, f64, f64, ptr) |
96 | @@ -XXX,XX +XXX,XX @@ class BootLinuxConsole(Test): | 29 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fminnum_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i3 |
97 | 'to <orangepipc>') | 30 | DEF_HELPER_FLAGS_5(gvec_recps_nf_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
98 | self.wait_for_console_pattern('Starting Load Kernel Modules...') | 31 | DEF_HELPER_FLAGS_5(gvec_recps_nf_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
99 | 32 | ||
100 | + @skipUnless(os.getenv('AVOCADO_ALLOW_LARGE_STORAGE'), 'storage limited') | 33 | +DEF_HELPER_FLAGS_5(gvec_rsqrts_nf_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
101 | + def test_arm_orangepi_uboot_netbsd9(self): | 34 | +DEF_HELPER_FLAGS_5(gvec_rsqrts_nf_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
102 | + """ | ||
103 | + :avocado: tags=arch:arm | ||
104 | + :avocado: tags=machine:orangepi-pc | ||
105 | + """ | ||
106 | + # This test download a 304MB compressed image and expand it to 1.3GB... | ||
107 | + deb_url = ('http://snapshot.debian.org/archive/debian/' | ||
108 | + '20200108T145233Z/pool/main/u/u-boot/' | ||
109 | + 'u-boot-sunxi_2020.01%2Bdfsg-1_armhf.deb') | ||
110 | + deb_hash = 'f67f404a80753ca3d1258f13e38f2b060e13db99' | ||
111 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | ||
112 | + # We use the common OrangePi PC 'plus' build of U-Boot for our secondary | ||
113 | + # program loader (SPL). We will then set the path to the more specific | ||
114 | + # OrangePi "PC" device tree blob with 'setenv fdtfile' in U-Boot prompt, | ||
115 | + # before to boot NetBSD. | ||
116 | + uboot_path = '/usr/lib/u-boot/orangepi_plus/u-boot-sunxi-with-spl.bin' | ||
117 | + uboot_path = self.extract_from_deb(deb_path, uboot_path) | ||
118 | + image_url = ('https://cdn.netbsd.org/pub/NetBSD/NetBSD-9.0/' | ||
119 | + 'evbarm-earmv7hf/binary/gzimg/armv7.img.gz') | ||
120 | + image_hash = '2babb29d36d8360adcb39c09e31060945259917a' | ||
121 | + image_path_gz = self.fetch_asset(image_url, asset_hash=image_hash) | ||
122 | + image_path = os.path.join(self.workdir, 'armv7.img') | ||
123 | + image_drive_args = 'if=sd,format=raw,snapshot=on,file=' + image_path | ||
124 | + archive.gzip_uncompress(image_path_gz, image_path) | ||
125 | + | 35 | + |
126 | + # dd if=u-boot-sunxi-with-spl.bin of=armv7.img bs=1K seek=8 conv=notrunc | 36 | DEF_HELPER_FLAGS_5(gvec_fmla_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
127 | + with open(uboot_path, 'rb') as f_in: | 37 | DEF_HELPER_FLAGS_5(gvec_fmla_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
128 | + with open(image_path, 'r+b') as f_out: | 38 | |
129 | + f_out.seek(8 * 1024) | 39 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
130 | + shutil.copyfileobj(f_in, f_out) | 40 | index XXXXXXX..XXXXXXX 100644 |
41 | --- a/target/arm/vec_helper.c | ||
42 | +++ b/target/arm/vec_helper.c | ||
43 | @@ -XXX,XX +XXX,XX @@ static float32 float32_recps_nf(float32 op1, float32 op2, float_status *stat) | ||
44 | return float32_sub(float32_two, float32_mul(op1, op2, stat), stat); | ||
45 | } | ||
46 | |||
47 | +/* Reciprocal square-root step. AArch32 non-fused semantics. */ | ||
48 | +static float16 float16_rsqrts_nf(float16 op1, float16 op2, float_status *stat) | ||
49 | +{ | ||
50 | + op1 = float16_squash_input_denormal(op1, stat); | ||
51 | + op2 = float16_squash_input_denormal(op2, stat); | ||
131 | + | 52 | + |
132 | + # Extend image, to avoid that NetBSD thinks the partition | 53 | + if ((float16_is_infinity(op1) && float16_is_zero(op2)) || |
133 | + # inside the image is larger than device size itself | 54 | + (float16_is_infinity(op2) && float16_is_zero(op1))) { |
134 | + f_out.seek(0, 2) | 55 | + return float16_one_point_five; |
135 | + f_out.seek(64 * 1024 * 1024, 1) | 56 | + } |
136 | + f_out.write(bytearray([0x00])) | 57 | + op1 = float16_sub(float16_three, float16_mul(op1, op2, stat), stat); |
58 | + return float16_div(op1, float16_two, stat); | ||
59 | +} | ||
137 | + | 60 | + |
138 | + self.vm.set_console() | 61 | +static float32 float32_rsqrts_nf(float32 op1, float32 op2, float_status *stat) |
139 | + self.vm.add_args('-nic', 'user', | 62 | +{ |
140 | + '-drive', image_drive_args, | 63 | + op1 = float32_squash_input_denormal(op1, stat); |
141 | + '-global', 'allwinner-rtc.base-year=2000', | 64 | + op2 = float32_squash_input_denormal(op2, stat); |
142 | + '-no-reboot') | ||
143 | + self.vm.launch() | ||
144 | + wait_for_console_pattern(self, 'U-Boot 2020.01+dfsg-1') | ||
145 | + interrupt_interactive_console_until_pattern(self, | ||
146 | + 'Hit any key to stop autoboot:', | ||
147 | + 'switch to partitions #0, OK') | ||
148 | + | 65 | + |
149 | + exec_command_and_wait_for_pattern(self, '', '=>') | 66 | + if ((float32_is_infinity(op1) && float32_is_zero(op2)) || |
150 | + cmd = 'setenv bootargs root=ld0a' | 67 | + (float32_is_infinity(op2) && float32_is_zero(op1))) { |
151 | + exec_command_and_wait_for_pattern(self, cmd, '=>') | 68 | + return float32_one_point_five; |
152 | + cmd = 'setenv kernel netbsd-GENERIC.ub' | 69 | + } |
153 | + exec_command_and_wait_for_pattern(self, cmd, '=>') | 70 | + op1 = float32_sub(float32_three, float32_mul(op1, op2, stat), stat); |
154 | + cmd = 'setenv fdtfile dtb/sun8i-h3-orangepi-pc.dtb' | 71 | + return float32_div(op1, float32_two, stat); |
155 | + exec_command_and_wait_for_pattern(self, cmd, '=>') | 72 | +} |
156 | + cmd = ("setenv bootcmd 'fatload mmc 0:1 ${kernel_addr_r} ${kernel}; " | ||
157 | + "fatload mmc 0:1 ${fdt_addr_r} ${fdtfile}; " | ||
158 | + "fdt addr ${fdt_addr_r}; " | ||
159 | + "bootm ${kernel_addr_r} - ${fdt_addr_r}'") | ||
160 | + exec_command_and_wait_for_pattern(self, cmd, '=>') | ||
161 | + | 73 | + |
162 | + exec_command_and_wait_for_pattern(self, 'boot', | 74 | #define DO_3OP(NAME, FUNC, TYPE) \ |
163 | + 'Booting kernel from Legacy Image') | 75 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ |
164 | + wait_for_console_pattern(self, 'Starting kernel ...') | 76 | { \ |
165 | + wait_for_console_pattern(self, 'NetBSD 9.0 (GENERIC)') | 77 | @@ -XXX,XX +XXX,XX @@ DO_3OP(gvec_fminnum_s, float32_minnum, float32) |
166 | + # Wait for user-space | 78 | DO_3OP(gvec_recps_nf_h, float16_recps_nf, float16) |
167 | + wait_for_console_pattern(self, 'Starting root file system check') | 79 | DO_3OP(gvec_recps_nf_s, float32_recps_nf, float32) |
80 | |||
81 | +DO_3OP(gvec_rsqrts_nf_h, float16_rsqrts_nf, float16) | ||
82 | +DO_3OP(gvec_rsqrts_nf_s, float32_rsqrts_nf, float32) | ||
168 | + | 83 | + |
169 | def test_s390x_s390_ccw_virtio(self): | 84 | #ifdef TARGET_AARCH64 |
170 | """ | 85 | |
171 | :avocado: tags=arch:s390x | 86 | DO_3OP(gvec_recps_h, helper_recpsf_f16, float16) |
87 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
88 | index XXXXXXX..XXXXXXX 100644 | ||
89 | --- a/target/arm/vfp_helper.c | ||
90 | +++ b/target/arm/vfp_helper.c | ||
91 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(vfp_fcvt_f64_to_f16)(float64 a, void *fpstp, uint32_t ahp_mode) | ||
92 | return r; | ||
93 | } | ||
94 | |||
95 | -float32 HELPER(rsqrts_f32)(CPUARMState *env, float32 a, float32 b) | ||
96 | -{ | ||
97 | - float_status *s = &env->vfp.standard_fp_status; | ||
98 | - float32 product; | ||
99 | - if ((float32_is_infinity(a) && float32_is_zero_or_denormal(b)) || | ||
100 | - (float32_is_infinity(b) && float32_is_zero_or_denormal(a))) { | ||
101 | - if (!(float32_is_zero(a) || float32_is_zero(b))) { | ||
102 | - float_raise(float_flag_input_denormal, s); | ||
103 | - } | ||
104 | - return float32_one_point_five; | ||
105 | - } | ||
106 | - product = float32_mul(a, b, s); | ||
107 | - return float32_div(float32_sub(float32_three, product, s), float32_two, s); | ||
108 | -} | ||
109 | - | ||
110 | /* NEON helpers. */ | ||
111 | |||
112 | /* Constants 256 and 512 are used in some helpers; we avoid relying on | ||
113 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
114 | index XXXXXXX..XXXXXXX 100644 | ||
115 | --- a/target/arm/translate-neon.c.inc | ||
116 | +++ b/target/arm/translate-neon.c.inc | ||
117 | @@ -XXX,XX +XXX,XX @@ DO_3S_FP_GVEC(VMLS, gen_helper_gvec_fmls_s, gen_helper_gvec_fmls_h) | ||
118 | DO_3S_FP_GVEC(VFMA, gen_helper_gvec_vfma_s, gen_helper_gvec_vfma_h) | ||
119 | DO_3S_FP_GVEC(VFMS, gen_helper_gvec_vfms_s, gen_helper_gvec_vfms_h) | ||
120 | DO_3S_FP_GVEC(VRECPS, gen_helper_gvec_recps_nf_s, gen_helper_gvec_recps_nf_h) | ||
121 | +DO_3S_FP_GVEC(VRSQRTS, gen_helper_gvec_rsqrts_nf_s, gen_helper_gvec_rsqrts_nf_h) | ||
122 | |||
123 | WRAP_FP_GVEC(gen_VMAXNM_fp32_3s, FPST_STD, gen_helper_gvec_fmaxnum_s) | ||
124 | WRAP_FP_GVEC(gen_VMAXNM_fp16_3s, FPST_STD_F16, gen_helper_gvec_fmaxnum_h) | ||
125 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMINNM_fp_3s(DisasContext *s, arg_3same *a) | ||
126 | return do_3same(s, a, gen_VMINNM_fp32_3s); | ||
127 | } | ||
128 | |||
129 | -WRAP_ENV_FN(gen_VRSQRTS_tramp, gen_helper_rsqrts_f32) | ||
130 | - | ||
131 | -static void gen_VRSQRTS_fp_3s(unsigned vece, uint32_t rd_ofs, | ||
132 | - uint32_t rn_ofs, uint32_t rm_ofs, | ||
133 | - uint32_t oprsz, uint32_t maxsz) | ||
134 | -{ | ||
135 | - static const GVecGen3 ops = { .fni4 = gen_VRSQRTS_tramp }; | ||
136 | - tcg_gen_gvec_3(rd_ofs, rn_ofs, rm_ofs, oprsz, maxsz, &ops); | ||
137 | -} | ||
138 | - | ||
139 | -static bool trans_VRSQRTS_fp_3s(DisasContext *s, arg_3same *a) | ||
140 | -{ | ||
141 | - if (a->size != 0) { | ||
142 | - /* TODO fp16 support */ | ||
143 | - return false; | ||
144 | - } | ||
145 | - | ||
146 | - return do_3same(s, a, gen_VRSQRTS_fp_3s); | ||
147 | -} | ||
148 | - | ||
149 | static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn) | ||
150 | { | ||
151 | /* FP operations handled pairwise 32 bits at a time */ | ||
172 | -- | 152 | -- |
173 | 2.20.1 | 153 | 2.20.1 |
174 | 154 | ||
175 | 155 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | Convert the Neon pairwise fp ops to use a single gvic-style |
---|---|---|---|
2 | helper to do the full operation instead of one helper call | ||
3 | for each 32-bit part. This allows us to use the same | ||
4 | framework to implement the fp16. | ||
2 | 5 | ||
3 | This test boots Ubuntu Bionic on a OrangePi PC board. | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20200828183354.27913-36-peter.maydell@linaro.org | ||
9 | --- | ||
10 | target/arm/helper.h | 7 +++++ | ||
11 | target/arm/vec_helper.c | 45 +++++++++++++++++++++++++++++++++ | ||
12 | target/arm/translate-neon.c.inc | 42 ++++++++++++------------------ | ||
13 | 3 files changed, 68 insertions(+), 26 deletions(-) | ||
4 | 14 | ||
5 | As it requires 1GB of storage, and is slow, this test is disabled | 15 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
6 | on automatic CI testing. | ||
7 | |||
8 | It is useful for workstation testing. Currently Avocado timeouts too | ||
9 | quickly, so we can't run userland commands. | ||
10 | |||
11 | The kernel image and DeviceTree blob are built by the Armbian | ||
12 | project (based on Debian): | ||
13 | https://www.armbian.com/orange-pi-pc/ | ||
14 | |||
15 | The Ubuntu image is downloaded from: | ||
16 | https://dl.armbian.com/orangepipc/Bionic_current | ||
17 | |||
18 | This test can be run using: | ||
19 | |||
20 | $ AVOCADO_ALLOW_LARGE_STORAGE=yes \ | ||
21 | avocado --show=app,console run -t machine:orangepi-pc \ | ||
22 | tests/acceptance/boot_linux_console.py | ||
23 | console: U-Boot SPL 2019.04-armbian (Nov 18 2019 - 23:08:35 +0100) | ||
24 | console: DRAM: 1024 MiB | ||
25 | console: Failed to set core voltage! Can't set CPU frequency | ||
26 | console: Trying to boot from MMC1 | ||
27 | console: U-Boot 2019.04-armbian (Nov 18 2019 - 23:08:35 +0100) Allwinner Technology | ||
28 | console: CPU: Allwinner H3 (SUN8I 0000) | ||
29 | console: Model: Xunlong Orange Pi PC | ||
30 | console: DRAM: 1 GiB | ||
31 | console: MMC: mmc@1c0f000: 0 | ||
32 | [...] | ||
33 | console: Uncompressing Linux... done, booting the kernel. | ||
34 | console: Booting Linux on physical CPU 0x0 | ||
35 | console: Linux version 5.3.9-sunxi (root@builder) (gcc version 8.3.0 (GNU Toolchain for the A-profile Architecture 8.3-2019.03 (arm-rel-8.36))) #19.11.3 SMP Mon Nov 18 18:49:43 CET 2019 | ||
36 | console: CPU: ARMv7 Processor [410fc075] revision 5 (ARMv7), cr=50c5387d | ||
37 | console: CPU: div instructions available: patching division code | ||
38 | console: CPU: PIPT / VIPT nonaliasing data cache, VIPT aliasing instruction cache | ||
39 | console: OF: fdt: Machine model: Xunlong Orange Pi PC | ||
40 | [...] | ||
41 | console: EXT4-fs (mmcblk0p1): mounted filesystem with writeback data mode. Opts: (null) | ||
42 | console: done. | ||
43 | console: Begin: Running /scripts/local-bottom ... done. | ||
44 | console: Begin: Running /scripts/init-bottom ... done. | ||
45 | console: systemd[1]: systemd 237 running in system mode. (...) | ||
46 | console: systemd[1]: Detected architecture arm. | ||
47 | console: Welcome to Ubuntu 18.04.3 LTS! | ||
48 | console: systemd[1]: Set hostname to <orangepipc>. | ||
49 | |||
50 | Signed-off-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
51 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
52 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
53 | Tested-by: Alex Bennée <alex.bennee@linaro.org> | ||
54 | Message-id: 20200311221854.30370-17-nieklinnenbank@gmail.com | ||
55 | [NL: rename in commit message Raspbian to Armbian, remove vm.set_machine()] | ||
56 | [NL: changed test to boot from SD card via BootROM, added check for 7z] | ||
57 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
58 | --- | ||
59 | tests/acceptance/boot_linux_console.py | 48 ++++++++++++++++++++++++++ | ||
60 | 1 file changed, 48 insertions(+) | ||
61 | |||
62 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | ||
63 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
64 | --- a/tests/acceptance/boot_linux_console.py | 17 | --- a/target/arm/helper.h |
65 | +++ b/tests/acceptance/boot_linux_console.py | 18 | +++ b/target/arm/helper.h |
66 | @@ -XXX,XX +XXX,XX @@ from avocado_qemu import exec_command_and_wait_for_pattern | 19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fcmlas_idx, TCG_CALL_NO_RWG, |
67 | from avocado_qemu import wait_for_console_pattern | 20 | DEF_HELPER_FLAGS_5(gvec_fcmlad, TCG_CALL_NO_RWG, |
68 | from avocado.utils import process | 21 | void, ptr, ptr, ptr, ptr, i32) |
69 | from avocado.utils import archive | 22 | |
70 | +from avocado.utils.path import find_command, CmdNotFoundError | 23 | +DEF_HELPER_FLAGS_5(neon_paddh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
71 | 24 | +DEF_HELPER_FLAGS_5(neon_pmaxh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | |
72 | +P7ZIP_AVAILABLE = True | 25 | +DEF_HELPER_FLAGS_5(neon_pminh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
73 | +try: | 26 | +DEF_HELPER_FLAGS_5(neon_padds, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
74 | + find_command('7z') | 27 | +DEF_HELPER_FLAGS_5(neon_pmaxs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
75 | +except CmdNotFoundError: | 28 | +DEF_HELPER_FLAGS_5(neon_pmins, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
76 | + P7ZIP_AVAILABLE = False | ||
77 | |||
78 | class BootLinuxConsole(Test): | ||
79 | """ | ||
80 | @@ -XXX,XX +XXX,XX @@ class BootLinuxConsole(Test): | ||
81 | exec_command_and_wait_for_pattern(self, 'reboot', | ||
82 | 'reboot: Restarting system') | ||
83 | |||
84 | + @skipUnless(os.getenv('AVOCADO_ALLOW_LARGE_STORAGE'), 'storage limited') | ||
85 | + @skipUnless(P7ZIP_AVAILABLE, '7z not installed') | ||
86 | + def test_arm_orangepi_bionic(self): | ||
87 | + """ | ||
88 | + :avocado: tags=arch:arm | ||
89 | + :avocado: tags=machine:orangepi-pc | ||
90 | + """ | ||
91 | + | 29 | + |
92 | + # This test download a 196MB compressed image and expand it to 932MB... | 30 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
93 | + image_url = ('https://dl.armbian.com/orangepipc/archive/' | 31 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
94 | + 'Armbian_19.11.3_Orangepipc_bionic_current_5.3.9.7z') | 32 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
95 | + image_hash = '196a8ffb72b0123d92cea4a070894813d305c71e' | 33 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
96 | + image_path_7z = self.fetch_asset(image_url, asset_hash=image_hash) | 34 | index XXXXXXX..XXXXXXX 100644 |
97 | + image_name = 'Armbian_19.11.3_Orangepipc_bionic_current_5.3.9.img' | 35 | --- a/target/arm/vec_helper.c |
98 | + image_path = os.path.join(self.workdir, image_name) | 36 | +++ b/target/arm/vec_helper.c |
99 | + process.run("7z e -o%s %s" % (self.workdir, image_path_7z)) | 37 | @@ -XXX,XX +XXX,XX @@ DO_ABA(gvec_uaba_s, uint32_t) |
38 | DO_ABA(gvec_uaba_d, uint64_t) | ||
39 | |||
40 | #undef DO_ABA | ||
100 | + | 41 | + |
101 | + self.vm.set_console() | 42 | +#define DO_NEON_PAIRWISE(NAME, OP) \ |
102 | + self.vm.add_args('-drive', 'file=' + image_path + ',if=sd,format=raw', | 43 | + void HELPER(NAME##s)(void *vd, void *vn, void *vm, \ |
103 | + '-nic', 'user', | 44 | + void *stat, uint32_t oprsz) \ |
104 | + '-no-reboot') | 45 | + { \ |
105 | + self.vm.launch() | 46 | + float_status *fpst = stat; \ |
47 | + float32 *d = vd; \ | ||
48 | + float32 *n = vn; \ | ||
49 | + float32 *m = vm; \ | ||
50 | + float32 r0, r1; \ | ||
51 | + \ | ||
52 | + /* Read all inputs before writing outputs in case vm == vd */ \ | ||
53 | + r0 = float32_##OP(n[H4(0)], n[H4(1)], fpst); \ | ||
54 | + r1 = float32_##OP(m[H4(0)], m[H4(1)], fpst); \ | ||
55 | + \ | ||
56 | + d[H4(0)] = r0; \ | ||
57 | + d[H4(1)] = r1; \ | ||
58 | + } \ | ||
59 | + \ | ||
60 | + void HELPER(NAME##h)(void *vd, void *vn, void *vm, \ | ||
61 | + void *stat, uint32_t oprsz) \ | ||
62 | + { \ | ||
63 | + float_status *fpst = stat; \ | ||
64 | + float16 *d = vd; \ | ||
65 | + float16 *n = vn; \ | ||
66 | + float16 *m = vm; \ | ||
67 | + float16 r0, r1, r2, r3; \ | ||
68 | + \ | ||
69 | + /* Read all inputs before writing outputs in case vm == vd */ \ | ||
70 | + r0 = float16_##OP(n[H2(0)], n[H2(1)], fpst); \ | ||
71 | + r1 = float16_##OP(n[H2(2)], n[H2(3)], fpst); \ | ||
72 | + r2 = float16_##OP(m[H2(0)], m[H2(1)], fpst); \ | ||
73 | + r3 = float16_##OP(m[H2(2)], m[H2(3)], fpst); \ | ||
74 | + \ | ||
75 | + d[H4(0)] = r0; \ | ||
76 | + d[H4(1)] = r1; \ | ||
77 | + d[H4(2)] = r2; \ | ||
78 | + d[H4(3)] = r3; \ | ||
79 | + } | ||
106 | + | 80 | + |
107 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | 81 | +DO_NEON_PAIRWISE(neon_padd, add) |
108 | + 'console=ttyS0,115200 ' | 82 | +DO_NEON_PAIRWISE(neon_pmax, max) |
109 | + 'loglevel=7 ' | 83 | +DO_NEON_PAIRWISE(neon_pmin, min) |
110 | + 'nosmp ' | ||
111 | + 'systemd.default_timeout_start_sec=9000 ' | ||
112 | + 'systemd.mask=armbian-zram-config.service ' | ||
113 | + 'systemd.mask=armbian-ramlog.service') | ||
114 | + | 84 | + |
115 | + self.wait_for_console_pattern('U-Boot SPL') | 85 | +#undef DO_NEON_PAIRWISE |
116 | + self.wait_for_console_pattern('Autoboot in ') | 86 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
117 | + exec_command_and_wait_for_pattern(self, ' ', '=>') | 87 | index XXXXXXX..XXXXXXX 100644 |
118 | + exec_command_and_wait_for_pattern(self, "setenv extraargs '" + | 88 | --- a/target/arm/translate-neon.c.inc |
119 | + kernel_command_line + "'", '=>') | 89 | +++ b/target/arm/translate-neon.c.inc |
120 | + exec_command_and_wait_for_pattern(self, 'boot', 'Starting kernel ...'); | 90 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMINNM_fp_3s(DisasContext *s, arg_3same *a) |
121 | + | 91 | return do_3same(s, a, gen_VMINNM_fp32_3s); |
122 | + self.wait_for_console_pattern('systemd[1]: Set hostname ' + | 92 | } |
123 | + 'to <orangepipc>') | 93 | |
124 | + self.wait_for_console_pattern('Starting Load Kernel Modules...') | 94 | -static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn) |
125 | + | 95 | +static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, |
126 | def test_s390x_s390_ccw_virtio(self): | 96 | + gen_helper_gvec_3_ptr *fn) |
127 | """ | 97 | { |
128 | :avocado: tags=arch:s390x | 98 | - /* FP operations handled pairwise 32 bits at a time */ |
99 | - TCGv_i32 tmp, tmp2, tmp3; | ||
100 | + /* FP pairwise operations */ | ||
101 | TCGv_ptr fpstatus; | ||
102 | |||
103 | if (!arm_dc_feature(s, ARM_FEATURE_NEON)) { | ||
104 | @@ -XXX,XX +XXX,XX @@ static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn) | ||
105 | |||
106 | assert(a->q == 0); /* enforced by decode patterns */ | ||
107 | |||
108 | - /* | ||
109 | - * Note that we have to be careful not to clobber the source operands | ||
110 | - * in the "vm == vd" case by storing the result of the first pass too | ||
111 | - * early. Since Q is 0 there are always just two passes, so instead | ||
112 | - * of a complicated loop over each pass we just unroll. | ||
113 | - */ | ||
114 | - fpstatus = fpstatus_ptr(FPST_STD); | ||
115 | - tmp = neon_load_reg(a->vn, 0); | ||
116 | - tmp2 = neon_load_reg(a->vn, 1); | ||
117 | - fn(tmp, tmp, tmp2, fpstatus); | ||
118 | - tcg_temp_free_i32(tmp2); | ||
119 | |||
120 | - tmp3 = neon_load_reg(a->vm, 0); | ||
121 | - tmp2 = neon_load_reg(a->vm, 1); | ||
122 | - fn(tmp3, tmp3, tmp2, fpstatus); | ||
123 | - tcg_temp_free_i32(tmp2); | ||
124 | + fpstatus = fpstatus_ptr(a->size != 0 ? FPST_STD_F16 : FPST_STD); | ||
125 | + tcg_gen_gvec_3_ptr(vfp_reg_offset(1, a->vd), | ||
126 | + vfp_reg_offset(1, a->vn), | ||
127 | + vfp_reg_offset(1, a->vm), | ||
128 | + fpstatus, 8, 8, 0, fn); | ||
129 | tcg_temp_free_ptr(fpstatus); | ||
130 | |||
131 | - neon_store_reg(a->vd, 0, tmp); | ||
132 | - neon_store_reg(a->vd, 1, tmp3); | ||
133 | return true; | ||
134 | } | ||
135 | |||
136 | @@ -XXX,XX +XXX,XX @@ static bool do_3same_fp_pair(DisasContext *s, arg_3same *a, VFPGen3OpSPFn *fn) | ||
137 | static bool trans_##INSN##_fp_3s(DisasContext *s, arg_3same *a) \ | ||
138 | { \ | ||
139 | if (a->size != 0) { \ | ||
140 | - /* TODO fp16 support */ \ | ||
141 | - return false; \ | ||
142 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { \ | ||
143 | + return false; \ | ||
144 | + } \ | ||
145 | + return do_3same_fp_pair(s, a, FUNC##h); \ | ||
146 | } \ | ||
147 | - return do_3same_fp_pair(s, a, FUNC); \ | ||
148 | + return do_3same_fp_pair(s, a, FUNC##s); \ | ||
149 | } | ||
150 | |||
151 | -DO_3S_FP_PAIR(VPADD, gen_helper_vfp_adds) | ||
152 | -DO_3S_FP_PAIR(VPMAX, gen_helper_vfp_maxs) | ||
153 | -DO_3S_FP_PAIR(VPMIN, gen_helper_vfp_mins) | ||
154 | +DO_3S_FP_PAIR(VPADD, gen_helper_neon_padd) | ||
155 | +DO_3S_FP_PAIR(VPMAX, gen_helper_neon_pmax) | ||
156 | +DO_3S_FP_PAIR(VPMIN, gen_helper_neon_pmin) | ||
157 | |||
158 | static bool do_vector_2sh(DisasContext *s, arg_2reg_shift *a, GVecGen2iFn *fn) | ||
159 | { | ||
129 | -- | 160 | -- |
130 | 2.20.1 | 161 | 2.20.1 |
131 | 162 | ||
132 | 163 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | Convert the Neon float-integer VCVT insns to gvec, and use this |
---|---|---|---|
2 | to implement fp16 support for them. | ||
2 | 3 | ||
3 | The Clock Control Unit is responsible for clock signal generation, | 4 | Note that unlike the VFP int<->fp16 VCVT insns we converted |
4 | configuration and distribution in the Allwinner H3 System on Chip. | 5 | earlier and which convert to/from a 32-bit integer, these |
5 | This commit adds support for the Clock Control Unit which emulates | 6 | Neon insns convert to/from 16-bit integers. So we can use |
6 | a simple read/write register interface. | 7 | the existing vfp conversion helpers for the f32<->u32/i32 |
8 | case but need to provide our own for f16<->u16/i16. | ||
7 | 9 | ||
8 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
9 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
10 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
11 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
12 | Message-id: 20200311221854.30370-4-nieklinnenbank@gmail.com | ||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
12 | Message-id: 20200828183354.27913-37-peter.maydell@linaro.org | ||
14 | --- | 13 | --- |
15 | hw/misc/Makefile.objs | 1 + | 14 | target/arm/helper.h | 9 +++++++++ |
16 | include/hw/arm/allwinner-h3.h | 3 + | 15 | target/arm/vec_helper.c | 29 +++++++++++++++++++++++++++++ |
17 | include/hw/misc/allwinner-h3-ccu.h | 66 ++++++++ | 16 | target/arm/translate-neon.c.inc | 15 ++++----------- |
18 | hw/arm/allwinner-h3.c | 9 +- | 17 | 3 files changed, 42 insertions(+), 11 deletions(-) |
19 | hw/misc/allwinner-h3-ccu.c | 242 +++++++++++++++++++++++++++++ | ||
20 | 5 files changed, 320 insertions(+), 1 deletion(-) | ||
21 | create mode 100644 include/hw/misc/allwinner-h3-ccu.h | ||
22 | create mode 100644 hw/misc/allwinner-h3-ccu.c | ||
23 | 18 | ||
24 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | 19 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
25 | index XXXXXXX..XXXXXXX 100644 | 20 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/hw/misc/Makefile.objs | 21 | --- a/target/arm/helper.h |
27 | +++ b/hw/misc/Makefile.objs | 22 | +++ b/target/arm/helper.h |
28 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_MACIO) += macio/ | 23 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(neon_padds, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
29 | 24 | DEF_HELPER_FLAGS_5(neon_pmaxs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) | |
30 | common-obj-$(CONFIG_IVSHMEM_DEVICE) += ivshmem.o | 25 | DEF_HELPER_FLAGS_5(neon_pmins, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, ptr, i32) |
31 | 26 | ||
32 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-ccu.o | 27 | +DEF_HELPER_FLAGS_4(gvec_sstoh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
33 | common-obj-$(CONFIG_REALVIEW) += arm_sysctl.o | 28 | +DEF_HELPER_FLAGS_4(gvec_sitos, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
34 | common-obj-$(CONFIG_NSERIES) += cbus.o | 29 | +DEF_HELPER_FLAGS_4(gvec_ustoh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
35 | common-obj-$(CONFIG_ECCMEMCTL) += eccmemctl.o | 30 | +DEF_HELPER_FLAGS_4(gvec_uitos, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
36 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | 31 | +DEF_HELPER_FLAGS_4(gvec_tosszh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
32 | +DEF_HELPER_FLAGS_4(gvec_tosizs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
33 | +DEF_HELPER_FLAGS_4(gvec_touszh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
34 | +DEF_HELPER_FLAGS_4(gvec_touizs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
35 | + | ||
36 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
37 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
38 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
39 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
37 | index XXXXXXX..XXXXXXX 100644 | 40 | index XXXXXXX..XXXXXXX 100644 |
38 | --- a/include/hw/arm/allwinner-h3.h | 41 | --- a/target/arm/vec_helper.c |
39 | +++ b/include/hw/arm/allwinner-h3.h | 42 | +++ b/target/arm/vec_helper.c |
40 | @@ -XXX,XX +XXX,XX @@ | 43 | @@ -XXX,XX +XXX,XX @@ static uint32_t float32_acgt(float32 op1, float32 op2, float_status *stat) |
41 | #include "hw/arm/boot.h" | 44 | return -float32_lt(float32_abs(op2), float32_abs(op1), stat); |
42 | #include "hw/timer/allwinner-a10-pit.h" | ||
43 | #include "hw/intc/arm_gic.h" | ||
44 | +#include "hw/misc/allwinner-h3-ccu.h" | ||
45 | #include "target/arm/cpu.h" | ||
46 | |||
47 | /** | ||
48 | @@ -XXX,XX +XXX,XX @@ enum { | ||
49 | AW_H3_SRAM_A1, | ||
50 | AW_H3_SRAM_A2, | ||
51 | AW_H3_SRAM_C, | ||
52 | + AW_H3_CCU, | ||
53 | AW_H3_PIT, | ||
54 | AW_H3_UART0, | ||
55 | AW_H3_UART1, | ||
56 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
57 | ARMCPU cpus[AW_H3_NUM_CPUS]; | ||
58 | const hwaddr *memmap; | ||
59 | AwA10PITState timer; | ||
60 | + AwH3ClockCtlState ccu; | ||
61 | GICState gic; | ||
62 | MemoryRegion sram_a1; | ||
63 | MemoryRegion sram_a2; | ||
64 | diff --git a/include/hw/misc/allwinner-h3-ccu.h b/include/hw/misc/allwinner-h3-ccu.h | ||
65 | new file mode 100644 | ||
66 | index XXXXXXX..XXXXXXX | ||
67 | --- /dev/null | ||
68 | +++ b/include/hw/misc/allwinner-h3-ccu.h | ||
69 | @@ -XXX,XX +XXX,XX @@ | ||
70 | +/* | ||
71 | + * Allwinner H3 Clock Control Unit emulation | ||
72 | + * | ||
73 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
74 | + * | ||
75 | + * This program is free software: you can redistribute it and/or modify | ||
76 | + * it under the terms of the GNU General Public License as published by | ||
77 | + * the Free Software Foundation, either version 2 of the License, or | ||
78 | + * (at your option) any later version. | ||
79 | + * | ||
80 | + * This program is distributed in the hope that it will be useful, | ||
81 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
82 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
83 | + * GNU General Public License for more details. | ||
84 | + * | ||
85 | + * You should have received a copy of the GNU General Public License | ||
86 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
87 | + */ | ||
88 | + | ||
89 | +#ifndef HW_MISC_ALLWINNER_H3_CCU_H | ||
90 | +#define HW_MISC_ALLWINNER_H3_CCU_H | ||
91 | + | ||
92 | +#include "qom/object.h" | ||
93 | +#include "hw/sysbus.h" | ||
94 | + | ||
95 | +/** | ||
96 | + * @name Constants | ||
97 | + * @{ | ||
98 | + */ | ||
99 | + | ||
100 | +/** Size of register I/O address space used by CCU device */ | ||
101 | +#define AW_H3_CCU_IOSIZE (0x400) | ||
102 | + | ||
103 | +/** Total number of known registers */ | ||
104 | +#define AW_H3_CCU_REGS_NUM (AW_H3_CCU_IOSIZE / sizeof(uint32_t)) | ||
105 | + | ||
106 | +/** @} */ | ||
107 | + | ||
108 | +/** | ||
109 | + * @name Object model | ||
110 | + * @{ | ||
111 | + */ | ||
112 | + | ||
113 | +#define TYPE_AW_H3_CCU "allwinner-h3-ccu" | ||
114 | +#define AW_H3_CCU(obj) \ | ||
115 | + OBJECT_CHECK(AwH3ClockCtlState, (obj), TYPE_AW_H3_CCU) | ||
116 | + | ||
117 | +/** @} */ | ||
118 | + | ||
119 | +/** | ||
120 | + * Allwinner H3 CCU object instance state. | ||
121 | + */ | ||
122 | +typedef struct AwH3ClockCtlState { | ||
123 | + /*< private >*/ | ||
124 | + SysBusDevice parent_obj; | ||
125 | + /*< public >*/ | ||
126 | + | ||
127 | + /** Maps I/O registers in physical memory */ | ||
128 | + MemoryRegion iomem; | ||
129 | + | ||
130 | + /** Array of hardware registers */ | ||
131 | + uint32_t regs[AW_H3_CCU_REGS_NUM]; | ||
132 | + | ||
133 | +} AwH3ClockCtlState; | ||
134 | + | ||
135 | +#endif /* HW_MISC_ALLWINNER_H3_CCU_H */ | ||
136 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
137 | index XXXXXXX..XXXXXXX 100644 | ||
138 | --- a/hw/arm/allwinner-h3.c | ||
139 | +++ b/hw/arm/allwinner-h3.c | ||
140 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
141 | [AW_H3_SRAM_A1] = 0x00000000, | ||
142 | [AW_H3_SRAM_A2] = 0x00044000, | ||
143 | [AW_H3_SRAM_C] = 0x00010000, | ||
144 | + [AW_H3_CCU] = 0x01c20000, | ||
145 | [AW_H3_PIT] = 0x01c20c00, | ||
146 | [AW_H3_UART0] = 0x01c28000, | ||
147 | [AW_H3_UART1] = 0x01c28400, | ||
148 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
149 | { "usb2-phy", 0x01c1c000, 4 * KiB }, | ||
150 | { "usb3-phy", 0x01c1d000, 4 * KiB }, | ||
151 | { "smc", 0x01c1e000, 4 * KiB }, | ||
152 | - { "ccu", 0x01c20000, 1 * KiB }, | ||
153 | { "pio", 0x01c20800, 1 * KiB }, | ||
154 | { "owa", 0x01c21000, 1 * KiB }, | ||
155 | { "pwm", 0x01c21400, 1 * KiB }, | ||
156 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
157 | "clk0-freq", &error_abort); | ||
158 | object_property_add_alias(obj, "clk1-freq", OBJECT(&s->timer), | ||
159 | "clk1-freq", &error_abort); | ||
160 | + | ||
161 | + sysbus_init_child_obj(obj, "ccu", &s->ccu, sizeof(s->ccu), | ||
162 | + TYPE_AW_H3_CCU); | ||
163 | } | 45 | } |
164 | 46 | ||
165 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | 47 | +static int16_t vfp_tosszh(float16 x, void *fpstp) |
166 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
167 | memory_region_add_subregion(get_system_memory(), s->memmap[AW_H3_SRAM_C], | ||
168 | &s->sram_c); | ||
169 | |||
170 | + /* Clock Control Unit */ | ||
171 | + qdev_init_nofail(DEVICE(&s->ccu)); | ||
172 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->ccu), 0, s->memmap[AW_H3_CCU]); | ||
173 | + | ||
174 | /* UART0. For future clocktree API: All UARTS are connected to APB2_CLK. */ | ||
175 | serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART0], 2, | ||
176 | qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART0), | ||
177 | diff --git a/hw/misc/allwinner-h3-ccu.c b/hw/misc/allwinner-h3-ccu.c | ||
178 | new file mode 100644 | ||
179 | index XXXXXXX..XXXXXXX | ||
180 | --- /dev/null | ||
181 | +++ b/hw/misc/allwinner-h3-ccu.c | ||
182 | @@ -XXX,XX +XXX,XX @@ | ||
183 | +/* | ||
184 | + * Allwinner H3 Clock Control Unit emulation | ||
185 | + * | ||
186 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
187 | + * | ||
188 | + * This program is free software: you can redistribute it and/or modify | ||
189 | + * it under the terms of the GNU General Public License as published by | ||
190 | + * the Free Software Foundation, either version 2 of the License, or | ||
191 | + * (at your option) any later version. | ||
192 | + * | ||
193 | + * This program is distributed in the hope that it will be useful, | ||
194 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
195 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
196 | + * GNU General Public License for more details. | ||
197 | + * | ||
198 | + * You should have received a copy of the GNU General Public License | ||
199 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
200 | + */ | ||
201 | + | ||
202 | +#include "qemu/osdep.h" | ||
203 | +#include "qemu/units.h" | ||
204 | +#include "hw/sysbus.h" | ||
205 | +#include "migration/vmstate.h" | ||
206 | +#include "qemu/log.h" | ||
207 | +#include "qemu/module.h" | ||
208 | +#include "hw/misc/allwinner-h3-ccu.h" | ||
209 | + | ||
210 | +/* CCU register offsets */ | ||
211 | +enum { | ||
212 | + REG_PLL_CPUX = 0x0000, /* PLL CPUX Control */ | ||
213 | + REG_PLL_AUDIO = 0x0008, /* PLL Audio Control */ | ||
214 | + REG_PLL_VIDEO = 0x0010, /* PLL Video Control */ | ||
215 | + REG_PLL_VE = 0x0018, /* PLL VE Control */ | ||
216 | + REG_PLL_DDR = 0x0020, /* PLL DDR Control */ | ||
217 | + REG_PLL_PERIPH0 = 0x0028, /* PLL Peripherals 0 Control */ | ||
218 | + REG_PLL_GPU = 0x0038, /* PLL GPU Control */ | ||
219 | + REG_PLL_PERIPH1 = 0x0044, /* PLL Peripherals 1 Control */ | ||
220 | + REG_PLL_DE = 0x0048, /* PLL Display Engine Control */ | ||
221 | + REG_CPUX_AXI = 0x0050, /* CPUX/AXI Configuration */ | ||
222 | + REG_APB1 = 0x0054, /* ARM Peripheral Bus 1 Config */ | ||
223 | + REG_APB2 = 0x0058, /* ARM Peripheral Bus 2 Config */ | ||
224 | + REG_DRAM_CFG = 0x00F4, /* DRAM Configuration */ | ||
225 | + REG_MBUS = 0x00FC, /* MBUS Reset */ | ||
226 | + REG_PLL_TIME0 = 0x0200, /* PLL Stable Time 0 */ | ||
227 | + REG_PLL_TIME1 = 0x0204, /* PLL Stable Time 1 */ | ||
228 | + REG_PLL_CPUX_BIAS = 0x0220, /* PLL CPUX Bias */ | ||
229 | + REG_PLL_AUDIO_BIAS = 0x0224, /* PLL Audio Bias */ | ||
230 | + REG_PLL_VIDEO_BIAS = 0x0228, /* PLL Video Bias */ | ||
231 | + REG_PLL_VE_BIAS = 0x022C, /* PLL VE Bias */ | ||
232 | + REG_PLL_DDR_BIAS = 0x0230, /* PLL DDR Bias */ | ||
233 | + REG_PLL_PERIPH0_BIAS = 0x0234, /* PLL Peripherals 0 Bias */ | ||
234 | + REG_PLL_GPU_BIAS = 0x023C, /* PLL GPU Bias */ | ||
235 | + REG_PLL_PERIPH1_BIAS = 0x0244, /* PLL Peripherals 1 Bias */ | ||
236 | + REG_PLL_DE_BIAS = 0x0248, /* PLL Display Engine Bias */ | ||
237 | + REG_PLL_CPUX_TUNING = 0x0250, /* PLL CPUX Tuning */ | ||
238 | + REG_PLL_DDR_TUNING = 0x0260, /* PLL DDR Tuning */ | ||
239 | +}; | ||
240 | + | ||
241 | +#define REG_INDEX(offset) (offset / sizeof(uint32_t)) | ||
242 | + | ||
243 | +/* CCU register flags */ | ||
244 | +enum { | ||
245 | + REG_DRAM_CFG_UPDATE = (1 << 16), | ||
246 | +}; | ||
247 | + | ||
248 | +enum { | ||
249 | + REG_PLL_ENABLE = (1 << 31), | ||
250 | + REG_PLL_LOCK = (1 << 28), | ||
251 | +}; | ||
252 | + | ||
253 | + | ||
254 | +/* CCU register reset values */ | ||
255 | +enum { | ||
256 | + REG_PLL_CPUX_RST = 0x00001000, | ||
257 | + REG_PLL_AUDIO_RST = 0x00035514, | ||
258 | + REG_PLL_VIDEO_RST = 0x03006207, | ||
259 | + REG_PLL_VE_RST = 0x03006207, | ||
260 | + REG_PLL_DDR_RST = 0x00001000, | ||
261 | + REG_PLL_PERIPH0_RST = 0x00041811, | ||
262 | + REG_PLL_GPU_RST = 0x03006207, | ||
263 | + REG_PLL_PERIPH1_RST = 0x00041811, | ||
264 | + REG_PLL_DE_RST = 0x03006207, | ||
265 | + REG_CPUX_AXI_RST = 0x00010000, | ||
266 | + REG_APB1_RST = 0x00001010, | ||
267 | + REG_APB2_RST = 0x01000000, | ||
268 | + REG_DRAM_CFG_RST = 0x00000000, | ||
269 | + REG_MBUS_RST = 0x80000000, | ||
270 | + REG_PLL_TIME0_RST = 0x000000FF, | ||
271 | + REG_PLL_TIME1_RST = 0x000000FF, | ||
272 | + REG_PLL_CPUX_BIAS_RST = 0x08100200, | ||
273 | + REG_PLL_AUDIO_BIAS_RST = 0x10100000, | ||
274 | + REG_PLL_VIDEO_BIAS_RST = 0x10100000, | ||
275 | + REG_PLL_VE_BIAS_RST = 0x10100000, | ||
276 | + REG_PLL_DDR_BIAS_RST = 0x81104000, | ||
277 | + REG_PLL_PERIPH0_BIAS_RST = 0x10100010, | ||
278 | + REG_PLL_GPU_BIAS_RST = 0x10100000, | ||
279 | + REG_PLL_PERIPH1_BIAS_RST = 0x10100010, | ||
280 | + REG_PLL_DE_BIAS_RST = 0x10100000, | ||
281 | + REG_PLL_CPUX_TUNING_RST = 0x0A101000, | ||
282 | + REG_PLL_DDR_TUNING_RST = 0x14880000, | ||
283 | +}; | ||
284 | + | ||
285 | +static uint64_t allwinner_h3_ccu_read(void *opaque, hwaddr offset, | ||
286 | + unsigned size) | ||
287 | +{ | 48 | +{ |
288 | + const AwH3ClockCtlState *s = AW_H3_CCU(opaque); | 49 | + float_status *fpst = fpstp; |
289 | + const uint32_t idx = REG_INDEX(offset); | 50 | + if (float16_is_any_nan(x)) { |
290 | + | 51 | + float_raise(float_flag_invalid, fpst); |
291 | + switch (offset) { | ||
292 | + case 0x308 ... AW_H3_CCU_IOSIZE: | ||
293 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
294 | + __func__, (uint32_t)offset); | ||
295 | + return 0; | 52 | + return 0; |
296 | + } | 53 | + } |
297 | + | 54 | + return float16_to_int16_round_to_zero(x, fpst); |
298 | + return s->regs[idx]; | ||
299 | +} | 55 | +} |
300 | + | 56 | + |
301 | +static void allwinner_h3_ccu_write(void *opaque, hwaddr offset, | 57 | +static uint16_t vfp_touszh(float16 x, void *fpstp) |
302 | + uint64_t val, unsigned size) | ||
303 | +{ | 58 | +{ |
304 | + AwH3ClockCtlState *s = AW_H3_CCU(opaque); | 59 | + float_status *fpst = fpstp; |
305 | + const uint32_t idx = REG_INDEX(offset); | 60 | + if (float16_is_any_nan(x)) { |
306 | + | 61 | + float_raise(float_flag_invalid, fpst); |
307 | + switch (offset) { | 62 | + return 0; |
308 | + case REG_DRAM_CFG: /* DRAM Configuration */ | ||
309 | + val &= ~REG_DRAM_CFG_UPDATE; | ||
310 | + break; | ||
311 | + case REG_PLL_CPUX: /* PLL CPUX Control */ | ||
312 | + case REG_PLL_AUDIO: /* PLL Audio Control */ | ||
313 | + case REG_PLL_VIDEO: /* PLL Video Control */ | ||
314 | + case REG_PLL_VE: /* PLL VE Control */ | ||
315 | + case REG_PLL_DDR: /* PLL DDR Control */ | ||
316 | + case REG_PLL_PERIPH0: /* PLL Peripherals 0 Control */ | ||
317 | + case REG_PLL_GPU: /* PLL GPU Control */ | ||
318 | + case REG_PLL_PERIPH1: /* PLL Peripherals 1 Control */ | ||
319 | + case REG_PLL_DE: /* PLL Display Engine Control */ | ||
320 | + if (val & REG_PLL_ENABLE) { | ||
321 | + val |= REG_PLL_LOCK; | ||
322 | + } | ||
323 | + break; | ||
324 | + case 0x308 ... AW_H3_CCU_IOSIZE: | ||
325 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
326 | + __func__, (uint32_t)offset); | ||
327 | + break; | ||
328 | + default: | ||
329 | + qemu_log_mask(LOG_UNIMP, "%s: unimplemented write offset 0x%04x\n", | ||
330 | + __func__, (uint32_t)offset); | ||
331 | + break; | ||
332 | + } | 63 | + } |
333 | + | 64 | + return float16_to_uint16_round_to_zero(x, fpst); |
334 | + s->regs[idx] = (uint32_t) val; | ||
335 | +} | 65 | +} |
336 | + | 66 | + |
337 | +static const MemoryRegionOps allwinner_h3_ccu_ops = { | 67 | #define DO_2OP(NAME, FUNC, TYPE) \ |
338 | + .read = allwinner_h3_ccu_read, | 68 | void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ |
339 | + .write = allwinner_h3_ccu_write, | 69 | { \ |
340 | + .endianness = DEVICE_NATIVE_ENDIAN, | 70 | @@ -XXX,XX +XXX,XX @@ DO_2OP(gvec_frsqrte_h, helper_rsqrte_f16, float16) |
341 | + .valid = { | 71 | DO_2OP(gvec_frsqrte_s, helper_rsqrte_f32, float32) |
342 | + .min_access_size = 4, | 72 | DO_2OP(gvec_frsqrte_d, helper_rsqrte_f64, float64) |
343 | + .max_access_size = 4, | 73 | |
344 | + }, | 74 | +DO_2OP(gvec_sitos, helper_vfp_sitos, int32_t) |
345 | + .impl.min_access_size = 4, | 75 | +DO_2OP(gvec_uitos, helper_vfp_uitos, uint32_t) |
346 | +}; | 76 | +DO_2OP(gvec_tosizs, helper_vfp_tosizs, float32) |
77 | +DO_2OP(gvec_touizs, helper_vfp_touizs, float32) | ||
78 | +DO_2OP(gvec_sstoh, int16_to_float16, int16_t) | ||
79 | +DO_2OP(gvec_ustoh, uint16_to_float16, uint16_t) | ||
80 | +DO_2OP(gvec_tosszh, vfp_tosszh, float16) | ||
81 | +DO_2OP(gvec_touszh, vfp_touszh, float16) | ||
347 | + | 82 | + |
348 | +static void allwinner_h3_ccu_reset(DeviceState *dev) | 83 | #define WRAP_CMP0_FWD(FN, CMPOP, TYPE) \ |
349 | +{ | 84 | static TYPE TYPE##_##FN##0(TYPE op, float_status *stat) \ |
350 | + AwH3ClockCtlState *s = AW_H3_CCU(dev); | 85 | { \ |
351 | + | 86 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
352 | + /* Set default values for registers */ | 87 | index XXXXXXX..XXXXXXX 100644 |
353 | + s->regs[REG_INDEX(REG_PLL_CPUX)] = REG_PLL_CPUX_RST; | 88 | --- a/target/arm/translate-neon.c.inc |
354 | + s->regs[REG_INDEX(REG_PLL_AUDIO)] = REG_PLL_AUDIO_RST; | 89 | +++ b/target/arm/translate-neon.c.inc |
355 | + s->regs[REG_INDEX(REG_PLL_VIDEO)] = REG_PLL_VIDEO_RST; | 90 | @@ -XXX,XX +XXX,XX @@ static bool do_2misc_fp(DisasContext *s, arg_2misc *a, |
356 | + s->regs[REG_INDEX(REG_PLL_VE)] = REG_PLL_VE_RST; | 91 | return true; |
357 | + s->regs[REG_INDEX(REG_PLL_DDR)] = REG_PLL_DDR_RST; | 92 | } |
358 | + s->regs[REG_INDEX(REG_PLL_PERIPH0)] = REG_PLL_PERIPH0_RST; | 93 | |
359 | + s->regs[REG_INDEX(REG_PLL_GPU)] = REG_PLL_GPU_RST; | 94 | -#define DO_2MISC_FP(INSN, FUNC) \ |
360 | + s->regs[REG_INDEX(REG_PLL_PERIPH1)] = REG_PLL_PERIPH1_RST; | 95 | - static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ |
361 | + s->regs[REG_INDEX(REG_PLL_DE)] = REG_PLL_DE_RST; | 96 | - { \ |
362 | + s->regs[REG_INDEX(REG_CPUX_AXI)] = REG_CPUX_AXI_RST; | 97 | - return do_2misc_fp(s, a, FUNC); \ |
363 | + s->regs[REG_INDEX(REG_APB1)] = REG_APB1_RST; | 98 | - } |
364 | + s->regs[REG_INDEX(REG_APB2)] = REG_APB2_RST; | 99 | - |
365 | + s->regs[REG_INDEX(REG_DRAM_CFG)] = REG_DRAM_CFG_RST; | 100 | -DO_2MISC_FP(VCVT_FS, gen_helper_vfp_sitos) |
366 | + s->regs[REG_INDEX(REG_MBUS)] = REG_MBUS_RST; | 101 | -DO_2MISC_FP(VCVT_FU, gen_helper_vfp_uitos) |
367 | + s->regs[REG_INDEX(REG_PLL_TIME0)] = REG_PLL_TIME0_RST; | 102 | -DO_2MISC_FP(VCVT_SF, gen_helper_vfp_tosizs) |
368 | + s->regs[REG_INDEX(REG_PLL_TIME1)] = REG_PLL_TIME1_RST; | 103 | -DO_2MISC_FP(VCVT_UF, gen_helper_vfp_touizs) |
369 | + s->regs[REG_INDEX(REG_PLL_CPUX_BIAS)] = REG_PLL_CPUX_BIAS_RST; | 104 | - |
370 | + s->regs[REG_INDEX(REG_PLL_AUDIO_BIAS)] = REG_PLL_AUDIO_BIAS_RST; | 105 | #define DO_2MISC_FP_VEC(INSN, HFUNC, SFUNC) \ |
371 | + s->regs[REG_INDEX(REG_PLL_VIDEO_BIAS)] = REG_PLL_VIDEO_BIAS_RST; | 106 | static void gen_##INSN(unsigned vece, uint32_t rd_ofs, \ |
372 | + s->regs[REG_INDEX(REG_PLL_VE_BIAS)] = REG_PLL_VE_BIAS_RST; | 107 | uint32_t rm_ofs, \ |
373 | + s->regs[REG_INDEX(REG_PLL_DDR_BIAS)] = REG_PLL_DDR_BIAS_RST; | 108 | @@ -XXX,XX +XXX,XX @@ DO_2MISC_FP_VEC(VCGE0_F, gen_helper_gvec_fcge0_h, gen_helper_gvec_fcge0_s) |
374 | + s->regs[REG_INDEX(REG_PLL_PERIPH0_BIAS)] = REG_PLL_PERIPH0_BIAS_RST; | 109 | DO_2MISC_FP_VEC(VCEQ0_F, gen_helper_gvec_fceq0_h, gen_helper_gvec_fceq0_s) |
375 | + s->regs[REG_INDEX(REG_PLL_GPU_BIAS)] = REG_PLL_GPU_BIAS_RST; | 110 | DO_2MISC_FP_VEC(VCLT0_F, gen_helper_gvec_fclt0_h, gen_helper_gvec_fclt0_s) |
376 | + s->regs[REG_INDEX(REG_PLL_PERIPH1_BIAS)] = REG_PLL_PERIPH1_BIAS_RST; | 111 | DO_2MISC_FP_VEC(VCLE0_F, gen_helper_gvec_fcle0_h, gen_helper_gvec_fcle0_s) |
377 | + s->regs[REG_INDEX(REG_PLL_DE_BIAS)] = REG_PLL_DE_BIAS_RST; | 112 | +DO_2MISC_FP_VEC(VCVT_FS, gen_helper_gvec_sstoh, gen_helper_gvec_sitos) |
378 | + s->regs[REG_INDEX(REG_PLL_CPUX_TUNING)] = REG_PLL_CPUX_TUNING_RST; | 113 | +DO_2MISC_FP_VEC(VCVT_FU, gen_helper_gvec_ustoh, gen_helper_gvec_uitos) |
379 | + s->regs[REG_INDEX(REG_PLL_DDR_TUNING)] = REG_PLL_DDR_TUNING_RST; | 114 | +DO_2MISC_FP_VEC(VCVT_SF, gen_helper_gvec_tosszh, gen_helper_gvec_tosizs) |
380 | +} | 115 | +DO_2MISC_FP_VEC(VCVT_UF, gen_helper_gvec_touszh, gen_helper_gvec_touizs) |
381 | + | 116 | |
382 | +static void allwinner_h3_ccu_init(Object *obj) | 117 | static bool trans_VRINTX(DisasContext *s, arg_2misc *a) |
383 | +{ | 118 | { |
384 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
385 | + AwH3ClockCtlState *s = AW_H3_CCU(obj); | ||
386 | + | ||
387 | + /* Memory mapping */ | ||
388 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_h3_ccu_ops, s, | ||
389 | + TYPE_AW_H3_CCU, AW_H3_CCU_IOSIZE); | ||
390 | + sysbus_init_mmio(sbd, &s->iomem); | ||
391 | +} | ||
392 | + | ||
393 | +static const VMStateDescription allwinner_h3_ccu_vmstate = { | ||
394 | + .name = "allwinner-h3-ccu", | ||
395 | + .version_id = 1, | ||
396 | + .minimum_version_id = 1, | ||
397 | + .fields = (VMStateField[]) { | ||
398 | + VMSTATE_UINT32_ARRAY(regs, AwH3ClockCtlState, AW_H3_CCU_REGS_NUM), | ||
399 | + VMSTATE_END_OF_LIST() | ||
400 | + } | ||
401 | +}; | ||
402 | + | ||
403 | +static void allwinner_h3_ccu_class_init(ObjectClass *klass, void *data) | ||
404 | +{ | ||
405 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
406 | + | ||
407 | + dc->reset = allwinner_h3_ccu_reset; | ||
408 | + dc->vmsd = &allwinner_h3_ccu_vmstate; | ||
409 | +} | ||
410 | + | ||
411 | +static const TypeInfo allwinner_h3_ccu_info = { | ||
412 | + .name = TYPE_AW_H3_CCU, | ||
413 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
414 | + .instance_init = allwinner_h3_ccu_init, | ||
415 | + .instance_size = sizeof(AwH3ClockCtlState), | ||
416 | + .class_init = allwinner_h3_ccu_class_init, | ||
417 | +}; | ||
418 | + | ||
419 | +static void allwinner_h3_ccu_register(void) | ||
420 | +{ | ||
421 | + type_register_static(&allwinner_h3_ccu_info); | ||
422 | +} | ||
423 | + | ||
424 | +type_init(allwinner_h3_ccu_register) | ||
425 | -- | 119 | -- |
426 | 2.20.1 | 120 | 2.20.1 |
427 | 121 | ||
428 | 122 | diff view generated by jsdifflib |
1 | From: Guenter Roeck <linux@roeck-us.net> | 1 | Convert the Neon VCVT float<->fixed-point insns to a |
---|---|---|---|
2 | gvec style, in preparation for adding fp16 support. | ||
2 | 3 | ||
3 | i.MX25 supports two USB controllers. Let's wire them up. | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
6 | Message-id: 20200828183354.27913-38-peter.maydell@linaro.org | ||
7 | --- | ||
8 | target/arm/helper.h | 5 +++++ | ||
9 | target/arm/vec_helper.c | 20 +++++++++++++++++++ | ||
10 | target/arm/translate-neon.c.inc | 35 +++++++++++++++++---------------- | ||
11 | 3 files changed, 43 insertions(+), 17 deletions(-) | ||
4 | 12 | ||
5 | With this patch, imx25-pdk can boot from both USB ports. | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
6 | |||
7 | Signed-off-by: Guenter Roeck <linux@roeck-us.net> | ||
8 | Message-id: 20200310215146.19688-3-linux@roeck-us.net | ||
9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | --- | ||
12 | include/hw/arm/fsl-imx25.h | 9 +++++++++ | ||
13 | hw/arm/fsl-imx25.c | 24 ++++++++++++++++++++++++ | ||
14 | 2 files changed, 33 insertions(+) | ||
15 | |||
16 | diff --git a/include/hw/arm/fsl-imx25.h b/include/hw/arm/fsl-imx25.h | ||
17 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/include/hw/arm/fsl-imx25.h | 15 | --- a/target/arm/helper.h |
19 | +++ b/include/hw/arm/fsl-imx25.h | 16 | +++ b/target/arm/helper.h |
20 | @@ -XXX,XX +XXX,XX @@ | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_tosizs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
21 | #include "hw/i2c/imx_i2c.h" | 18 | DEF_HELPER_FLAGS_4(gvec_touszh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
22 | #include "hw/gpio/imx_gpio.h" | 19 | DEF_HELPER_FLAGS_4(gvec_touizs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
23 | #include "hw/sd/sdhci.h" | 20 | |
24 | +#include "hw/usb/chipidea.h" | 21 | +DEF_HELPER_FLAGS_4(gvec_vcvt_sf, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
25 | #include "exec/memory.h" | 22 | +DEF_HELPER_FLAGS_4(gvec_vcvt_uf, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
26 | #include "target/arm/cpu.h" | 23 | +DEF_HELPER_FLAGS_4(gvec_vcvt_fs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
27 | 24 | +DEF_HELPER_FLAGS_4(gvec_vcvt_fu, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | |
28 | @@ -XXX,XX +XXX,XX @@ | 25 | + |
29 | #define FSL_IMX25_NUM_I2CS 3 | 26 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
30 | #define FSL_IMX25_NUM_GPIOS 4 | 27 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
31 | #define FSL_IMX25_NUM_ESDHCS 2 | 28 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
32 | +#define FSL_IMX25_NUM_USBS 2 | 29 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
33 | |||
34 | typedef struct FslIMX25State { | ||
35 | /*< private >*/ | ||
36 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
37 | IMXI2CState i2c[FSL_IMX25_NUM_I2CS]; | ||
38 | IMXGPIOState gpio[FSL_IMX25_NUM_GPIOS]; | ||
39 | SDHCIState esdhc[FSL_IMX25_NUM_ESDHCS]; | ||
40 | + ChipideaState usb[FSL_IMX25_NUM_USBS]; | ||
41 | MemoryRegion rom[2]; | ||
42 | MemoryRegion iram; | ||
43 | MemoryRegion iram_alias; | ||
44 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
45 | #define FSL_IMX25_GPIO1_SIZE 0x4000 | ||
46 | #define FSL_IMX25_GPIO2_ADDR 0x53FD0000 | ||
47 | #define FSL_IMX25_GPIO2_SIZE 0x4000 | ||
48 | +#define FSL_IMX25_USB1_ADDR 0x53FF4000 | ||
49 | +#define FSL_IMX25_USB1_SIZE 0x0200 | ||
50 | +#define FSL_IMX25_USB2_ADDR 0x53FF4400 | ||
51 | +#define FSL_IMX25_USB2_SIZE 0x0200 | ||
52 | #define FSL_IMX25_AVIC_ADDR 0x68000000 | ||
53 | #define FSL_IMX25_AVIC_SIZE 0x4000 | ||
54 | #define FSL_IMX25_IRAM_ADDR 0x78000000 | ||
55 | @@ -XXX,XX +XXX,XX @@ typedef struct FslIMX25State { | ||
56 | #define FSL_IMX25_GPIO4_IRQ 23 | ||
57 | #define FSL_IMX25_ESDHC1_IRQ 9 | ||
58 | #define FSL_IMX25_ESDHC2_IRQ 8 | ||
59 | +#define FSL_IMX25_USB1_IRQ 37 | ||
60 | +#define FSL_IMX25_USB2_IRQ 35 | ||
61 | |||
62 | #endif /* FSL_IMX25_H */ | ||
63 | diff --git a/hw/arm/fsl-imx25.c b/hw/arm/fsl-imx25.c | ||
64 | index XXXXXXX..XXXXXXX 100644 | 30 | index XXXXXXX..XXXXXXX 100644 |
65 | --- a/hw/arm/fsl-imx25.c | 31 | --- a/target/arm/vec_helper.c |
66 | +++ b/hw/arm/fsl-imx25.c | 32 | +++ b/target/arm/vec_helper.c |
67 | @@ -XXX,XX +XXX,XX @@ static void fsl_imx25_init(Object *obj) | 33 | @@ -XXX,XX +XXX,XX @@ DO_NEON_PAIRWISE(neon_pmax, max) |
68 | sysbus_init_child_obj(obj, "sdhc[*]", &s->esdhc[i], sizeof(s->esdhc[i]), | 34 | DO_NEON_PAIRWISE(neon_pmin, min) |
69 | TYPE_IMX_USDHC); | 35 | |
70 | } | 36 | #undef DO_NEON_PAIRWISE |
71 | + | 37 | + |
72 | + for (i = 0; i < FSL_IMX25_NUM_USBS; i++) { | 38 | +#define DO_VCVT_FIXED(NAME, FUNC, TYPE) \ |
73 | + sysbus_init_child_obj(obj, "usb[*]", &s->usb[i], sizeof(s->usb[i]), | 39 | + void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ |
74 | + TYPE_CHIPIDEA); | 40 | + { \ |
41 | + intptr_t i, oprsz = simd_oprsz(desc); \ | ||
42 | + int shift = simd_data(desc); \ | ||
43 | + TYPE *d = vd, *n = vn; \ | ||
44 | + float_status *fpst = stat; \ | ||
45 | + for (i = 0; i < oprsz / sizeof(TYPE); i++) { \ | ||
46 | + d[i] = FUNC(n[i], shift, fpst); \ | ||
47 | + } \ | ||
48 | + clear_tail(d, oprsz, simd_maxsz(desc)); \ | ||
75 | + } | 49 | + } |
76 | + | 50 | + |
51 | +DO_VCVT_FIXED(gvec_vcvt_sf, helper_vfp_sltos, uint32_t) | ||
52 | +DO_VCVT_FIXED(gvec_vcvt_uf, helper_vfp_ultos, uint32_t) | ||
53 | +DO_VCVT_FIXED(gvec_vcvt_fs, helper_vfp_tosls_round_to_zero, uint32_t) | ||
54 | +DO_VCVT_FIXED(gvec_vcvt_fu, helper_vfp_touls_round_to_zero, uint32_t) | ||
55 | + | ||
56 | +#undef DO_VCVT_FIXED | ||
57 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
58 | index XXXXXXX..XXXXXXX 100644 | ||
59 | --- a/target/arm/translate-neon.c.inc | ||
60 | +++ b/target/arm/translate-neon.c.inc | ||
61 | @@ -XXX,XX +XXX,XX @@ static bool trans_VSHLL_U_2sh(DisasContext *s, arg_2reg_shift *a) | ||
77 | } | 62 | } |
78 | 63 | ||
79 | static void fsl_imx25_realize(DeviceState *dev, Error **errp) | 64 | static bool do_fp_2sh(DisasContext *s, arg_2reg_shift *a, |
80 | @@ -XXX,XX +XXX,XX @@ static void fsl_imx25_realize(DeviceState *dev, Error **errp) | 65 | - NeonGenTwoSingleOpFn *fn) |
81 | esdhc_table[i].irq)); | 66 | + gen_helper_gvec_2_ptr *fn) |
67 | { | ||
68 | /* FP operations in 2-reg-and-shift group */ | ||
69 | - TCGv_i32 tmp, shiftv; | ||
70 | - TCGv_ptr fpstatus; | ||
71 | - int pass; | ||
72 | + int vec_size = a->q ? 16 : 8; | ||
73 | + int rd_ofs = neon_reg_offset(a->vd, 0); | ||
74 | + int rm_ofs = neon_reg_offset(a->vm, 0); | ||
75 | + TCGv_ptr fpst; | ||
76 | |||
77 | if (!arm_dc_feature(s, ARM_FEATURE_NEON)) { | ||
78 | return false; | ||
82 | } | 79 | } |
83 | 80 | ||
84 | + /* USB */ | 81 | + if (a->size != 0) { |
85 | + for (i = 0; i < FSL_IMX25_NUM_USBS; i++) { | 82 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { |
86 | + static const struct { | 83 | + return false; |
87 | + hwaddr addr; | 84 | + } |
88 | + unsigned int irq; | ||
89 | + } usb_table[FSL_IMX25_NUM_USBS] = { | ||
90 | + { FSL_IMX25_USB1_ADDR, FSL_IMX25_USB1_IRQ }, | ||
91 | + { FSL_IMX25_USB2_ADDR, FSL_IMX25_USB2_IRQ }, | ||
92 | + }; | ||
93 | + | ||
94 | + object_property_set_bool(OBJECT(&s->usb[i]), true, "realized", | ||
95 | + &error_abort); | ||
96 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->usb[i]), 0, usb_table[i].addr); | ||
97 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->usb[i]), 0, | ||
98 | + qdev_get_gpio_in(DEVICE(&s->avic), | ||
99 | + usb_table[i].irq)); | ||
100 | + } | 85 | + } |
101 | + | 86 | + |
102 | /* initialize 2 x 16 KB ROM */ | 87 | /* UNDEF accesses to D16-D31 if they don't exist. */ |
103 | memory_region_init_rom(&s->rom[0], NULL, | 88 | if (!dc_isar_feature(aa32_simd_r32, s) && |
104 | "imx25.rom0", FSL_IMX25_ROM0_SIZE, &err); | 89 | ((a->vd | a->vm) & 0x10)) { |
90 | @@ -XXX,XX +XXX,XX @@ static bool do_fp_2sh(DisasContext *s, arg_2reg_shift *a, | ||
91 | return true; | ||
92 | } | ||
93 | |||
94 | - fpstatus = fpstatus_ptr(FPST_STD); | ||
95 | - shiftv = tcg_const_i32(a->shift); | ||
96 | - for (pass = 0; pass < (a->q ? 4 : 2); pass++) { | ||
97 | - tmp = neon_load_reg(a->vm, pass); | ||
98 | - fn(tmp, tmp, shiftv, fpstatus); | ||
99 | - neon_store_reg(a->vd, pass, tmp); | ||
100 | - } | ||
101 | - tcg_temp_free_ptr(fpstatus); | ||
102 | - tcg_temp_free_i32(shiftv); | ||
103 | + fpst = fpstatus_ptr(a->size ? FPST_STD_F16 : FPST_STD); | ||
104 | + tcg_gen_gvec_2_ptr(rd_ofs, rm_ofs, fpst, vec_size, vec_size, a->shift, fn); | ||
105 | + tcg_temp_free_ptr(fpst); | ||
106 | return true; | ||
107 | } | ||
108 | |||
109 | @@ -XXX,XX +XXX,XX @@ static bool do_fp_2sh(DisasContext *s, arg_2reg_shift *a, | ||
110 | return do_fp_2sh(s, a, FUNC); \ | ||
111 | } | ||
112 | |||
113 | -DO_FP_2SH(VCVT_SF, gen_helper_vfp_sltos) | ||
114 | -DO_FP_2SH(VCVT_UF, gen_helper_vfp_ultos) | ||
115 | -DO_FP_2SH(VCVT_FS, gen_helper_vfp_tosls_round_to_zero) | ||
116 | -DO_FP_2SH(VCVT_FU, gen_helper_vfp_touls_round_to_zero) | ||
117 | +DO_FP_2SH(VCVT_SF, gen_helper_gvec_vcvt_sf) | ||
118 | +DO_FP_2SH(VCVT_UF, gen_helper_gvec_vcvt_uf) | ||
119 | +DO_FP_2SH(VCVT_FS, gen_helper_gvec_vcvt_fs) | ||
120 | +DO_FP_2SH(VCVT_FU, gen_helper_gvec_vcvt_fu) | ||
121 | |||
122 | static uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) | ||
123 | { | ||
105 | -- | 124 | -- |
106 | 2.20.1 | 125 | 2.20.1 |
107 | 126 | ||
108 | 127 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | Implement fp16 for the Neon VCVT insns which convert between |
---|---|---|---|
2 | float and fixed-point. | ||
2 | 3 | ||
3 | The kernel image and DeviceTree blob are built by the Armbian | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | project (based on Debian): | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | https://www.armbian.com/orange-pi-pc/ | 6 | Message-id: 20200828183354.27913-39-peter.maydell@linaro.org |
7 | --- | ||
8 | target/arm/helper.h | 5 +++++ | ||
9 | target/arm/neon-dp.decode | 8 +++++++- | ||
10 | target/arm/vec_helper.c | 4 ++++ | ||
11 | target/arm/translate-neon.c.inc | 5 +++++ | ||
12 | 4 files changed, 21 insertions(+), 1 deletion(-) | ||
6 | 13 | ||
7 | The SD image is from the kernelci.org project: | 14 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
8 | https://kernelci.org/faq/#the-code | ||
9 | |||
10 | If ARM is a target being built, "make check-acceptance" will | ||
11 | automatically include this test by the use of the "arch:arm" tags. | ||
12 | |||
13 | Alternatively, this test can be run using: | ||
14 | |||
15 | $ avocado --show=console run -t machine:orangepi-pc tests/acceptance/boot_linux_console.py | ||
16 | console: Uncompressing Linux... done, booting the kernel. | ||
17 | console: Booting Linux on physical CPU 0x0 | ||
18 | console: Linux version 4.20.7-sunxi (root@armbian.com) (gcc version 7.2.1 20171011 (Linaro GCC 7.2-2017.11)) #5.75 SMP Fri Feb 8 09:02:10 CET 2019 | ||
19 | console: CPU: ARMv7 Processor [410fc075] revision 5 (ARMv7), cr=50c5387d | ||
20 | [...] | ||
21 | console: sunxi-wdt 1c20ca0.watchdog: Watchdog enabled (timeout=16 sec, nowayout=0) | ||
22 | console: sunxi-mmc 1c0f000.mmc: Linked as a consumer to regulator.2 | ||
23 | console: sunxi-mmc 1c0f000.mmc: Got CD GPIO | ||
24 | console: ledtrig-cpu: registered to indicate activity on CPUs | ||
25 | console: hidraw: raw HID events driver (C) Jiri Kosina | ||
26 | console: usbcore: registered new interface driver usbhid | ||
27 | console: usbhid: USB HID core driver | ||
28 | console: Initializing XFRM netlink socket | ||
29 | console: sunxi-mmc 1c0f000.mmc: initialized, max. request size: 16384 KB | ||
30 | console: NET: Registered protocol family 10 | ||
31 | console: mmc0: host does not support reading read-only switch, assuming write-enable | ||
32 | console: mmc0: Problem switching card into high-speed mode! | ||
33 | console: mmc0: new SD card at address 4567 | ||
34 | console: mmcblk0: mmc0:4567 QEMU! 60.0 MiB | ||
35 | [...] | ||
36 | console: EXT4-fs (mmcblk0): mounting ext2 file system using the ext4 subsystem | ||
37 | console: EXT4-fs (mmcblk0): mounted filesystem without journal. Opts: (null) | ||
38 | console: VFS: Mounted root (ext2 filesystem) on device 179:0. | ||
39 | console: Run /sbin/init as init process | ||
40 | console: EXT4-fs (mmcblk0): re-mounted. Opts: block_validity,barrier,user_xattr,acl | ||
41 | console: Starting syslogd: OK | ||
42 | console: Starting klogd: OK | ||
43 | console: Populating /dev using udev: udevd[203]: starting version 3.2.7 | ||
44 | console: /bin/sh: can't access tty; job control turned off | ||
45 | console: cat /proc/partitions | ||
46 | console: / # cat /proc/partitions | ||
47 | console: major minor #blocks name | ||
48 | console: 1 0 4096 ram0 | ||
49 | console: 1 1 4096 ram1 | ||
50 | console: 1 2 4096 ram2 | ||
51 | console: 1 3 4096 ram3 | ||
52 | console: 179 0 61440 mmcblk0 | ||
53 | console: reboot | ||
54 | console: / # reboot | ||
55 | console: umount: devtmpfs busy - remounted read-only | ||
56 | console: EXT4-fs (mmcblk0): re-mounted. Opts: (null) | ||
57 | console: The system is going down NOW! | ||
58 | console: Sent SIGTERM to all processes | ||
59 | console: Sent SIGKILL to all processes | ||
60 | console: Requesting system reboot | ||
61 | console: reboot: Restarting system | ||
62 | JOB TIME : 68.64 s | ||
63 | |||
64 | Signed-off-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
65 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
66 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
67 | Tested-by: Alex Bennée <alex.bennee@linaro.org> | ||
68 | Message-id: 20200311221854.30370-16-nieklinnenbank@gmail.com | ||
69 | [NL: rename in commit message Raspbian to Armbian, remove vm.set_machine()] | ||
70 | [NL: extend test with ethernet device checks] | ||
71 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
72 | --- | ||
73 | tests/acceptance/boot_linux_console.py | 47 ++++++++++++++++++++++++++ | ||
74 | 1 file changed, 47 insertions(+) | ||
75 | |||
76 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | ||
77 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
78 | --- a/tests/acceptance/boot_linux_console.py | 16 | --- a/target/arm/helper.h |
79 | +++ b/tests/acceptance/boot_linux_console.py | 17 | +++ b/target/arm/helper.h |
80 | @@ -XXX,XX +XXX,XX @@ class BootLinuxConsole(Test): | 18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_vcvt_uf, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
81 | exec_command_and_wait_for_pattern(self, 'reboot', | 19 | DEF_HELPER_FLAGS_4(gvec_vcvt_fs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
82 | 'reboot: Restarting system') | 20 | DEF_HELPER_FLAGS_4(gvec_vcvt_fu, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
83 | 21 | ||
84 | + def test_arm_orangepi_sd(self): | 22 | +DEF_HELPER_FLAGS_4(gvec_vcvt_sh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
85 | + """ | 23 | +DEF_HELPER_FLAGS_4(gvec_vcvt_uh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
86 | + :avocado: tags=arch:arm | 24 | +DEF_HELPER_FLAGS_4(gvec_vcvt_hs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
87 | + :avocado: tags=machine:orangepi-pc | 25 | +DEF_HELPER_FLAGS_4(gvec_vcvt_hu, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
88 | + """ | ||
89 | + deb_url = ('https://apt.armbian.com/pool/main/l/' | ||
90 | + 'linux-4.20.7-sunxi/linux-image-dev-sunxi_5.75_armhf.deb') | ||
91 | + deb_hash = '1334c29c44d984ffa05ed10de8c3361f33d78315' | ||
92 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | ||
93 | + kernel_path = self.extract_from_deb(deb_path, | ||
94 | + '/boot/vmlinuz-4.20.7-sunxi') | ||
95 | + dtb_path = '/usr/lib/linux-image-dev-sunxi/sun8i-h3-orangepi-pc.dtb' | ||
96 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | ||
97 | + rootfs_url = ('http://storage.kernelci.org/images/rootfs/buildroot/' | ||
98 | + 'kci-2019.02/armel/base/rootfs.ext2.xz') | ||
99 | + rootfs_hash = '692510cb625efda31640d1de0a8d60e26040f061' | ||
100 | + rootfs_path_xz = self.fetch_asset(rootfs_url, asset_hash=rootfs_hash) | ||
101 | + rootfs_path = os.path.join(self.workdir, 'rootfs.cpio') | ||
102 | + archive.lzma_uncompress(rootfs_path_xz, rootfs_path) | ||
103 | + | 26 | + |
104 | + self.vm.set_console() | 27 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
105 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | 28 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
106 | + 'console=ttyS0,115200 ' | 29 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
107 | + 'root=/dev/mmcblk0 rootwait rw ' | 30 | diff --git a/target/arm/neon-dp.decode b/target/arm/neon-dp.decode |
108 | + 'panic=-1 noreboot') | 31 | index XXXXXXX..XXXXXXX 100644 |
109 | + self.vm.add_args('-kernel', kernel_path, | 32 | --- a/target/arm/neon-dp.decode |
110 | + '-dtb', dtb_path, | 33 | +++ b/target/arm/neon-dp.decode |
111 | + '-drive', 'file=' + rootfs_path + ',if=sd,format=raw', | 34 | @@ -XXX,XX +XXX,XX @@ VMINNM_fp_3s 1111 001 1 0 . 1 . .... .... 1111 ... 1 .... @3same_fp |
112 | + '-append', kernel_command_line, | 35 | # We use size=0 for fp32 and size=1 for fp16 to match the 3-same encodings. |
113 | + '-no-reboot') | 36 | @2reg_vcvt .... ... . . . 1 ..... .... .... . q:1 . . .... \ |
114 | + self.vm.launch() | 37 | &2reg_shift vm=%vm_dp vd=%vd_dp size=0 shift=%neon_rshift_i5 |
115 | + shell_ready = "/bin/sh: can't access tty; job control turned off" | 38 | +@2reg_vcvt_f16 .... ... . . . 11 .... .... .... . q:1 . . .... \ |
116 | + self.wait_for_console_pattern(shell_ready) | 39 | + &2reg_shift vm=%vm_dp vd=%vd_dp size=1 shift=%neon_rshift_i4 |
40 | |||
41 | VSHR_S_2sh 1111 001 0 1 . ...... .... 0000 . . . 1 .... @2reg_shr_d | ||
42 | VSHR_S_2sh 1111 001 0 1 . ...... .... 0000 . . . 1 .... @2reg_shr_s | ||
43 | @@ -XXX,XX +XXX,XX @@ VSHLL_U_2sh 1111 001 1 1 . ...... .... 1010 . 0 . 1 .... @2reg_shll_h | ||
44 | VSHLL_U_2sh 1111 001 1 1 . ...... .... 1010 . 0 . 1 .... @2reg_shll_b | ||
45 | |||
46 | # VCVT fixed<->float conversions | ||
47 | -# TODO: FP16 fixed<->float conversions are opc==0b1100 and 0b1101 | ||
48 | +VCVT_SH_2sh 1111 001 0 1 . ...... .... 1100 0 . . 1 .... @2reg_vcvt_f16 | ||
49 | +VCVT_UH_2sh 1111 001 1 1 . ...... .... 1100 0 . . 1 .... @2reg_vcvt_f16 | ||
50 | +VCVT_HS_2sh 1111 001 0 1 . ...... .... 1101 0 . . 1 .... @2reg_vcvt_f16 | ||
51 | +VCVT_HU_2sh 1111 001 1 1 . ...... .... 1101 0 . . 1 .... @2reg_vcvt_f16 | ||
117 | + | 52 | + |
118 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | 53 | VCVT_SF_2sh 1111 001 0 1 . ...... .... 1110 0 . . 1 .... @2reg_vcvt |
119 | + 'Allwinner sun8i Family') | 54 | VCVT_UF_2sh 1111 001 1 1 . ...... .... 1110 0 . . 1 .... @2reg_vcvt |
120 | + exec_command_and_wait_for_pattern(self, 'cat /proc/partitions', | 55 | VCVT_FS_2sh 1111 001 0 1 . ...... .... 1111 0 . . 1 .... @2reg_vcvt |
121 | + 'mmcblk0') | 56 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
122 | + exec_command_and_wait_for_pattern(self, 'ifconfig eth0 up', | 57 | index XXXXXXX..XXXXXXX 100644 |
123 | + 'eth0: Link is Up') | 58 | --- a/target/arm/vec_helper.c |
124 | + exec_command_and_wait_for_pattern(self, 'udhcpc eth0', | 59 | +++ b/target/arm/vec_helper.c |
125 | + 'udhcpc: lease of 10.0.2.15 obtained') | 60 | @@ -XXX,XX +XXX,XX @@ DO_VCVT_FIXED(gvec_vcvt_sf, helper_vfp_sltos, uint32_t) |
126 | + exec_command_and_wait_for_pattern(self, 'ping -c 3 10.0.2.2', | 61 | DO_VCVT_FIXED(gvec_vcvt_uf, helper_vfp_ultos, uint32_t) |
127 | + '3 packets transmitted, 3 packets received, 0% packet loss') | 62 | DO_VCVT_FIXED(gvec_vcvt_fs, helper_vfp_tosls_round_to_zero, uint32_t) |
128 | + exec_command_and_wait_for_pattern(self, 'reboot', | 63 | DO_VCVT_FIXED(gvec_vcvt_fu, helper_vfp_touls_round_to_zero, uint32_t) |
129 | + 'reboot: Restarting system') | 64 | +DO_VCVT_FIXED(gvec_vcvt_sh, helper_vfp_shtoh, uint16_t) |
65 | +DO_VCVT_FIXED(gvec_vcvt_uh, helper_vfp_uhtoh, uint16_t) | ||
66 | +DO_VCVT_FIXED(gvec_vcvt_hs, helper_vfp_toshh_round_to_zero, uint16_t) | ||
67 | +DO_VCVT_FIXED(gvec_vcvt_hu, helper_vfp_touhh_round_to_zero, uint16_t) | ||
68 | |||
69 | #undef DO_VCVT_FIXED | ||
70 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
71 | index XXXXXXX..XXXXXXX 100644 | ||
72 | --- a/target/arm/translate-neon.c.inc | ||
73 | +++ b/target/arm/translate-neon.c.inc | ||
74 | @@ -XXX,XX +XXX,XX @@ DO_FP_2SH(VCVT_UF, gen_helper_gvec_vcvt_uf) | ||
75 | DO_FP_2SH(VCVT_FS, gen_helper_gvec_vcvt_fs) | ||
76 | DO_FP_2SH(VCVT_FU, gen_helper_gvec_vcvt_fu) | ||
77 | |||
78 | +DO_FP_2SH(VCVT_SH, gen_helper_gvec_vcvt_sh) | ||
79 | +DO_FP_2SH(VCVT_UH, gen_helper_gvec_vcvt_uh) | ||
80 | +DO_FP_2SH(VCVT_HS, gen_helper_gvec_vcvt_hs) | ||
81 | +DO_FP_2SH(VCVT_HU, gen_helper_gvec_vcvt_hu) | ||
130 | + | 82 | + |
131 | def test_s390x_s390_ccw_virtio(self): | 83 | static uint64_t asimd_imm_const(uint32_t imm, int cmode, int op) |
132 | """ | 84 | { |
133 | :avocado: tags=arch:s390x | 85 | /* |
134 | -- | 86 | -- |
135 | 2.20.1 | 87 | 2.20.1 |
136 | 88 | ||
137 | 89 | diff view generated by jsdifflib |
1 | From: Igor Mammedov <imammedo@redhat.com> | 1 | Convert the Neon VCVT with-specified-rounding-mode instructions |
---|---|---|---|
2 | to gvec, and use this to implement fp16 support for them. | ||
2 | 3 | ||
3 | SOC object returned by object_new() is leaked in current code. | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Set SOC parent explicitly to board and then unref to SOC object | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | to make sure that refererence returned by object_new() is taken | 6 | Message-id: 20200828183354.27913-40-peter.maydell@linaro.org |
6 | care of. | 7 | --- |
8 | target/arm/helper.h | 5 ++ | ||
9 | target/arm/vec_helper.c | 23 +++++++ | ||
10 | target/arm/translate-neon.c.inc | 105 ++++++++++++-------------------- | ||
11 | 3 files changed, 66 insertions(+), 67 deletions(-) | ||
7 | 12 | ||
8 | The SOC object will be kept alive by its parent (machine) and | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
9 | will be automatically freed when MachineState is destroyed. | ||
10 | |||
11 | Signed-off-by: Igor Mammedov <imammedo@redhat.com> | ||
12 | Reported-by: Andrew Jones <drjones@redhat.com> | ||
13 | Tested-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
14 | Message-id: 20200303091254.22373-1-imammedo@redhat.com | ||
15 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
16 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
17 | --- | ||
18 | hw/arm/cubieboard.c | 3 +++ | ||
19 | 1 file changed, 3 insertions(+) | ||
20 | |||
21 | diff --git a/hw/arm/cubieboard.c b/hw/arm/cubieboard.c | ||
22 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
23 | --- a/hw/arm/cubieboard.c | 15 | --- a/target/arm/helper.h |
24 | +++ b/hw/arm/cubieboard.c | 16 | +++ b/target/arm/helper.h |
25 | @@ -XXX,XX +XXX,XX @@ static void cubieboard_init(MachineState *machine) | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_vcvt_uh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
18 | DEF_HELPER_FLAGS_4(gvec_vcvt_hs, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
19 | DEF_HELPER_FLAGS_4(gvec_vcvt_hu, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
20 | |||
21 | +DEF_HELPER_FLAGS_4(gvec_vcvt_rm_ss, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
22 | +DEF_HELPER_FLAGS_4(gvec_vcvt_rm_us, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
23 | +DEF_HELPER_FLAGS_4(gvec_vcvt_rm_sh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
24 | +DEF_HELPER_FLAGS_4(gvec_vcvt_rm_uh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
25 | + | ||
26 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
27 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
28 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
29 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
30 | index XXXXXXX..XXXXXXX 100644 | ||
31 | --- a/target/arm/vec_helper.c | ||
32 | +++ b/target/arm/vec_helper.c | ||
33 | @@ -XXX,XX +XXX,XX @@ DO_VCVT_FIXED(gvec_vcvt_hs, helper_vfp_toshh_round_to_zero, uint16_t) | ||
34 | DO_VCVT_FIXED(gvec_vcvt_hu, helper_vfp_touhh_round_to_zero, uint16_t) | ||
35 | |||
36 | #undef DO_VCVT_FIXED | ||
37 | + | ||
38 | +#define DO_VCVT_RMODE(NAME, FUNC, TYPE) \ | ||
39 | + void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ | ||
40 | + { \ | ||
41 | + float_status *fpst = stat; \ | ||
42 | + intptr_t i, oprsz = simd_oprsz(desc); \ | ||
43 | + uint32_t rmode = simd_data(desc); \ | ||
44 | + uint32_t prev_rmode = get_float_rounding_mode(fpst); \ | ||
45 | + TYPE *d = vd, *n = vn; \ | ||
46 | + set_float_rounding_mode(rmode, fpst); \ | ||
47 | + for (i = 0; i < oprsz / sizeof(TYPE); i++) { \ | ||
48 | + d[i] = FUNC(n[i], 0, fpst); \ | ||
49 | + } \ | ||
50 | + set_float_rounding_mode(prev_rmode, fpst); \ | ||
51 | + clear_tail(d, oprsz, simd_maxsz(desc)); \ | ||
52 | + } | ||
53 | + | ||
54 | +DO_VCVT_RMODE(gvec_vcvt_rm_ss, helper_vfp_tosls, uint32_t) | ||
55 | +DO_VCVT_RMODE(gvec_vcvt_rm_us, helper_vfp_touls, uint32_t) | ||
56 | +DO_VCVT_RMODE(gvec_vcvt_rm_sh, helper_vfp_toshh, uint16_t) | ||
57 | +DO_VCVT_RMODE(gvec_vcvt_rm_uh, helper_vfp_touhh, uint16_t) | ||
58 | + | ||
59 | +#undef DO_VCVT_RMODE | ||
60 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
61 | index XXXXXXX..XXXXXXX 100644 | ||
62 | --- a/target/arm/translate-neon.c.inc | ||
63 | +++ b/target/arm/translate-neon.c.inc | ||
64 | @@ -XXX,XX +XXX,XX @@ DO_VRINT(VRINTZ, FPROUNDING_ZERO) | ||
65 | DO_VRINT(VRINTM, FPROUNDING_NEGINF) | ||
66 | DO_VRINT(VRINTP, FPROUNDING_POSINF) | ||
67 | |||
68 | -static bool do_vcvt(DisasContext *s, arg_2misc *a, int rmode, bool is_signed) | ||
69 | -{ | ||
70 | - /* | ||
71 | - * Handle a VCVT* operation by iterating 32 bits at a time, | ||
72 | - * with a specified rounding mode in operation. | ||
73 | - */ | ||
74 | - int pass; | ||
75 | - TCGv_ptr fpst; | ||
76 | - TCGv_i32 tcg_rmode, tcg_shift; | ||
77 | - | ||
78 | - if (!arm_dc_feature(s, ARM_FEATURE_NEON) || | ||
79 | - !arm_dc_feature(s, ARM_FEATURE_V8)) { | ||
80 | - return false; | ||
81 | +#define DO_VEC_RMODE(INSN, RMODE, OP) \ | ||
82 | + static void gen_##INSN(unsigned vece, uint32_t rd_ofs, \ | ||
83 | + uint32_t rm_ofs, \ | ||
84 | + uint32_t oprsz, uint32_t maxsz) \ | ||
85 | + { \ | ||
86 | + static gen_helper_gvec_2_ptr * const fns[4] = { \ | ||
87 | + NULL, \ | ||
88 | + gen_helper_gvec_##OP##h, \ | ||
89 | + gen_helper_gvec_##OP##s, \ | ||
90 | + NULL, \ | ||
91 | + }; \ | ||
92 | + TCGv_ptr fpst; \ | ||
93 | + fpst = fpstatus_ptr(vece == 1 ? FPST_STD_F16 : FPST_STD); \ | ||
94 | + tcg_gen_gvec_2_ptr(rd_ofs, rm_ofs, fpst, oprsz, maxsz, \ | ||
95 | + arm_rmode_to_sf(RMODE), fns[vece]); \ | ||
96 | + tcg_temp_free_ptr(fpst); \ | ||
97 | + } \ | ||
98 | + static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ | ||
99 | + { \ | ||
100 | + if (!arm_dc_feature(s, ARM_FEATURE_V8)) { \ | ||
101 | + return false; \ | ||
102 | + } \ | ||
103 | + if (a->size == MO_16) { \ | ||
104 | + if (!dc_isar_feature(aa32_fp16_arith, s)) { \ | ||
105 | + return false; \ | ||
106 | + } \ | ||
107 | + } else if (a->size != MO_32) { \ | ||
108 | + return false; \ | ||
109 | + } \ | ||
110 | + return do_2misc_vec(s, a, gen_##INSN); \ | ||
26 | } | 111 | } |
27 | 112 | ||
28 | a10 = AW_A10(object_new(TYPE_AW_A10)); | 113 | - /* UNDEF accesses to D16-D31 if they don't exist. */ |
29 | + object_property_add_child(OBJECT(machine), "soc", OBJECT(a10), | 114 | - if (!dc_isar_feature(aa32_simd_r32, s) && |
30 | + &error_abort); | 115 | - ((a->vd | a->vm) & 0x10)) { |
31 | + object_unref(OBJECT(a10)); | 116 | - return false; |
32 | 117 | - } | |
33 | object_property_set_int(OBJECT(&a10->emac), 1, "phy-addr", &err); | 118 | - |
34 | if (err != NULL) { | 119 | - if (a->size != 2) { |
120 | - /* TODO: FP16 will be the size == 1 case */ | ||
121 | - return false; | ||
122 | - } | ||
123 | - | ||
124 | - if ((a->vd | a->vm) & a->q) { | ||
125 | - return false; | ||
126 | - } | ||
127 | - | ||
128 | - if (!vfp_access_check(s)) { | ||
129 | - return true; | ||
130 | - } | ||
131 | - | ||
132 | - fpst = fpstatus_ptr(FPST_STD); | ||
133 | - tcg_shift = tcg_const_i32(0); | ||
134 | - tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
135 | - gen_helper_set_neon_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
136 | - for (pass = 0; pass < (a->q ? 4 : 2); pass++) { | ||
137 | - TCGv_i32 tmp = neon_load_reg(a->vm, pass); | ||
138 | - if (is_signed) { | ||
139 | - gen_helper_vfp_tosls(tmp, tmp, tcg_shift, fpst); | ||
140 | - } else { | ||
141 | - gen_helper_vfp_touls(tmp, tmp, tcg_shift, fpst); | ||
142 | - } | ||
143 | - neon_store_reg(a->vd, pass, tmp); | ||
144 | - } | ||
145 | - gen_helper_set_neon_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
146 | - tcg_temp_free_i32(tcg_rmode); | ||
147 | - tcg_temp_free_i32(tcg_shift); | ||
148 | - tcg_temp_free_ptr(fpst); | ||
149 | - | ||
150 | - return true; | ||
151 | -} | ||
152 | - | ||
153 | -#define DO_VCVT(INSN, RMODE, SIGNED) \ | ||
154 | - static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ | ||
155 | - { \ | ||
156 | - return do_vcvt(s, a, RMODE, SIGNED); \ | ||
157 | - } | ||
158 | - | ||
159 | -DO_VCVT(VCVTAU, FPROUNDING_TIEAWAY, false) | ||
160 | -DO_VCVT(VCVTAS, FPROUNDING_TIEAWAY, true) | ||
161 | -DO_VCVT(VCVTNU, FPROUNDING_TIEEVEN, false) | ||
162 | -DO_VCVT(VCVTNS, FPROUNDING_TIEEVEN, true) | ||
163 | -DO_VCVT(VCVTPU, FPROUNDING_POSINF, false) | ||
164 | -DO_VCVT(VCVTPS, FPROUNDING_POSINF, true) | ||
165 | -DO_VCVT(VCVTMU, FPROUNDING_NEGINF, false) | ||
166 | -DO_VCVT(VCVTMS, FPROUNDING_NEGINF, true) | ||
167 | +DO_VEC_RMODE(VCVTAU, FPROUNDING_TIEAWAY, vcvt_rm_u) | ||
168 | +DO_VEC_RMODE(VCVTAS, FPROUNDING_TIEAWAY, vcvt_rm_s) | ||
169 | +DO_VEC_RMODE(VCVTNU, FPROUNDING_TIEEVEN, vcvt_rm_u) | ||
170 | +DO_VEC_RMODE(VCVTNS, FPROUNDING_TIEEVEN, vcvt_rm_s) | ||
171 | +DO_VEC_RMODE(VCVTPU, FPROUNDING_POSINF, vcvt_rm_u) | ||
172 | +DO_VEC_RMODE(VCVTPS, FPROUNDING_POSINF, vcvt_rm_s) | ||
173 | +DO_VEC_RMODE(VCVTMU, FPROUNDING_NEGINF, vcvt_rm_u) | ||
174 | +DO_VEC_RMODE(VCVTMS, FPROUNDING_NEGINF, vcvt_rm_s) | ||
175 | |||
176 | static bool trans_VSWP(DisasContext *s, arg_2misc *a) | ||
177 | { | ||
35 | -- | 178 | -- |
36 | 2.20.1 | 179 | 2.20.1 |
37 | 180 | ||
38 | 181 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | Convert the Neon VRINT-with-specified-rounding-mode insns to gvec, |
---|---|---|---|
2 | and use this to implement the fp16 versions. | ||
2 | 3 | ||
3 | This test boots a Linux kernel on a OrangePi PC board and verify | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | the serial output is working. | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
6 | Message-id: 20200828183354.27913-41-peter.maydell@linaro.org | ||
7 | --- | ||
8 | target/arm/helper.h | 4 +- | ||
9 | target/arm/vec_helper.c | 21 +++++++++++ | ||
10 | target/arm/vfp_helper.c | 17 --------- | ||
11 | target/arm/translate-neon.c.inc | 67 +++------------------------------ | ||
12 | 4 files changed, 30 insertions(+), 79 deletions(-) | ||
5 | 13 | ||
6 | The kernel image and DeviceTree blob are built by the Armbian | 14 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
7 | project (based on Debian): | ||
8 | https://www.armbian.com/orange-pi-pc/ | ||
9 | |||
10 | The cpio image used comes from the linux-build-test project: | ||
11 | https://github.com/groeck/linux-build-test | ||
12 | |||
13 | If ARM is a target being built, "make check-acceptance" will | ||
14 | automatically include this test by the use of the "arch:arm" tags. | ||
15 | |||
16 | Alternatively, this test can be run using: | ||
17 | |||
18 | $ avocado --show=console run -t machine:orangepi-pc tests/acceptance/boot_linux_console.py | ||
19 | console: Uncompressing Linux... done, booting the kernel. | ||
20 | console: Booting Linux on physical CPU 0x0 | ||
21 | console: Linux version 4.20.7-sunxi (root@armbian.com) (gcc version 7.2.1 20171011 (Linaro GCC 7.2-2017.11)) #5.75 SMP Fri Feb 8 09:02:10 CET 2019 | ||
22 | console: CPU: ARMv7 Processor [410fc075] revision 5 (ARMv7), cr=50c5387d | ||
23 | console: CPU: div instructions available: patching division code | ||
24 | console: CPU: PIPT / VIPT nonaliasing data cache, VIPT aliasing instruction cache | ||
25 | console: OF: fdt: Machine model: Xunlong Orange Pi PC | ||
26 | [...] | ||
27 | console: Trying to unpack rootfs image as initramfs... | ||
28 | console: Freeing initrd memory: 3256K | ||
29 | console: Freeing unused kernel memory: 1024K | ||
30 | console: Run /init as init process | ||
31 | console: mount: mounting devtmpfs on /dev failed: Device or resource busy | ||
32 | console: Starting logging: OK | ||
33 | console: Initializing random number generator... random: dd: uninitialized urandom read (512 bytes read) | ||
34 | console: done. | ||
35 | console: Starting network: OK | ||
36 | console: Found console ttyS0 | ||
37 | console: Linux version 4.20.7-sunxi (root@armbian.com) (gcc version 7.2.1 20171011 (Linaro GCC 7.2-2017.11)) #5.75 SMP Fri Feb 8 09:02:10 CET 2019 | ||
38 | console: Boot successful. | ||
39 | console: cat /proc/cpuinfo | ||
40 | console: / # cat /proc/cpuinfo | ||
41 | console: processor : 0 | ||
42 | console: model name : ARMv7 Processor rev 5 (v7l) | ||
43 | console: BogoMIPS : 125.00 | ||
44 | console: Features : half thumb fastmult vfp edsp neon vfpv3 tls vfpv4 idiva idivt vfpd32 lpae evtstrm | ||
45 | console: CPU implementer : 0x41 | ||
46 | console: CPU architecture: 7 | ||
47 | console: CPU variant : 0x0 | ||
48 | console: CPU part : 0xc07 | ||
49 | console: CPU revision : 5 | ||
50 | [...] | ||
51 | console: processor : 3 | ||
52 | console: model name : ARMv7 Processor rev 5 (v7l) | ||
53 | console: BogoMIPS : 125.00 | ||
54 | console: Features : half thumb fastmult vfp edsp neon vfpv3 tls vfpv4 idiva idivt vfpd32 lpae evtstrm | ||
55 | console: CPU implementer : 0x41 | ||
56 | console: CPU architecture: 7 | ||
57 | console: CPU variant : 0x0 | ||
58 | console: CPU part : 0xc07 | ||
59 | console: CPU revision : 5 | ||
60 | console: Hardware : Allwinner sun8i Family | ||
61 | console: Revision : 0000 | ||
62 | console: Serial : 0000000000000000 | ||
63 | console: cat /proc/iomem | ||
64 | console: / # cat /proc/iomem | ||
65 | console: 01000000-010fffff : clock@1000000 | ||
66 | console: 01c00000-01c00fff : system-control@1c00000 | ||
67 | console: 01c02000-01c02fff : dma-controller@1c02000 | ||
68 | [...] | ||
69 | console: reboot | ||
70 | console: / # reboot | ||
71 | console: / # Found console ttyS0 | ||
72 | console: Stopping network: OK | ||
73 | console: hrtimer: interrupt took 21852064 ns | ||
74 | console: Saving random seed... random: dd: uninitialized urandom read (512 bytes read) | ||
75 | console: done. | ||
76 | console: Stopping logging: OK | ||
77 | console: umount: devtmpfs busy - remounted read-only | ||
78 | console: umount: can't unmount /: Invalid argument | ||
79 | console: The system is going down NOW! | ||
80 | console: Sent SIGTERM to all processes | ||
81 | console: Sent SIGKILL to all processes | ||
82 | console: Requesting system reboot | ||
83 | console: reboot: Restarting system | ||
84 | PASS (48.32 s) | ||
85 | JOB TIME : 49.16 s | ||
86 | |||
87 | Signed-off-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
88 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
89 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
90 | Tested-by: Alex Bennée <alex.bennee@linaro.org> | ||
91 | Message-id: 20200311221854.30370-15-nieklinnenbank@gmail.com | ||
92 | [NL: rename in commit message Raspbian to Armbian, remove vm.set_machine()] | ||
93 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
94 | --- | ||
95 | tests/acceptance/boot_linux_console.py | 40 ++++++++++++++++++++++++++ | ||
96 | 1 file changed, 40 insertions(+) | ||
97 | |||
98 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | ||
99 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
100 | --- a/tests/acceptance/boot_linux_console.py | 16 | --- a/target/arm/helper.h |
101 | +++ b/tests/acceptance/boot_linux_console.py | 17 | +++ b/target/arm/helper.h |
102 | @@ -XXX,XX +XXX,XX @@ class BootLinuxConsole(Test): | 18 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_sqtoh, f16, i64, i32, ptr) |
103 | console_pattern = 'Kernel command line: %s' % kernel_command_line | 19 | DEF_HELPER_3(vfp_uqtoh, f16, i64, i32, ptr) |
104 | self.wait_for_console_pattern(console_pattern) | 20 | |
105 | 21 | DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, ptr) | |
106 | + def test_arm_orangepi_initrd(self): | 22 | -DEF_HELPER_FLAGS_2(set_neon_rmode, TCG_CALL_NO_RWG, i32, i32, env) |
107 | + """ | 23 | |
108 | + :avocado: tags=arch:arm | 24 | DEF_HELPER_FLAGS_3(vfp_fcvt_f16_to_f32, TCG_CALL_NO_RWG, f32, f16, ptr, i32) |
109 | + :avocado: tags=machine:orangepi-pc | 25 | DEF_HELPER_FLAGS_3(vfp_fcvt_f32_to_f16, TCG_CALL_NO_RWG, f16, f32, ptr, i32) |
110 | + """ | 26 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_vcvt_rm_us, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
111 | + deb_url = ('https://apt.armbian.com/pool/main/l/' | 27 | DEF_HELPER_FLAGS_4(gvec_vcvt_rm_sh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
112 | + 'linux-4.20.7-sunxi/linux-image-dev-sunxi_5.75_armhf.deb') | 28 | DEF_HELPER_FLAGS_4(gvec_vcvt_rm_uh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
113 | + deb_hash = '1334c29c44d984ffa05ed10de8c3361f33d78315' | 29 | |
114 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | 30 | +DEF_HELPER_FLAGS_4(gvec_vrint_rm_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
115 | + kernel_path = self.extract_from_deb(deb_path, | 31 | +DEF_HELPER_FLAGS_4(gvec_vrint_rm_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
116 | + '/boot/vmlinuz-4.20.7-sunxi') | ||
117 | + dtb_path = '/usr/lib/linux-image-dev-sunxi/sun8i-h3-orangepi-pc.dtb' | ||
118 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | ||
119 | + initrd_url = ('https://github.com/groeck/linux-build-test/raw/' | ||
120 | + '2eb0a73b5d5a28df3170c546ddaaa9757e1e0848/rootfs/' | ||
121 | + 'arm/rootfs-armv7a.cpio.gz') | ||
122 | + initrd_hash = '604b2e45cdf35045846b8bbfbf2129b1891bdc9c' | ||
123 | + initrd_path_gz = self.fetch_asset(initrd_url, asset_hash=initrd_hash) | ||
124 | + initrd_path = os.path.join(self.workdir, 'rootfs.cpio') | ||
125 | + archive.gzip_uncompress(initrd_path_gz, initrd_path) | ||
126 | + | 32 | + |
127 | + self.vm.set_console() | 33 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
128 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | 34 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
129 | + 'console=ttyS0,115200 ' | 35 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
130 | + 'panic=-1 noreboot') | 36 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
131 | + self.vm.add_args('-kernel', kernel_path, | 37 | index XXXXXXX..XXXXXXX 100644 |
132 | + '-dtb', dtb_path, | 38 | --- a/target/arm/vec_helper.c |
133 | + '-initrd', initrd_path, | 39 | +++ b/target/arm/vec_helper.c |
134 | + '-append', kernel_command_line, | 40 | @@ -XXX,XX +XXX,XX @@ DO_VCVT_RMODE(gvec_vcvt_rm_sh, helper_vfp_toshh, uint16_t) |
135 | + '-no-reboot') | 41 | DO_VCVT_RMODE(gvec_vcvt_rm_uh, helper_vfp_touhh, uint16_t) |
136 | + self.vm.launch() | 42 | |
137 | + self.wait_for_console_pattern('Boot successful.') | 43 | #undef DO_VCVT_RMODE |
138 | + | 44 | + |
139 | + exec_command_and_wait_for_pattern(self, 'cat /proc/cpuinfo', | 45 | +#define DO_VRINT_RMODE(NAME, FUNC, TYPE) \ |
140 | + 'Allwinner sun8i Family') | 46 | + void HELPER(NAME)(void *vd, void *vn, void *stat, uint32_t desc) \ |
141 | + exec_command_and_wait_for_pattern(self, 'cat /proc/iomem', | 47 | + { \ |
142 | + 'system-control@1c00000') | 48 | + float_status *fpst = stat; \ |
143 | + exec_command_and_wait_for_pattern(self, 'reboot', | 49 | + intptr_t i, oprsz = simd_oprsz(desc); \ |
144 | + 'reboot: Restarting system') | 50 | + uint32_t rmode = simd_data(desc); \ |
51 | + uint32_t prev_rmode = get_float_rounding_mode(fpst); \ | ||
52 | + TYPE *d = vd, *n = vn; \ | ||
53 | + set_float_rounding_mode(rmode, fpst); \ | ||
54 | + for (i = 0; i < oprsz / sizeof(TYPE); i++) { \ | ||
55 | + d[i] = FUNC(n[i], fpst); \ | ||
56 | + } \ | ||
57 | + set_float_rounding_mode(prev_rmode, fpst); \ | ||
58 | + clear_tail(d, oprsz, simd_maxsz(desc)); \ | ||
59 | + } | ||
145 | + | 60 | + |
146 | def test_s390x_s390_ccw_virtio(self): | 61 | +DO_VRINT_RMODE(gvec_vrint_rm_h, helper_rinth, uint16_t) |
147 | """ | 62 | +DO_VRINT_RMODE(gvec_vrint_rm_s, helper_rints, uint32_t) |
148 | :avocado: tags=arch:s390x | 63 | + |
64 | +#undef DO_VRINT_RMODE | ||
65 | diff --git a/target/arm/vfp_helper.c b/target/arm/vfp_helper.c | ||
66 | index XXXXXXX..XXXXXXX 100644 | ||
67 | --- a/target/arm/vfp_helper.c | ||
68 | +++ b/target/arm/vfp_helper.c | ||
69 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(set_rmode)(uint32_t rmode, void *fpstp) | ||
70 | return prev_rmode; | ||
71 | } | ||
72 | |||
73 | -/* Set the current fp rounding mode in the standard fp status and return | ||
74 | - * the old one. This is for NEON instructions that need to change the | ||
75 | - * rounding mode but wish to use the standard FPSCR values for everything | ||
76 | - * else. Always set the rounding mode back to the correct value after | ||
77 | - * modifying it. | ||
78 | - * The argument is a softfloat float_round_ value. | ||
79 | - */ | ||
80 | -uint32_t HELPER(set_neon_rmode)(uint32_t rmode, CPUARMState *env) | ||
81 | -{ | ||
82 | - float_status *fp_status = &env->vfp.standard_fp_status; | ||
83 | - | ||
84 | - uint32_t prev_rmode = get_float_rounding_mode(fp_status); | ||
85 | - set_float_rounding_mode(rmode, fp_status); | ||
86 | - | ||
87 | - return prev_rmode; | ||
88 | -} | ||
89 | - | ||
90 | /* Half precision conversions. */ | ||
91 | float32 HELPER(vfp_fcvt_f16_to_f32)(uint32_t a, void *fpstp, uint32_t ahp_mode) | ||
92 | { | ||
93 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
94 | index XXXXXXX..XXXXXXX 100644 | ||
95 | --- a/target/arm/translate-neon.c.inc | ||
96 | +++ b/target/arm/translate-neon.c.inc | ||
97 | @@ -XXX,XX +XXX,XX @@ static bool trans_VRINTX(DisasContext *s, arg_2misc *a) | ||
98 | return do_2misc_fp(s, a, gen_helper_rints_exact); | ||
99 | } | ||
100 | |||
101 | -static bool do_vrint(DisasContext *s, arg_2misc *a, int rmode) | ||
102 | -{ | ||
103 | - /* | ||
104 | - * Handle a VRINT* operation by iterating 32 bits at a time, | ||
105 | - * with a specified rounding mode in operation. | ||
106 | - */ | ||
107 | - int pass; | ||
108 | - TCGv_ptr fpst; | ||
109 | - TCGv_i32 tcg_rmode; | ||
110 | - | ||
111 | - if (!arm_dc_feature(s, ARM_FEATURE_NEON) || | ||
112 | - !arm_dc_feature(s, ARM_FEATURE_V8)) { | ||
113 | - return false; | ||
114 | - } | ||
115 | - | ||
116 | - /* UNDEF accesses to D16-D31 if they don't exist. */ | ||
117 | - if (!dc_isar_feature(aa32_simd_r32, s) && | ||
118 | - ((a->vd | a->vm) & 0x10)) { | ||
119 | - return false; | ||
120 | - } | ||
121 | - | ||
122 | - if (a->size != 2) { | ||
123 | - /* TODO: FP16 will be the size == 1 case */ | ||
124 | - return false; | ||
125 | - } | ||
126 | - | ||
127 | - if ((a->vd | a->vm) & a->q) { | ||
128 | - return false; | ||
129 | - } | ||
130 | - | ||
131 | - if (!vfp_access_check(s)) { | ||
132 | - return true; | ||
133 | - } | ||
134 | - | ||
135 | - fpst = fpstatus_ptr(FPST_STD); | ||
136 | - tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
137 | - gen_helper_set_neon_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
138 | - for (pass = 0; pass < (a->q ? 4 : 2); pass++) { | ||
139 | - TCGv_i32 tmp = neon_load_reg(a->vm, pass); | ||
140 | - gen_helper_rints(tmp, tmp, fpst); | ||
141 | - neon_store_reg(a->vd, pass, tmp); | ||
142 | - } | ||
143 | - gen_helper_set_neon_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
144 | - tcg_temp_free_i32(tcg_rmode); | ||
145 | - tcg_temp_free_ptr(fpst); | ||
146 | - | ||
147 | - return true; | ||
148 | -} | ||
149 | - | ||
150 | -#define DO_VRINT(INSN, RMODE) \ | ||
151 | - static bool trans_##INSN(DisasContext *s, arg_2misc *a) \ | ||
152 | - { \ | ||
153 | - return do_vrint(s, a, RMODE); \ | ||
154 | - } | ||
155 | - | ||
156 | -DO_VRINT(VRINTN, FPROUNDING_TIEEVEN) | ||
157 | -DO_VRINT(VRINTA, FPROUNDING_TIEAWAY) | ||
158 | -DO_VRINT(VRINTZ, FPROUNDING_ZERO) | ||
159 | -DO_VRINT(VRINTM, FPROUNDING_NEGINF) | ||
160 | -DO_VRINT(VRINTP, FPROUNDING_POSINF) | ||
161 | - | ||
162 | #define DO_VEC_RMODE(INSN, RMODE, OP) \ | ||
163 | static void gen_##INSN(unsigned vece, uint32_t rd_ofs, \ | ||
164 | uint32_t rm_ofs, \ | ||
165 | @@ -XXX,XX +XXX,XX @@ DO_VEC_RMODE(VCVTPS, FPROUNDING_POSINF, vcvt_rm_s) | ||
166 | DO_VEC_RMODE(VCVTMU, FPROUNDING_NEGINF, vcvt_rm_u) | ||
167 | DO_VEC_RMODE(VCVTMS, FPROUNDING_NEGINF, vcvt_rm_s) | ||
168 | |||
169 | +DO_VEC_RMODE(VRINTN, FPROUNDING_TIEEVEN, vrint_rm_) | ||
170 | +DO_VEC_RMODE(VRINTA, FPROUNDING_TIEAWAY, vrint_rm_) | ||
171 | +DO_VEC_RMODE(VRINTZ, FPROUNDING_ZERO, vrint_rm_) | ||
172 | +DO_VEC_RMODE(VRINTM, FPROUNDING_NEGINF, vrint_rm_) | ||
173 | +DO_VEC_RMODE(VRINTP, FPROUNDING_POSINF, vrint_rm_) | ||
174 | + | ||
175 | static bool trans_VSWP(DisasContext *s, arg_2misc *a) | ||
176 | { | ||
177 | TCGv_i64 rm, rd; | ||
149 | -- | 178 | -- |
150 | 2.20.1 | 179 | 2.20.1 |
151 | 180 | ||
152 | 181 | diff view generated by jsdifflib |
1 | Some of an M-profile CPU's cached hflags state depends on state that's | 1 | Convert the Neon VRINTX insn to use gvec, and use this to implement |
---|---|---|---|
2 | in our NVIC object. We already do an hflags rebuild when the NVIC | 2 | fp16 support for it. |
3 | registers are written, but we also need to do this on NVIC reset, | ||
4 | because there's no guarantee that this will happen before the | ||
5 | CPU reset. | ||
6 | |||
7 | This fixes an assertion due to mismatched hflags which happens if | ||
8 | the CPU is reset from inside a HardFault handler. | ||
9 | 3 | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
12 | Message-id: 20200303174950.3298-2-peter.maydell@linaro.org | 6 | Message-id: 20200828183354.27913-42-peter.maydell@linaro.org |
13 | --- | 7 | --- |
14 | hw/intc/armv7m_nvic.c | 6 ++++++ | 8 | target/arm/helper.h | 3 +++ |
15 | 1 file changed, 6 insertions(+) | 9 | target/arm/vec_helper.c | 3 +++ |
10 | target/arm/translate-neon.c.inc | 45 +++------------------------------ | ||
11 | 3 files changed, 9 insertions(+), 42 deletions(-) | ||
16 | 12 | ||
17 | diff --git a/hw/intc/armv7m_nvic.c b/hw/intc/armv7m_nvic.c | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
18 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/hw/intc/armv7m_nvic.c | 15 | --- a/target/arm/helper.h |
20 | +++ b/hw/intc/armv7m_nvic.c | 16 | +++ b/target/arm/helper.h |
21 | @@ -XXX,XX +XXX,XX @@ static void armv7m_nvic_reset(DeviceState *dev) | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(gvec_vcvt_rm_uh, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
22 | s->itns[i] = true; | 18 | DEF_HELPER_FLAGS_4(gvec_vrint_rm_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
23 | } | 19 | DEF_HELPER_FLAGS_4(gvec_vrint_rm_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) |
20 | |||
21 | +DEF_HELPER_FLAGS_4(gvec_vrintx_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
22 | +DEF_HELPER_FLAGS_4(gvec_vrintx_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
23 | + | ||
24 | DEF_HELPER_FLAGS_4(gvec_frecpe_h, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
25 | DEF_HELPER_FLAGS_4(gvec_frecpe_s, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
26 | DEF_HELPER_FLAGS_4(gvec_frecpe_d, TCG_CALL_NO_RWG, void, ptr, ptr, ptr, i32) | ||
27 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/vec_helper.c | ||
30 | +++ b/target/arm/vec_helper.c | ||
31 | @@ -XXX,XX +XXX,XX @@ DO_2OP(gvec_frsqrte_h, helper_rsqrte_f16, float16) | ||
32 | DO_2OP(gvec_frsqrte_s, helper_rsqrte_f32, float32) | ||
33 | DO_2OP(gvec_frsqrte_d, helper_rsqrte_f64, float64) | ||
34 | |||
35 | +DO_2OP(gvec_vrintx_h, float16_round_to_int, float16) | ||
36 | +DO_2OP(gvec_vrintx_s, float32_round_to_int, float32) | ||
37 | + | ||
38 | DO_2OP(gvec_sitos, helper_vfp_sitos, int32_t) | ||
39 | DO_2OP(gvec_uitos, helper_vfp_uitos, uint32_t) | ||
40 | DO_2OP(gvec_tosizs, helper_vfp_tosizs, float32) | ||
41 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc | ||
42 | index XXXXXXX..XXXXXXX 100644 | ||
43 | --- a/target/arm/translate-neon.c.inc | ||
44 | +++ b/target/arm/translate-neon.c.inc | ||
45 | @@ -XXX,XX +XXX,XX @@ static bool trans_VQNEG(DisasContext *s, arg_2misc *a) | ||
46 | return do_2misc(s, a, fn[a->size]); | ||
47 | } | ||
48 | |||
49 | -static bool do_2misc_fp(DisasContext *s, arg_2misc *a, | ||
50 | - NeonGenOneSingleOpFn *fn) | ||
51 | -{ | ||
52 | - int pass; | ||
53 | - TCGv_ptr fpst; | ||
54 | - | ||
55 | - /* Handle a 2-reg-misc operation by iterating 32 bits at a time */ | ||
56 | - if (!arm_dc_feature(s, ARM_FEATURE_NEON)) { | ||
57 | - return false; | ||
58 | - } | ||
59 | - | ||
60 | - /* UNDEF accesses to D16-D31 if they don't exist. */ | ||
61 | - if (!dc_isar_feature(aa32_simd_r32, s) && | ||
62 | - ((a->vd | a->vm) & 0x10)) { | ||
63 | - return false; | ||
64 | - } | ||
65 | - | ||
66 | - if (a->size != 2) { | ||
67 | - /* TODO: FP16 will be the size == 1 case */ | ||
68 | - return false; | ||
69 | - } | ||
70 | - | ||
71 | - if ((a->vd | a->vm) & a->q) { | ||
72 | - return false; | ||
73 | - } | ||
74 | - | ||
75 | - if (!vfp_access_check(s)) { | ||
76 | - return true; | ||
77 | - } | ||
78 | - | ||
79 | - fpst = fpstatus_ptr(FPST_STD); | ||
80 | - for (pass = 0; pass < (a->q ? 4 : 2); pass++) { | ||
81 | - TCGv_i32 tmp = neon_load_reg(a->vm, pass); | ||
82 | - fn(tmp, tmp, fpst); | ||
83 | - neon_store_reg(a->vd, pass, tmp); | ||
84 | - } | ||
85 | - tcg_temp_free_ptr(fpst); | ||
86 | - | ||
87 | - return true; | ||
88 | -} | ||
89 | - | ||
90 | #define DO_2MISC_FP_VEC(INSN, HFUNC, SFUNC) \ | ||
91 | static void gen_##INSN(unsigned vece, uint32_t rd_ofs, \ | ||
92 | uint32_t rm_ofs, \ | ||
93 | @@ -XXX,XX +XXX,XX @@ DO_2MISC_FP_VEC(VCVT_FU, gen_helper_gvec_ustoh, gen_helper_gvec_uitos) | ||
94 | DO_2MISC_FP_VEC(VCVT_SF, gen_helper_gvec_tosszh, gen_helper_gvec_tosizs) | ||
95 | DO_2MISC_FP_VEC(VCVT_UF, gen_helper_gvec_touszh, gen_helper_gvec_touizs) | ||
96 | |||
97 | +DO_2MISC_FP_VEC(VRINTX_impl, gen_helper_gvec_vrintx_h, gen_helper_gvec_vrintx_s) | ||
98 | + | ||
99 | static bool trans_VRINTX(DisasContext *s, arg_2misc *a) | ||
100 | { | ||
101 | if (!arm_dc_feature(s, ARM_FEATURE_V8)) { | ||
102 | return false; | ||
24 | } | 103 | } |
25 | + | 104 | - return do_2misc_fp(s, a, gen_helper_rints_exact); |
26 | + /* | 105 | + return trans_VRINTX_impl(s, a); |
27 | + * We updated state that affects the CPU's MMUidx and thus its hflags; | ||
28 | + * and we can't guarantee that we run before the CPU reset function. | ||
29 | + */ | ||
30 | + arm_rebuild_hflags(&s->cpu->env); | ||
31 | } | 106 | } |
32 | 107 | ||
33 | static void nvic_systick_trigger(void *opaque, int n, int level) | 108 | #define DO_VEC_RMODE(INSN, RMODE, OP) \ |
34 | -- | 109 | -- |
35 | 2.20.1 | 110 | 2.20.1 |
36 | 111 | ||
37 | 112 | diff view generated by jsdifflib |
1 | From: Philippe Mathieu-Daudé <f4bug@amsat.org> | 1 | In the gvec helper functions for indexed operations, for AArch32 |
---|---|---|---|
2 | Neon the oprsz (total size of the vector) can be less than 16 bytes | ||
3 | if the operation is on a D reg. Since the inner loop in these | ||
4 | helpers always goes from 0 to segment, we must clamp it based | ||
5 | on oprsz to avoid processing a full 16 byte segment when asked to | ||
6 | handle an 8 byte wide vector. | ||
2 | 7 | ||
3 | This test boots a Linux kernel on a OrangePi PC board and verify | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | the serial output is working. | 9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
10 | Message-id: 20200828183354.27913-43-peter.maydell@linaro.org | ||
11 | --- | ||
12 | target/arm/vec_helper.c | 12 ++++++++---- | ||
13 | 1 file changed, 8 insertions(+), 4 deletions(-) | ||
5 | 14 | ||
6 | The kernel image and DeviceTree blob are built by the Armbian | 15 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c |
7 | project (based on Debian): | ||
8 | https://www.armbian.com/orange-pi-pc/ | ||
9 | |||
10 | If ARM is a target being built, "make check-acceptance" will | ||
11 | automatically include this test by the use of the "arch:arm" tags. | ||
12 | |||
13 | Alternatively, this test can be run using: | ||
14 | |||
15 | $ make check-venv | ||
16 | $ ./tests/venv/bin/avocado --show=console,app run -t machine:orangepi-pc tests/acceptance/boot_linux_console.py | ||
17 | JOB ID : 2e4d15eceb13c33672af406f08171e6e9de1414a | ||
18 | JOB LOG : ~/job-results/job-2019-12-17T05.46-2e4d15e/job.log | ||
19 | (1/1) tests/acceptance/boot_linux_console.py:BootLinuxConsole.test_arm_orangepi: | ||
20 | console: Uncompressing Linux... done, booting the kernel. | ||
21 | console: Booting Linux on physical CPU 0x0 | ||
22 | console: Linux version 4.20.7-sunxi (root@armbian.com) (gcc version 7.2.1 20171011 (Linaro GCC 7.2-2017.11)) #5.75 SMP Fri Feb 8 09:02:10 CET 2019 | ||
23 | console: CPU: ARMv7 Processor [410fc075] revision 5 (ARMv7), cr=50c5387d | ||
24 | console: CPU: div instructions available: patching division code | ||
25 | console: CPU: PIPT / VIPT nonaliasing data cache, VIPT aliasing instruction cache | ||
26 | console: OF: fdt: Machine model: Xunlong Orange Pi PC | ||
27 | console: Memory policy: Data cache writealloc | ||
28 | console: OF: reserved mem: failed to allocate memory for node 'cma@4a000000' | ||
29 | console: cma: Failed to reserve 128 MiB | ||
30 | console: psci: probing for conduit method from DT. | ||
31 | console: psci: PSCIv0.2 detected in firmware. | ||
32 | console: psci: Using standard PSCI v0.2 function IDs | ||
33 | console: psci: Trusted OS migration not required | ||
34 | console: random: get_random_bytes called from start_kernel+0x8d/0x3c2 with crng_init=0 | ||
35 | console: percpu: Embedded 18 pages/cpu @(ptrval) s41228 r8192 d24308 u73728 | ||
36 | console: Built 1 zonelists, mobility grouping on. Total pages: 32480 | ||
37 | console: Kernel command line: printk.time=0 console=ttyS0,115200 | ||
38 | PASS (8.59 s) | ||
39 | JOB TIME : 8.81 s | ||
40 | |||
41 | Signed-off-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
42 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | ||
43 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
44 | Tested-by: Alex Bennée <alex.bennee@linaro.org> | ||
45 | Message-id: 20200311221854.30370-14-nieklinnenbank@gmail.com | ||
46 | [NL: rename in commit message Raspbian to Armbian, remove vm.set_machine()] | ||
47 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
48 | --- | ||
49 | tests/acceptance/boot_linux_console.py | 25 +++++++++++++++++++++++++ | ||
50 | 1 file changed, 25 insertions(+) | ||
51 | |||
52 | diff --git a/tests/acceptance/boot_linux_console.py b/tests/acceptance/boot_linux_console.py | ||
53 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
54 | --- a/tests/acceptance/boot_linux_console.py | 17 | --- a/target/arm/vec_helper.c |
55 | +++ b/tests/acceptance/boot_linux_console.py | 18 | +++ b/target/arm/vec_helper.c |
56 | @@ -XXX,XX +XXX,XX @@ class BootLinuxConsole(Test): | 19 | @@ -XXX,XX +XXX,XX @@ DO_MULADD(gvec_vfms_s, float32_mulsub_f, float32) |
57 | exec_command_and_wait_for_pattern(self, 'reboot', | 20 | #define DO_MUL_IDX(NAME, TYPE, H) \ |
58 | 'reboot: Restarting system') | 21 | void HELPER(NAME)(void *vd, void *vn, void *vm, uint32_t desc) \ |
59 | 22 | { \ | |
60 | + def test_arm_orangepi(self): | 23 | - intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \ |
61 | + """ | 24 | + intptr_t i, j, oprsz = simd_oprsz(desc); \ |
62 | + :avocado: tags=arch:arm | 25 | + intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \ |
63 | + :avocado: tags=machine:orangepi-pc | 26 | intptr_t idx = simd_data(desc); \ |
64 | + """ | 27 | TYPE *d = vd, *n = vn, *m = vm; \ |
65 | + deb_url = ('https://apt.armbian.com/pool/main/l/' | 28 | for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \ |
66 | + 'linux-4.20.7-sunxi/linux-image-dev-sunxi_5.75_armhf.deb') | 29 | @@ -XXX,XX +XXX,XX @@ DO_MUL_IDX(gvec_mul_idx_d, uint64_t, ) |
67 | + deb_hash = '1334c29c44d984ffa05ed10de8c3361f33d78315' | 30 | #define DO_MLA_IDX(NAME, TYPE, OP, H) \ |
68 | + deb_path = self.fetch_asset(deb_url, asset_hash=deb_hash) | 31 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *va, uint32_t desc) \ |
69 | + kernel_path = self.extract_from_deb(deb_path, | 32 | { \ |
70 | + '/boot/vmlinuz-4.20.7-sunxi') | 33 | - intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \ |
71 | + dtb_path = '/usr/lib/linux-image-dev-sunxi/sun8i-h3-orangepi-pc.dtb' | 34 | + intptr_t i, j, oprsz = simd_oprsz(desc); \ |
72 | + dtb_path = self.extract_from_deb(deb_path, dtb_path) | 35 | + intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \ |
73 | + | 36 | intptr_t idx = simd_data(desc); \ |
74 | + self.vm.set_console() | 37 | TYPE *d = vd, *n = vn, *m = vm, *a = va; \ |
75 | + kernel_command_line = (self.KERNEL_COMMON_COMMAND_LINE + | 38 | for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \ |
76 | + 'console=ttyS0,115200n8 ' | 39 | @@ -XXX,XX +XXX,XX @@ DO_MLA_IDX(gvec_mls_idx_d, uint64_t, -, ) |
77 | + 'earlycon=uart,mmio32,0x1c28000') | 40 | #define DO_FMUL_IDX(NAME, TYPE, H) \ |
78 | + self.vm.add_args('-kernel', kernel_path, | 41 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ |
79 | + '-dtb', dtb_path, | 42 | { \ |
80 | + '-append', kernel_command_line) | 43 | - intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \ |
81 | + self.vm.launch() | 44 | + intptr_t i, j, oprsz = simd_oprsz(desc); \ |
82 | + console_pattern = 'Kernel command line: %s' % kernel_command_line | 45 | + intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \ |
83 | + self.wait_for_console_pattern(console_pattern) | 46 | intptr_t idx = simd_data(desc); \ |
84 | + | 47 | TYPE *d = vd, *n = vn, *m = vm; \ |
85 | def test_s390x_s390_ccw_virtio(self): | 48 | for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \ |
86 | """ | 49 | @@ -XXX,XX +XXX,XX @@ DO_FMUL_IDX(gvec_fmul_idx_d, float64, ) |
87 | :avocado: tags=arch:s390x | 50 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *va, \ |
51 | void *stat, uint32_t desc) \ | ||
52 | { \ | ||
53 | - intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \ | ||
54 | + intptr_t i, j, oprsz = simd_oprsz(desc); \ | ||
55 | + intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \ | ||
56 | TYPE op1_neg = extract32(desc, SIMD_DATA_SHIFT, 1); \ | ||
57 | intptr_t idx = desc >> (SIMD_DATA_SHIFT + 1); \ | ||
58 | TYPE *d = vd, *n = vn, *m = vm, *a = va; \ | ||
88 | -- | 59 | -- |
89 | 2.20.1 | 60 | 2.20.1 |
90 | 61 | ||
91 | 62 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | Add gvec helpers for doing Neon-style indexed non-fused fp |
---|---|---|---|
2 | multiply-and-accumulate operations. | ||
2 | 3 | ||
3 | We must include the tag in the FAR_ELx register when raising | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | an addressing exception. Which means that we should not clear | 5 | Message-id: 20200828183354.27913-44-peter.maydell@linaro.org |
5 | out the tag during translation. | 6 | --- |
7 | target/arm/helper.h | 10 ++++++++++ | ||
8 | target/arm/vec_helper.c | 27 ++++++++++++++++++++++----- | ||
9 | 2 files changed, 32 insertions(+), 5 deletions(-) | ||
6 | 10 | ||
7 | We cannot at present comply with this for user mode, so we | 11 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
8 | retain the clean_data_tbi function for the moment, though it | ||
9 | no longer does what it says on the tin for system mode. This | ||
10 | function is to be replaced with MTE, so don't worry about the | ||
11 | slight misnaming. | ||
12 | |||
13 | Buglink: https://bugs.launchpad.net/qemu/+bug/1867072 | ||
14 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
15 | Message-id: 20200308012946.16303-3-richard.henderson@linaro.org | ||
16 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
17 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
18 | --- | ||
19 | target/arm/translate-a64.c | 11 +++++++++++ | ||
20 | 1 file changed, 11 insertions(+) | ||
21 | |||
22 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
23 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
24 | --- a/target/arm/translate-a64.c | 13 | --- a/target/arm/helper.h |
25 | +++ b/target/arm/translate-a64.c | 14 | +++ b/target/arm/helper.h |
26 | @@ -XXX,XX +XXX,XX @@ static void gen_a64_set_pc(DisasContext *s, TCGv_i64 src) | 15 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fmul_idx_s, TCG_CALL_NO_RWG, |
27 | static TCGv_i64 clean_data_tbi(DisasContext *s, TCGv_i64 addr) | 16 | DEF_HELPER_FLAGS_5(gvec_fmul_idx_d, TCG_CALL_NO_RWG, |
28 | { | 17 | void, ptr, ptr, ptr, ptr, i32) |
29 | TCGv_i64 clean = new_tmp_a64(s); | 18 | |
30 | + /* | 19 | +DEF_HELPER_FLAGS_5(gvec_fmla_nf_idx_h, TCG_CALL_NO_RWG, |
31 | + * In order to get the correct value in the FAR_ELx register, | 20 | + void, ptr, ptr, ptr, ptr, i32) |
32 | + * we must present the memory subsystem with the "dirty" address | 21 | +DEF_HELPER_FLAGS_5(gvec_fmla_nf_idx_s, TCG_CALL_NO_RWG, |
33 | + * including the TBI. In system mode we can make this work via | 22 | + void, ptr, ptr, ptr, ptr, i32) |
34 | + * the TLB, dropping the TBI during translation. But for user-only | 23 | + |
35 | + * mode we don't have that option, and must remove the top byte now. | 24 | +DEF_HELPER_FLAGS_5(gvec_fmls_nf_idx_h, TCG_CALL_NO_RWG, |
36 | + */ | 25 | + void, ptr, ptr, ptr, ptr, i32) |
37 | +#ifdef CONFIG_USER_ONLY | 26 | +DEF_HELPER_FLAGS_5(gvec_fmls_nf_idx_s, TCG_CALL_NO_RWG, |
38 | gen_top_byte_ignore(s, clean, addr, s->tbid); | 27 | + void, ptr, ptr, ptr, ptr, i32) |
39 | +#else | 28 | + |
40 | + tcg_gen_mov_i64(clean, addr); | 29 | DEF_HELPER_FLAGS_6(gvec_fmla_idx_h, TCG_CALL_NO_RWG, |
41 | +#endif | 30 | void, ptr, ptr, ptr, ptr, ptr, i32) |
42 | return clean; | 31 | DEF_HELPER_FLAGS_6(gvec_fmla_idx_s, TCG_CALL_NO_RWG, |
32 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
33 | index XXXXXXX..XXXXXXX 100644 | ||
34 | --- a/target/arm/vec_helper.c | ||
35 | +++ b/target/arm/vec_helper.c | ||
36 | @@ -XXX,XX +XXX,XX @@ DO_MLA_IDX(gvec_mls_idx_d, uint64_t, -, ) | ||
37 | |||
38 | #undef DO_MLA_IDX | ||
39 | |||
40 | -#define DO_FMUL_IDX(NAME, TYPE, H) \ | ||
41 | +#define DO_FMUL_IDX(NAME, ADD, TYPE, H) \ | ||
42 | void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ | ||
43 | { \ | ||
44 | intptr_t i, j, oprsz = simd_oprsz(desc); \ | ||
45 | @@ -XXX,XX +XXX,XX @@ void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \ | ||
46 | for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \ | ||
47 | TYPE mm = m[H(i + idx)]; \ | ||
48 | for (j = 0; j < segment; j++) { \ | ||
49 | - d[i + j] = TYPE##_mul(n[i + j], mm, stat); \ | ||
50 | + d[i + j] = TYPE##_##ADD(d[i + j], \ | ||
51 | + TYPE##_mul(n[i + j], mm, stat), stat); \ | ||
52 | } \ | ||
53 | } \ | ||
54 | clear_tail(d, oprsz, simd_maxsz(desc)); \ | ||
43 | } | 55 | } |
44 | 56 | ||
57 | -DO_FMUL_IDX(gvec_fmul_idx_h, float16, H2) | ||
58 | -DO_FMUL_IDX(gvec_fmul_idx_s, float32, H4) | ||
59 | -DO_FMUL_IDX(gvec_fmul_idx_d, float64, ) | ||
60 | +#define float16_nop(N, M, S) (M) | ||
61 | +#define float32_nop(N, M, S) (M) | ||
62 | +#define float64_nop(N, M, S) (M) | ||
63 | |||
64 | +DO_FMUL_IDX(gvec_fmul_idx_h, nop, float16, H2) | ||
65 | +DO_FMUL_IDX(gvec_fmul_idx_s, nop, float32, H4) | ||
66 | +DO_FMUL_IDX(gvec_fmul_idx_d, nop, float64, ) | ||
67 | + | ||
68 | +/* | ||
69 | + * Non-fused multiply-accumulate operations, for Neon. NB that unlike | ||
70 | + * the fused ops below they assume accumulate both from and into Vd. | ||
71 | + */ | ||
72 | +DO_FMUL_IDX(gvec_fmla_nf_idx_h, add, float16, H2) | ||
73 | +DO_FMUL_IDX(gvec_fmla_nf_idx_s, add, float32, H4) | ||
74 | +DO_FMUL_IDX(gvec_fmls_nf_idx_h, sub, float16, H2) | ||
75 | +DO_FMUL_IDX(gvec_fmls_nf_idx_s, sub, float32, H4) | ||
76 | + | ||
77 | +#undef float16_nop | ||
78 | +#undef float32_nop | ||
79 | +#undef float64_nop | ||
80 | #undef DO_FMUL_IDX | ||
81 | |||
82 | #define DO_FMLA_IDX(NAME, TYPE, H) \ | ||
45 | -- | 83 | -- |
46 | 2.20.1 | 84 | 2.20.1 |
47 | 85 | ||
48 | 86 | diff view generated by jsdifflib |
1 | From: Cédric Le Goater <clg@kaod.org> | 1 | Convert the Neon floating-point VMUL, VMLA and VMLS to use gvec, |
---|---|---|---|
2 | and use this to implement fp16 support. | ||
2 | 3 | ||
3 | Signed-off-by: Cédric Le Goater <clg@kaod.org> | ||
4 | Reviewed-by: Andrew Jeffery <andrew@aj.id.au> | ||
5 | Reviewed-by: Joel Stanley <joel@jms.id.au> | ||
6 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | ||
7 | Message-id: 20200206112645.21275-2-clg@kaod.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
6 | Message-id: 20200828183354.27913-45-peter.maydell@linaro.org | ||
9 | --- | 7 | --- |
10 | Makefile.objs | 1 + | 8 | target/arm/translate-neon.c.inc | 114 ++++++++++++++++---------------- |
11 | hw/ssi/aspeed_smc.c | 17 +++++++++++++++++ | 9 | 1 file changed, 57 insertions(+), 57 deletions(-) |
12 | hw/ssi/trace-events | 9 +++++++++ | ||
13 | 3 files changed, 27 insertions(+) | ||
14 | create mode 100644 hw/ssi/trace-events | ||
15 | 10 | ||
16 | diff --git a/Makefile.objs b/Makefile.objs | 11 | diff --git a/target/arm/translate-neon.c.inc b/target/arm/translate-neon.c.inc |
17 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/Makefile.objs | 13 | --- a/target/arm/translate-neon.c.inc |
19 | +++ b/Makefile.objs | 14 | +++ b/target/arm/translate-neon.c.inc |
20 | @@ -XXX,XX +XXX,XX @@ trace-events-subdirs += hw/scsi | 15 | @@ -XXX,XX +XXX,XX @@ static bool trans_VMLS_2sc(DisasContext *s, arg_2scalar *a) |
21 | trace-events-subdirs += hw/sd | 16 | return do_2scalar(s, a, opfn[a->size], accfn[a->size]); |
22 | trace-events-subdirs += hw/sparc | 17 | } |
23 | trace-events-subdirs += hw/sparc64 | 18 | |
24 | +trace-events-subdirs += hw/ssi | 19 | -/* |
25 | trace-events-subdirs += hw/timer | 20 | - * Rather than have a float-specific version of do_2scalar just for |
26 | trace-events-subdirs += hw/tpm | 21 | - * three insns, we wrap a NeonGenTwoSingleOpFn to turn it into |
27 | trace-events-subdirs += hw/usb | 22 | - * a NeonGenTwoOpFn. |
28 | diff --git a/hw/ssi/aspeed_smc.c b/hw/ssi/aspeed_smc.c | 23 | - */ |
29 | index XXXXXXX..XXXXXXX 100644 | 24 | -#define WRAP_FP_FN(WRAPNAME, FUNC) \ |
30 | --- a/hw/ssi/aspeed_smc.c | 25 | - static void WRAPNAME(TCGv_i32 rd, TCGv_i32 rn, TCGv_i32 rm) \ |
31 | +++ b/hw/ssi/aspeed_smc.c | 26 | - { \ |
32 | @@ -XXX,XX +XXX,XX @@ | 27 | - TCGv_ptr fpstatus = fpstatus_ptr(FPST_STD); \ |
33 | #include "qapi/error.h" | 28 | - FUNC(rd, rn, rm, fpstatus); \ |
34 | #include "exec/address-spaces.h" | 29 | - tcg_temp_free_ptr(fpstatus); \ |
35 | #include "qemu/units.h" | 30 | +static bool do_2scalar_fp_vec(DisasContext *s, arg_2scalar *a, |
36 | +#include "trace.h" | 31 | + gen_helper_gvec_3_ptr *fn) |
37 | 32 | +{ | |
38 | #include "hw/irq.h" | 33 | + /* Two registers and a scalar, using gvec */ |
39 | #include "hw/qdev-properties.h" | 34 | + int vec_size = a->q ? 16 : 8; |
40 | @@ -XXX,XX +XXX,XX @@ static void aspeed_smc_flash_set_segment(AspeedSMCState *s, int cs, | 35 | + int rd_ofs = neon_reg_offset(a->vd, 0); |
41 | 36 | + int rn_ofs = neon_reg_offset(a->vn, 0); | |
42 | s->ctrl->reg_to_segment(s, new, &seg); | 37 | + int rm_ofs; |
43 | 38 | + int idx; | |
44 | + trace_aspeed_smc_flash_set_segment(cs, new, seg.addr, seg.addr + seg.size); | 39 | + TCGv_ptr fpstatus; |
45 | + | 40 | + |
46 | /* The start address of CS0 is read-only */ | 41 | + if (!arm_dc_feature(s, ARM_FEATURE_NEON)) { |
47 | if (cs == 0 && seg.addr != s->ctrl->flash_window_base) { | 42 | + return false; |
48 | qemu_log_mask(LOG_GUEST_ERROR, | ||
49 | @@ -XXX,XX +XXX,XX @@ static uint64_t aspeed_smc_flash_read(void *opaque, hwaddr addr, unsigned size) | ||
50 | __func__, aspeed_smc_flash_mode(fl)); | ||
51 | } | 43 | } |
52 | 44 | ||
53 | + trace_aspeed_smc_flash_read(fl->id, addr, size, ret, | 45 | -WRAP_FP_FN(gen_VMUL_F_mul, gen_helper_vfp_muls) |
54 | + aspeed_smc_flash_mode(fl)); | 46 | -WRAP_FP_FN(gen_VMUL_F_add, gen_helper_vfp_adds) |
55 | return ret; | 47 | -WRAP_FP_FN(gen_VMUL_F_sub, gen_helper_vfp_subs) |
48 | + /* UNDEF accesses to D16-D31 if they don't exist. */ | ||
49 | + if (!dc_isar_feature(aa32_simd_r32, s) && | ||
50 | + ((a->vd | a->vn | a->vm) & 0x10)) { | ||
51 | + return false; | ||
52 | + } | ||
53 | |||
54 | -static bool trans_VMUL_F_2sc(DisasContext *s, arg_2scalar *a) | ||
55 | -{ | ||
56 | - static NeonGenTwoOpFn * const opfn[] = { | ||
57 | - NULL, | ||
58 | - NULL, /* TODO: fp16 support */ | ||
59 | - gen_VMUL_F_mul, | ||
60 | - NULL, | ||
61 | - }; | ||
62 | + if (!fn) { | ||
63 | + /* Bad size (including size == 3, which is a different insn group) */ | ||
64 | + return false; | ||
65 | + } | ||
66 | |||
67 | - return do_2scalar(s, a, opfn[a->size], NULL); | ||
68 | + if (a->q && ((a->vd | a->vn) & 1)) { | ||
69 | + return false; | ||
70 | + } | ||
71 | + | ||
72 | + if (!vfp_access_check(s)) { | ||
73 | + return true; | ||
74 | + } | ||
75 | + | ||
76 | + /* a->vm is M:Vm, which encodes both register and index */ | ||
77 | + idx = extract32(a->vm, a->size + 2, 2); | ||
78 | + a->vm = extract32(a->vm, 0, a->size + 2); | ||
79 | + rm_ofs = neon_reg_offset(a->vm, 0); | ||
80 | + | ||
81 | + fpstatus = fpstatus_ptr(a->size == 1 ? FPST_STD_F16 : FPST_STD); | ||
82 | + tcg_gen_gvec_3_ptr(rd_ofs, rn_ofs, rm_ofs, fpstatus, | ||
83 | + vec_size, vec_size, idx, fn); | ||
84 | + tcg_temp_free_ptr(fpstatus); | ||
85 | + return true; | ||
56 | } | 86 | } |
57 | 87 | ||
58 | @@ -XXX,XX +XXX,XX @@ static bool aspeed_smc_do_snoop(AspeedSMCFlash *fl, uint64_t data, | 88 | -static bool trans_VMLA_F_2sc(DisasContext *s, arg_2scalar *a) |
59 | AspeedSMCState *s = fl->controller; | 89 | -{ |
60 | uint8_t addr_width = aspeed_smc_flash_is_4byte(fl) ? 4 : 3; | 90 | - static NeonGenTwoOpFn * const opfn[] = { |
61 | 91 | - NULL, | |
62 | + trace_aspeed_smc_do_snoop(fl->id, s->snoop_index, s->snoop_dummies, | 92 | - NULL, /* TODO: fp16 support */ |
63 | + (uint8_t) data & 0xff); | 93 | - gen_VMUL_F_mul, |
64 | + | 94 | - NULL, |
65 | if (s->snoop_index == SNOOP_OFF) { | 95 | - }; |
66 | return false; /* Do nothing */ | 96 | - static NeonGenTwoOpFn * const accfn[] = { |
67 | 97 | - NULL, | |
68 | @@ -XXX,XX +XXX,XX @@ static void aspeed_smc_flash_write(void *opaque, hwaddr addr, uint64_t data, | 98 | - NULL, /* TODO: fp16 support */ |
69 | AspeedSMCState *s = fl->controller; | 99 | - gen_VMUL_F_add, |
70 | int i; | 100 | - NULL, |
71 | 101 | - }; | |
72 | + trace_aspeed_smc_flash_write(fl->id, addr, size, data, | 102 | +#define DO_VMUL_F_2sc(NAME, FUNC) \ |
73 | + aspeed_smc_flash_mode(fl)); | 103 | + static bool trans_##NAME##_F_2sc(DisasContext *s, arg_2scalar *a) \ |
74 | + | 104 | + { \ |
75 | if (!aspeed_smc_is_writable(fl)) { | 105 | + static gen_helper_gvec_3_ptr * const opfn[] = { \ |
76 | qemu_log_mask(LOG_GUEST_ERROR, "%s: flash is not writable at 0x%" | 106 | + NULL, \ |
77 | HWADDR_PRIx "\n", __func__, addr); | 107 | + gen_helper_##FUNC##_h, \ |
78 | @@ -XXX,XX +XXX,XX @@ static uint64_t aspeed_smc_read(void *opaque, hwaddr addr, unsigned int size) | 108 | + gen_helper_##FUNC##_s, \ |
79 | (s->ctrl->has_dma && addr == R_DMA_CHECKSUM) || | 109 | + NULL, \ |
80 | (addr >= R_SEG_ADDR0 && addr < R_SEG_ADDR0 + s->ctrl->max_slaves) || | 110 | + }; \ |
81 | (addr >= s->r_ctrl0 && addr < s->r_ctrl0 + s->ctrl->max_slaves)) { | 111 | + if (a->size == MO_16 && !dc_isar_feature(aa32_fp16_arith, s)) { \ |
82 | + | 112 | + return false; \ |
83 | + trace_aspeed_smc_read(addr, size, s->regs[addr]); | 113 | + } \ |
84 | + | 114 | + return do_2scalar_fp_vec(s, a, opfn[a->size]); \ |
85 | return s->regs[addr]; | 115 | + } |
86 | } else { | 116 | |
87 | qemu_log_mask(LOG_UNIMP, "%s: not implemented: 0x%" HWADDR_PRIx "\n", | 117 | - return do_2scalar(s, a, opfn[a->size], accfn[a->size]); |
88 | @@ -XXX,XX +XXX,XX @@ static void aspeed_smc_dma_checksum(AspeedSMCState *s) | 118 | -} |
89 | __func__, s->regs[R_DMA_FLASH_ADDR]); | 119 | - |
90 | return; | 120 | -static bool trans_VMLS_F_2sc(DisasContext *s, arg_2scalar *a) |
91 | } | 121 | -{ |
92 | + trace_aspeed_smc_dma_checksum(s->regs[R_DMA_FLASH_ADDR], data); | 122 | - static NeonGenTwoOpFn * const opfn[] = { |
93 | 123 | - NULL, | |
94 | /* | 124 | - NULL, /* TODO: fp16 support */ |
95 | * When the DMA is on-going, the DMA registers are updated | 125 | - gen_VMUL_F_mul, |
96 | @@ -XXX,XX +XXX,XX @@ static void aspeed_smc_write(void *opaque, hwaddr addr, uint64_t data, | 126 | - NULL, |
97 | 127 | - }; | |
98 | addr >>= 2; | 128 | - static NeonGenTwoOpFn * const accfn[] = { |
99 | 129 | - NULL, | |
100 | + trace_aspeed_smc_write(addr, size, data); | 130 | - NULL, /* TODO: fp16 support */ |
101 | + | 131 | - gen_VMUL_F_sub, |
102 | if (addr == s->r_conf || | 132 | - NULL, |
103 | (addr >= s->r_timings && | 133 | - }; |
104 | addr < s->r_timings + s->ctrl->nregs_timings) || | 134 | - |
105 | diff --git a/hw/ssi/trace-events b/hw/ssi/trace-events | 135 | - return do_2scalar(s, a, opfn[a->size], accfn[a->size]); |
106 | new file mode 100644 | 136 | -} |
107 | index XXXXXXX..XXXXXXX | 137 | +DO_VMUL_F_2sc(VMUL, gvec_fmul_idx) |
108 | --- /dev/null | 138 | +DO_VMUL_F_2sc(VMLA, gvec_fmla_nf_idx) |
109 | +++ b/hw/ssi/trace-events | 139 | +DO_VMUL_F_2sc(VMLS, gvec_fmls_nf_idx) |
110 | @@ -XXX,XX +XXX,XX @@ | 140 | |
111 | +# aspeed_smc.c | 141 | WRAP_ENV_FN(gen_VQDMULH_16, gen_helper_neon_qdmulh_s16) |
112 | + | 142 | WRAP_ENV_FN(gen_VQDMULH_32, gen_helper_neon_qdmulh_s32) |
113 | +aspeed_smc_flash_set_segment(int cs, uint64_t reg, uint64_t start, uint64_t end) "CS%d segreg=0x%"PRIx64" [ 0x%"PRIx64" - 0x%"PRIx64" ]" | ||
114 | +aspeed_smc_flash_read(int cs, uint64_t addr, uint32_t size, uint64_t data, int mode) "CS%d @0x%" PRIx64 " size %u: 0x%" PRIx64" mode:%d" | ||
115 | +aspeed_smc_do_snoop(int cs, int index, int dummies, int data) "CS%d index:0x%x dummies:%d data:0x%x" | ||
116 | +aspeed_smc_flash_write(int cs, uint64_t addr, uint32_t size, uint64_t data, int mode) "CS%d @0x%" PRIx64 " size %u: 0x%" PRIx64" mode:%d" | ||
117 | +aspeed_smc_read(uint64_t addr, uint32_t size, uint64_t data) "@0x%" PRIx64 " size %u: 0x%" PRIx64 | ||
118 | +aspeed_smc_dma_checksum(uint32_t addr, uint32_t data) "0x%08x: 0x%08x" | ||
119 | +aspeed_smc_write(uint64_t addr, uint32_t size, uint64_t data) "@0x%" PRIx64 " size %u: 0x%" PRIx64 | ||
120 | -- | 143 | -- |
121 | 2.20.1 | 144 | 2.20.1 |
122 | 145 | ||
123 | 146 | diff view generated by jsdifflib |
1 | For M-profile CPUs, the FAULTMASK value affects the CPU's MMU index | 1 | Set the MVFR1 ID register FPHP and SIMDHP fields to indicate |
---|---|---|---|
2 | (it changes the NegPri bit). We update the hflags after calls | 2 | that our "-cpu max" has v8.2-FP16. |
3 | to the v7m_msr helper in trans_MSR_v7m() but forgot to do so | ||
4 | in trans_CPS_v7m(). | ||
5 | 3 | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20200303174950.3298-3-peter.maydell@linaro.org | 6 | Message-id: 20200828183354.27913-46-peter.maydell@linaro.org |
9 | --- | 7 | --- |
10 | target/arm/translate.c | 5 ++++- | 8 | target/arm/cpu.c | 3 ++- |
11 | 1 file changed, 4 insertions(+), 1 deletion(-) | 9 | target/arm/cpu64.c | 10 ++++------ |
10 | 2 files changed, 6 insertions(+), 7 deletions(-) | ||
12 | 11 | ||
13 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 12 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c |
14 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/translate.c | 14 | --- a/target/arm/cpu.c |
16 | +++ b/target/arm/translate.c | 15 | +++ b/target/arm/cpu.c |
17 | @@ -XXX,XX +XXX,XX @@ static bool trans_CPS(DisasContext *s, arg_CPS *a) | 16 | @@ -XXX,XX +XXX,XX @@ static void arm_max_initfn(Object *obj) |
18 | 17 | cpu->isar.id_isar6 = t; | |
19 | static bool trans_CPS_v7m(DisasContext *s, arg_CPS_v7m *a) | 18 | |
20 | { | 19 | t = cpu->isar.mvfr1; |
21 | - TCGv_i32 tmp, addr; | 20 | - t = FIELD_DP32(t, MVFR1, FPHP, 2); /* v8.0 FP support */ |
22 | + TCGv_i32 tmp, addr, el; | 21 | + t = FIELD_DP32(t, MVFR1, FPHP, 3); /* v8.2-FP16 */ |
23 | 22 | + t = FIELD_DP32(t, MVFR1, SIMDHP, 2); /* v8.2-FP16 */ | |
24 | if (!arm_dc_feature(s, ARM_FEATURE_M)) { | 23 | cpu->isar.mvfr1 = t; |
25 | return false; | 24 | |
26 | @@ -XXX,XX +XXX,XX @@ static bool trans_CPS_v7m(DisasContext *s, arg_CPS_v7m *a) | 25 | t = cpu->isar.mvfr2; |
27 | gen_helper_v7m_msr(cpu_env, addr, tmp); | 26 | diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c |
28 | tcg_temp_free_i32(addr); | 27 | index XXXXXXX..XXXXXXX 100644 |
29 | } | 28 | --- a/target/arm/cpu64.c |
30 | + el = tcg_const_i32(s->current_el); | 29 | +++ b/target/arm/cpu64.c |
31 | + gen_helper_rebuild_hflags_m32(cpu_env, el); | 30 | @@ -XXX,XX +XXX,XX @@ static void aarch64_max_initfn(Object *obj) |
32 | + tcg_temp_free_i32(el); | 31 | u = FIELD_DP32(u, ID_DFR0, PERFMON, 5); /* v8.4-PMU */ |
33 | tcg_temp_free_i32(tmp); | 32 | cpu->isar.id_dfr0 = u; |
34 | gen_lookup_tb(s); | 33 | |
35 | return true; | 34 | - /* |
35 | - * FIXME: We do not yet support ARMv8.2-fp16 for AArch32 yet, | ||
36 | - * so do not set MVFR1.FPHP. Strictly speaking this is not legal, | ||
37 | - * but it is also not legal to enable SVE without support for FP16, | ||
38 | - * and enabling SVE in system mode is more useful in the short term. | ||
39 | - */ | ||
40 | + u = cpu->isar.mvfr1; | ||
41 | + u = FIELD_DP32(u, MVFR1, FPHP, 3); /* v8.2-FP16 */ | ||
42 | + u = FIELD_DP32(u, MVFR1, SIMDHP, 2); /* v8.2-FP16 */ | ||
43 | + cpu->isar.mvfr1 = u; | ||
44 | |||
45 | #ifdef CONFIG_USER_ONLY | ||
46 | /* For usermode -cpu max we can use a larger and more efficient DCZ | ||
36 | -- | 47 | -- |
37 | 2.20.1 | 48 | 2.20.1 |
38 | 49 | ||
39 | 50 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | From: Leif Lindholm <leif@nuviainc.com> |
---|---|---|---|
2 | 2 | ||
3 | The Allwinner H3 System on Chip contains multiple USB 2.0 bus | 3 | The sbsa-ref platform uses a minimal device tree to pass amount of memory |
4 | connections which provide software access using the Enhanced | 4 | as well as number of cpus to the firmware. However, when dumping that |
5 | Host Controller Interface (EHCI) and Open Host Controller | 5 | minimal dtb (with -M sbsa-virt,dumpdtb=<file>), the resulting blob |
6 | Interface (OHCI) interfaces. This commit adds support for | 6 | generates a warning when decompiled by dtc due to lack of reg property. |
7 | both interfaces in the Allwinner H3 System on Chip. | ||
8 | 7 | ||
9 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 8 | Add a simple reg property per cpu, representing a 64-bit MPIDR_EL1. |
10 | Reviewed-by: Gerd Hoffmann <kraxel@redhat.com> | 9 | |
11 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | 10 | This also ends up being cleaner than having the firmware calculating its |
12 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | 11 | own IDs for generating APCI. |
13 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | 12 | |
14 | Message-id: 20200311221854.30370-5-nieklinnenbank@gmail.com | 13 | Signed-off-by: Leif Lindholm <leif@nuviainc.com> |
14 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
15 | Message-id: 20200827124335.30586-1-leif@nuviainc.com | ||
15 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 16 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
16 | --- | 17 | --- |
17 | hw/usb/hcd-ehci.h | 1 + | 18 | hw/arm/sbsa-ref.c | 29 +++++++++++++++++++++++------ |
18 | include/hw/arm/allwinner-h3.h | 8 +++++++ | 19 | 1 file changed, 23 insertions(+), 6 deletions(-) |
19 | hw/arm/allwinner-h3.c | 44 +++++++++++++++++++++++++++++++++++ | ||
20 | hw/usb/hcd-ehci-sysbus.c | 17 ++++++++++++++ | ||
21 | hw/arm/Kconfig | 2 ++ | ||
22 | 5 files changed, 72 insertions(+) | ||
23 | 20 | ||
24 | diff --git a/hw/usb/hcd-ehci.h b/hw/usb/hcd-ehci.h | 21 | diff --git a/hw/arm/sbsa-ref.c b/hw/arm/sbsa-ref.c |
25 | index XXXXXXX..XXXXXXX 100644 | 22 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/hw/usb/hcd-ehci.h | 23 | --- a/hw/arm/sbsa-ref.c |
27 | +++ b/hw/usb/hcd-ehci.h | 24 | +++ b/hw/arm/sbsa-ref.c |
28 | @@ -XXX,XX +XXX,XX @@ typedef struct EHCIPCIState { | 25 | @@ -XXX,XX +XXX,XX @@ static const int sbsa_ref_irqmap[] = { |
29 | #define TYPE_SYS_BUS_EHCI "sysbus-ehci-usb" | 26 | [SBSA_EHCI] = 11, |
30 | #define TYPE_PLATFORM_EHCI "platform-ehci-usb" | ||
31 | #define TYPE_EXYNOS4210_EHCI "exynos4210-ehci-usb" | ||
32 | +#define TYPE_AW_H3_EHCI "aw-h3-ehci-usb" | ||
33 | #define TYPE_TEGRA2_EHCI "tegra2-ehci-usb" | ||
34 | #define TYPE_PPC4xx_EHCI "ppc4xx-ehci-usb" | ||
35 | #define TYPE_FUSBH200_EHCI "fusbh200-ehci-usb" | ||
36 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | ||
37 | index XXXXXXX..XXXXXXX 100644 | ||
38 | --- a/include/hw/arm/allwinner-h3.h | ||
39 | +++ b/include/hw/arm/allwinner-h3.h | ||
40 | @@ -XXX,XX +XXX,XX @@ enum { | ||
41 | AW_H3_SRAM_A1, | ||
42 | AW_H3_SRAM_A2, | ||
43 | AW_H3_SRAM_C, | ||
44 | + AW_H3_EHCI0, | ||
45 | + AW_H3_OHCI0, | ||
46 | + AW_H3_EHCI1, | ||
47 | + AW_H3_OHCI1, | ||
48 | + AW_H3_EHCI2, | ||
49 | + AW_H3_OHCI2, | ||
50 | + AW_H3_EHCI3, | ||
51 | + AW_H3_OHCI3, | ||
52 | AW_H3_CCU, | ||
53 | AW_H3_PIT, | ||
54 | AW_H3_UART0, | ||
55 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
56 | index XXXXXXX..XXXXXXX 100644 | ||
57 | --- a/hw/arm/allwinner-h3.c | ||
58 | +++ b/hw/arm/allwinner-h3.c | ||
59 | @@ -XXX,XX +XXX,XX @@ | ||
60 | #include "hw/sysbus.h" | ||
61 | #include "hw/char/serial.h" | ||
62 | #include "hw/misc/unimp.h" | ||
63 | +#include "hw/usb/hcd-ehci.h" | ||
64 | #include "sysemu/sysemu.h" | ||
65 | #include "hw/arm/allwinner-h3.h" | ||
66 | |||
67 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
68 | [AW_H3_SRAM_A1] = 0x00000000, | ||
69 | [AW_H3_SRAM_A2] = 0x00044000, | ||
70 | [AW_H3_SRAM_C] = 0x00010000, | ||
71 | + [AW_H3_EHCI0] = 0x01c1a000, | ||
72 | + [AW_H3_OHCI0] = 0x01c1a400, | ||
73 | + [AW_H3_EHCI1] = 0x01c1b000, | ||
74 | + [AW_H3_OHCI1] = 0x01c1b400, | ||
75 | + [AW_H3_EHCI2] = 0x01c1c000, | ||
76 | + [AW_H3_OHCI2] = 0x01c1c400, | ||
77 | + [AW_H3_EHCI3] = 0x01c1d000, | ||
78 | + [AW_H3_OHCI3] = 0x01c1d400, | ||
79 | [AW_H3_CCU] = 0x01c20000, | ||
80 | [AW_H3_PIT] = 0x01c20c00, | ||
81 | [AW_H3_UART0] = 0x01c28000, | ||
82 | @@ -XXX,XX +XXX,XX @@ enum { | ||
83 | AW_H3_GIC_SPI_UART3 = 3, | ||
84 | AW_H3_GIC_SPI_TIMER0 = 18, | ||
85 | AW_H3_GIC_SPI_TIMER1 = 19, | ||
86 | + AW_H3_GIC_SPI_EHCI0 = 72, | ||
87 | + AW_H3_GIC_SPI_OHCI0 = 73, | ||
88 | + AW_H3_GIC_SPI_EHCI1 = 74, | ||
89 | + AW_H3_GIC_SPI_OHCI1 = 75, | ||
90 | + AW_H3_GIC_SPI_EHCI2 = 76, | ||
91 | + AW_H3_GIC_SPI_OHCI2 = 77, | ||
92 | + AW_H3_GIC_SPI_EHCI3 = 78, | ||
93 | + AW_H3_GIC_SPI_OHCI3 = 79, | ||
94 | }; | 27 | }; |
95 | 28 | ||
96 | /* Allwinner H3 general constants */ | 29 | +static uint64_t sbsa_ref_cpu_mp_affinity(SBSAMachineState *sms, int idx) |
97 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
98 | qdev_init_nofail(DEVICE(&s->ccu)); | ||
99 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->ccu), 0, s->memmap[AW_H3_CCU]); | ||
100 | |||
101 | + /* Universal Serial Bus */ | ||
102 | + sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
103 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
104 | + AW_H3_GIC_SPI_EHCI0)); | ||
105 | + sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI1], | ||
106 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
107 | + AW_H3_GIC_SPI_EHCI1)); | ||
108 | + sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI2], | ||
109 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
110 | + AW_H3_GIC_SPI_EHCI2)); | ||
111 | + sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI3], | ||
112 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
113 | + AW_H3_GIC_SPI_EHCI3)); | ||
114 | + | ||
115 | + sysbus_create_simple("sysbus-ohci", s->memmap[AW_H3_OHCI0], | ||
116 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
117 | + AW_H3_GIC_SPI_OHCI0)); | ||
118 | + sysbus_create_simple("sysbus-ohci", s->memmap[AW_H3_OHCI1], | ||
119 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
120 | + AW_H3_GIC_SPI_OHCI1)); | ||
121 | + sysbus_create_simple("sysbus-ohci", s->memmap[AW_H3_OHCI2], | ||
122 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
123 | + AW_H3_GIC_SPI_OHCI2)); | ||
124 | + sysbus_create_simple("sysbus-ohci", s->memmap[AW_H3_OHCI3], | ||
125 | + qdev_get_gpio_in(DEVICE(&s->gic), | ||
126 | + AW_H3_GIC_SPI_OHCI3)); | ||
127 | + | ||
128 | /* UART0. For future clocktree API: All UARTS are connected to APB2_CLK. */ | ||
129 | serial_mm_init(get_system_memory(), s->memmap[AW_H3_UART0], 2, | ||
130 | qdev_get_gpio_in(DEVICE(&s->gic), AW_H3_GIC_SPI_UART0), | ||
131 | diff --git a/hw/usb/hcd-ehci-sysbus.c b/hw/usb/hcd-ehci-sysbus.c | ||
132 | index XXXXXXX..XXXXXXX 100644 | ||
133 | --- a/hw/usb/hcd-ehci-sysbus.c | ||
134 | +++ b/hw/usb/hcd-ehci-sysbus.c | ||
135 | @@ -XXX,XX +XXX,XX @@ static const TypeInfo ehci_exynos4210_type_info = { | ||
136 | .class_init = ehci_exynos4210_class_init, | ||
137 | }; | ||
138 | |||
139 | +static void ehci_aw_h3_class_init(ObjectClass *oc, void *data) | ||
140 | +{ | 30 | +{ |
141 | + SysBusEHCIClass *sec = SYS_BUS_EHCI_CLASS(oc); | 31 | + uint8_t clustersz = ARM_DEFAULT_CPUS_PER_CLUSTER; |
142 | + DeviceClass *dc = DEVICE_CLASS(oc); | 32 | + return arm_cpu_mp_affinity(idx, clustersz); |
143 | + | ||
144 | + sec->capsbase = 0x0; | ||
145 | + sec->opregbase = 0x10; | ||
146 | + set_bit(DEVICE_CATEGORY_USB, dc->categories); | ||
147 | +} | 33 | +} |
148 | + | 34 | + |
149 | +static const TypeInfo ehci_aw_h3_type_info = { | 35 | /* |
150 | + .name = TYPE_AW_H3_EHCI, | 36 | * Firmware on this machine only uses ACPI table to load OS, these limited |
151 | + .parent = TYPE_SYS_BUS_EHCI, | 37 | * device tree nodes are just to let firmware know the info which varies from |
152 | + .class_init = ehci_aw_h3_class_init, | 38 | @@ -XXX,XX +XXX,XX @@ static void create_fdt(SBSAMachineState *sms) |
153 | +}; | 39 | g_free(matrix); |
154 | + | 40 | } |
155 | static void ehci_tegra2_class_init(ObjectClass *oc, void *data) | 41 | |
42 | + /* | ||
43 | + * From Documentation/devicetree/bindings/arm/cpus.yaml | ||
44 | + * On ARM v8 64-bit systems this property is required | ||
45 | + * and matches the MPIDR_EL1 register affinity bits. | ||
46 | + * | ||
47 | + * * If cpus node's #address-cells property is set to 2 | ||
48 | + * | ||
49 | + * The first reg cell bits [7:0] must be set to | ||
50 | + * bits [39:32] of MPIDR_EL1. | ||
51 | + * | ||
52 | + * The second reg cell bits [23:0] must be set to | ||
53 | + * bits [23:0] of MPIDR_EL1. | ||
54 | + */ | ||
55 | qemu_fdt_add_subnode(sms->fdt, "/cpus"); | ||
56 | + qemu_fdt_setprop_cell(sms->fdt, "/cpus", "#address-cells", 2); | ||
57 | + qemu_fdt_setprop_cell(sms->fdt, "/cpus", "#size-cells", 0x0); | ||
58 | |||
59 | for (cpu = sms->smp_cpus - 1; cpu >= 0; cpu--) { | ||
60 | char *nodename = g_strdup_printf("/cpus/cpu@%d", cpu); | ||
61 | ARMCPU *armcpu = ARM_CPU(qemu_get_cpu(cpu)); | ||
62 | CPUState *cs = CPU(armcpu); | ||
63 | + uint64_t mpidr = sbsa_ref_cpu_mp_affinity(sms, cpu); | ||
64 | |||
65 | qemu_fdt_add_subnode(sms->fdt, nodename); | ||
66 | + qemu_fdt_setprop_u64(sms->fdt, nodename, "reg", mpidr); | ||
67 | |||
68 | if (ms->possible_cpus->cpus[cs->cpu_index].props.has_node_id) { | ||
69 | qemu_fdt_setprop_cell(sms->fdt, nodename, "numa-node-id", | ||
70 | @@ -XXX,XX +XXX,XX @@ static void sbsa_ref_init(MachineState *machine) | ||
71 | arm_load_kernel(ARM_CPU(first_cpu), machine, &sms->bootinfo); | ||
72 | } | ||
73 | |||
74 | -static uint64_t sbsa_ref_cpu_mp_affinity(SBSAMachineState *sms, int idx) | ||
75 | -{ | ||
76 | - uint8_t clustersz = ARM_DEFAULT_CPUS_PER_CLUSTER; | ||
77 | - return arm_cpu_mp_affinity(idx, clustersz); | ||
78 | -} | ||
79 | - | ||
80 | static const CPUArchIdList *sbsa_ref_possible_cpu_arch_ids(MachineState *ms) | ||
156 | { | 81 | { |
157 | SysBusEHCIClass *sec = SYS_BUS_EHCI_CLASS(oc); | 82 | unsigned int max_cpus = ms->smp.max_cpus; |
158 | @@ -XXX,XX +XXX,XX @@ static void ehci_sysbus_register_types(void) | ||
159 | type_register_static(&ehci_type_info); | ||
160 | type_register_static(&ehci_platform_type_info); | ||
161 | type_register_static(&ehci_exynos4210_type_info); | ||
162 | + type_register_static(&ehci_aw_h3_type_info); | ||
163 | type_register_static(&ehci_tegra2_type_info); | ||
164 | type_register_static(&ehci_ppc4xx_type_info); | ||
165 | type_register_static(&ehci_fusbh200_type_info); | ||
166 | diff --git a/hw/arm/Kconfig b/hw/arm/Kconfig | ||
167 | index XXXXXXX..XXXXXXX 100644 | ||
168 | --- a/hw/arm/Kconfig | ||
169 | +++ b/hw/arm/Kconfig | ||
170 | @@ -XXX,XX +XXX,XX @@ config ALLWINNER_H3 | ||
171 | select ARM_TIMER | ||
172 | select ARM_GIC | ||
173 | select UNIMP | ||
174 | + select USB_OHCI | ||
175 | + select USB_EHCI_SYSBUS | ||
176 | |||
177 | config RASPI | ||
178 | bool | ||
179 | -- | 83 | -- |
180 | 2.20.1 | 84 | 2.20.1 |
181 | 85 | ||
182 | 86 | diff view generated by jsdifflib |
1 | From: Niek Linnenbank <nieklinnenbank@gmail.com> | 1 | From: Graeme Gregory <graeme@nuviainc.com> |
---|---|---|---|
2 | 2 | ||
3 | The Allwinner H3 System on Chip has an System Control | 3 | A difference between sbsa platform and the virt platform is PSCI is |
4 | module that provides system wide generic controls and | 4 | handled by ARM-TF in the sbsa platform. This means that the PSCI code |
5 | device information. This commit adds support for the | 5 | there needs to communicate some of the platform power changes down |
6 | Allwinner H3 System Control module. | 6 | to the qemu code for things like shutdown/reset control. |
7 | 7 | ||
8 | Signed-off-by: Niek Linnenbank <nieklinnenbank@gmail.com> | 8 | Space has been left to extend the EC if we find other use cases in |
9 | Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com> | 9 | future where ARM-TF and qemu need to communicate. |
10 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | 10 | |
11 | Tested-by: Philippe Mathieu-Daudé <philmd@redhat.com> | 11 | Signed-off-by: Graeme Gregory <graeme@nuviainc.com> |
12 | Message-id: 20200311221854.30370-6-nieklinnenbank@gmail.com | 12 | Reviewed-by: Leif Lindholm <leif@nuviainc.com> |
13 | Tested-by: Leif Lindholm <leif@nuviainc.com> | ||
14 | Message-id: 20200826141952.136164-2-graeme@nuviainc.com | ||
15 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 16 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
14 | --- | 17 | --- |
15 | hw/misc/Makefile.objs | 1 + | 18 | hw/misc/sbsa_ec.c | 98 +++++++++++++++++++++++++++++++++++++++++++++ |
16 | include/hw/arm/allwinner-h3.h | 3 + | 19 | hw/misc/meson.build | 2 + |
17 | include/hw/misc/allwinner-h3-sysctrl.h | 67 ++++++++++++ | 20 | 2 files changed, 100 insertions(+) |
18 | hw/arm/allwinner-h3.c | 9 +- | 21 | create mode 100644 hw/misc/sbsa_ec.c |
19 | hw/misc/allwinner-h3-sysctrl.c | 140 +++++++++++++++++++++++++ | ||
20 | 5 files changed, 219 insertions(+), 1 deletion(-) | ||
21 | create mode 100644 include/hw/misc/allwinner-h3-sysctrl.h | ||
22 | create mode 100644 hw/misc/allwinner-h3-sysctrl.c | ||
23 | 22 | ||
24 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | 23 | diff --git a/hw/misc/sbsa_ec.c b/hw/misc/sbsa_ec.c |
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/hw/misc/Makefile.objs | ||
27 | +++ b/hw/misc/Makefile.objs | ||
28 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_MACIO) += macio/ | ||
29 | common-obj-$(CONFIG_IVSHMEM_DEVICE) += ivshmem.o | ||
30 | |||
31 | common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-ccu.o | ||
32 | +common-obj-$(CONFIG_ALLWINNER_H3) += allwinner-h3-sysctrl.o | ||
33 | common-obj-$(CONFIG_REALVIEW) += arm_sysctl.o | ||
34 | common-obj-$(CONFIG_NSERIES) += cbus.o | ||
35 | common-obj-$(CONFIG_ECCMEMCTL) += eccmemctl.o | ||
36 | diff --git a/include/hw/arm/allwinner-h3.h b/include/hw/arm/allwinner-h3.h | ||
37 | index XXXXXXX..XXXXXXX 100644 | ||
38 | --- a/include/hw/arm/allwinner-h3.h | ||
39 | +++ b/include/hw/arm/allwinner-h3.h | ||
40 | @@ -XXX,XX +XXX,XX @@ | ||
41 | #include "hw/timer/allwinner-a10-pit.h" | ||
42 | #include "hw/intc/arm_gic.h" | ||
43 | #include "hw/misc/allwinner-h3-ccu.h" | ||
44 | +#include "hw/misc/allwinner-h3-sysctrl.h" | ||
45 | #include "target/arm/cpu.h" | ||
46 | |||
47 | /** | ||
48 | @@ -XXX,XX +XXX,XX @@ enum { | ||
49 | AW_H3_SRAM_A1, | ||
50 | AW_H3_SRAM_A2, | ||
51 | AW_H3_SRAM_C, | ||
52 | + AW_H3_SYSCTRL, | ||
53 | AW_H3_EHCI0, | ||
54 | AW_H3_OHCI0, | ||
55 | AW_H3_EHCI1, | ||
56 | @@ -XXX,XX +XXX,XX @@ typedef struct AwH3State { | ||
57 | const hwaddr *memmap; | ||
58 | AwA10PITState timer; | ||
59 | AwH3ClockCtlState ccu; | ||
60 | + AwH3SysCtrlState sysctrl; | ||
61 | GICState gic; | ||
62 | MemoryRegion sram_a1; | ||
63 | MemoryRegion sram_a2; | ||
64 | diff --git a/include/hw/misc/allwinner-h3-sysctrl.h b/include/hw/misc/allwinner-h3-sysctrl.h | ||
65 | new file mode 100644 | 24 | new file mode 100644 |
66 | index XXXXXXX..XXXXXXX | 25 | index XXXXXXX..XXXXXXX |
67 | --- /dev/null | 26 | --- /dev/null |
68 | +++ b/include/hw/misc/allwinner-h3-sysctrl.h | 27 | +++ b/hw/misc/sbsa_ec.c |
69 | @@ -XXX,XX +XXX,XX @@ | 28 | @@ -XXX,XX +XXX,XX @@ |
70 | +/* | 29 | +/* |
71 | + * Allwinner H3 System Control emulation | 30 | + * ARM SBSA Reference Platform Embedded Controller |
72 | + * | 31 | + * |
73 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | 32 | + * A device to allow PSCI running in the secure side of sbsa-ref machine |
33 | + * to communicate platform power states to qemu. | ||
74 | + * | 34 | + * |
75 | + * This program is free software: you can redistribute it and/or modify | 35 | + * Copyright (c) 2020 Nuvia Inc |
76 | + * it under the terms of the GNU General Public License as published by | 36 | + * Written by Graeme Gregory <graeme@nuviainc.com> |
77 | + * the Free Software Foundation, either version 2 of the License, or | ||
78 | + * (at your option) any later version. | ||
79 | + * | 37 | + * |
80 | + * This program is distributed in the hope that it will be useful, | 38 | + * SPDX-License-Identifer: GPL-2.0-or-later |
81 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
82 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
83 | + * GNU General Public License for more details. | ||
84 | + * | ||
85 | + * You should have received a copy of the GNU General Public License | ||
86 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
87 | + */ | ||
88 | + | ||
89 | +#ifndef HW_MISC_ALLWINNER_H3_SYSCTRL_H | ||
90 | +#define HW_MISC_ALLWINNER_H3_SYSCTRL_H | ||
91 | + | ||
92 | +#include "qom/object.h" | ||
93 | +#include "hw/sysbus.h" | ||
94 | + | ||
95 | +/** | ||
96 | + * @name Constants | ||
97 | + * @{ | ||
98 | + */ | ||
99 | + | ||
100 | +/** Highest register address used by System Control device */ | ||
101 | +#define AW_H3_SYSCTRL_REGS_MAXADDR (0x30) | ||
102 | + | ||
103 | +/** Total number of known registers */ | ||
104 | +#define AW_H3_SYSCTRL_REGS_NUM ((AW_H3_SYSCTRL_REGS_MAXADDR / \ | ||
105 | + sizeof(uint32_t)) + 1) | ||
106 | + | ||
107 | +/** @} */ | ||
108 | + | ||
109 | +/** | ||
110 | + * @name Object model | ||
111 | + * @{ | ||
112 | + */ | ||
113 | + | ||
114 | +#define TYPE_AW_H3_SYSCTRL "allwinner-h3-sysctrl" | ||
115 | +#define AW_H3_SYSCTRL(obj) \ | ||
116 | + OBJECT_CHECK(AwH3SysCtrlState, (obj), TYPE_AW_H3_SYSCTRL) | ||
117 | + | ||
118 | +/** @} */ | ||
119 | + | ||
120 | +/** | ||
121 | + * Allwinner H3 System Control object instance state | ||
122 | + */ | ||
123 | +typedef struct AwH3SysCtrlState { | ||
124 | + /*< private >*/ | ||
125 | + SysBusDevice parent_obj; | ||
126 | + /*< public >*/ | ||
127 | + | ||
128 | + /** Maps I/O registers in physical memory */ | ||
129 | + MemoryRegion iomem; | ||
130 | + | ||
131 | + /** Array of hardware registers */ | ||
132 | + uint32_t regs[AW_H3_SYSCTRL_REGS_NUM]; | ||
133 | + | ||
134 | +} AwH3SysCtrlState; | ||
135 | + | ||
136 | +#endif /* HW_MISC_ALLWINNER_H3_SYSCTRL_H */ | ||
137 | diff --git a/hw/arm/allwinner-h3.c b/hw/arm/allwinner-h3.c | ||
138 | index XXXXXXX..XXXXXXX 100644 | ||
139 | --- a/hw/arm/allwinner-h3.c | ||
140 | +++ b/hw/arm/allwinner-h3.c | ||
141 | @@ -XXX,XX +XXX,XX @@ const hwaddr allwinner_h3_memmap[] = { | ||
142 | [AW_H3_SRAM_A1] = 0x00000000, | ||
143 | [AW_H3_SRAM_A2] = 0x00044000, | ||
144 | [AW_H3_SRAM_C] = 0x00010000, | ||
145 | + [AW_H3_SYSCTRL] = 0x01c00000, | ||
146 | [AW_H3_EHCI0] = 0x01c1a000, | ||
147 | [AW_H3_OHCI0] = 0x01c1a400, | ||
148 | [AW_H3_EHCI1] = 0x01c1b000, | ||
149 | @@ -XXX,XX +XXX,XX @@ struct AwH3Unimplemented { | ||
150 | } unimplemented[] = { | ||
151 | { "d-engine", 0x01000000, 4 * MiB }, | ||
152 | { "d-inter", 0x01400000, 128 * KiB }, | ||
153 | - { "syscon", 0x01c00000, 4 * KiB }, | ||
154 | { "dma", 0x01c02000, 4 * KiB }, | ||
155 | { "nfdc", 0x01c03000, 4 * KiB }, | ||
156 | { "ts", 0x01c06000, 4 * KiB }, | ||
157 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_init(Object *obj) | ||
158 | |||
159 | sysbus_init_child_obj(obj, "ccu", &s->ccu, sizeof(s->ccu), | ||
160 | TYPE_AW_H3_CCU); | ||
161 | + | ||
162 | + sysbus_init_child_obj(obj, "sysctrl", &s->sysctrl, sizeof(s->sysctrl), | ||
163 | + TYPE_AW_H3_SYSCTRL); | ||
164 | } | ||
165 | |||
166 | static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
167 | @@ -XXX,XX +XXX,XX @@ static void allwinner_h3_realize(DeviceState *dev, Error **errp) | ||
168 | qdev_init_nofail(DEVICE(&s->ccu)); | ||
169 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->ccu), 0, s->memmap[AW_H3_CCU]); | ||
170 | |||
171 | + /* System Control */ | ||
172 | + qdev_init_nofail(DEVICE(&s->sysctrl)); | ||
173 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->sysctrl), 0, s->memmap[AW_H3_SYSCTRL]); | ||
174 | + | ||
175 | /* Universal Serial Bus */ | ||
176 | sysbus_create_simple(TYPE_AW_H3_EHCI, s->memmap[AW_H3_EHCI0], | ||
177 | qdev_get_gpio_in(DEVICE(&s->gic), | ||
178 | diff --git a/hw/misc/allwinner-h3-sysctrl.c b/hw/misc/allwinner-h3-sysctrl.c | ||
179 | new file mode 100644 | ||
180 | index XXXXXXX..XXXXXXX | ||
181 | --- /dev/null | ||
182 | +++ b/hw/misc/allwinner-h3-sysctrl.c | ||
183 | @@ -XXX,XX +XXX,XX @@ | ||
184 | +/* | ||
185 | + * Allwinner H3 System Control emulation | ||
186 | + * | ||
187 | + * Copyright (C) 2019 Niek Linnenbank <nieklinnenbank@gmail.com> | ||
188 | + * | ||
189 | + * This program is free software: you can redistribute it and/or modify | ||
190 | + * it under the terms of the GNU General Public License as published by | ||
191 | + * the Free Software Foundation, either version 2 of the License, or | ||
192 | + * (at your option) any later version. | ||
193 | + * | ||
194 | + * This program is distributed in the hope that it will be useful, | ||
195 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
196 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
197 | + * GNU General Public License for more details. | ||
198 | + * | ||
199 | + * You should have received a copy of the GNU General Public License | ||
200 | + * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
201 | + */ | 39 | + */ |
202 | + | 40 | + |
203 | +#include "qemu/osdep.h" | 41 | +#include "qemu/osdep.h" |
204 | +#include "qemu/units.h" | 42 | +#include "qemu-common.h" |
43 | +#include "qemu/log.h" | ||
205 | +#include "hw/sysbus.h" | 44 | +#include "hw/sysbus.h" |
206 | +#include "migration/vmstate.h" | 45 | +#include "sysemu/runstate.h" |
207 | +#include "qemu/log.h" | ||
208 | +#include "qemu/module.h" | ||
209 | +#include "hw/misc/allwinner-h3-sysctrl.h" | ||
210 | + | 46 | + |
211 | +/* System Control register offsets */ | 47 | +typedef struct { |
212 | +enum { | 48 | + SysBusDevice parent_obj; |
213 | + REG_VER = 0x24, /* Version */ | 49 | + MemoryRegion iomem; |
214 | + REG_EMAC_PHY_CLK = 0x30, /* EMAC PHY Clock */ | 50 | +} SECUREECState; |
51 | + | ||
52 | +#define TYPE_SBSA_EC "sbsa-ec" | ||
53 | +#define SECURE_EC(obj) OBJECT_CHECK(SECUREECState, (obj), TYPE_SBSA_EC) | ||
54 | + | ||
55 | +enum sbsa_ec_powerstates { | ||
56 | + SBSA_EC_CMD_POWEROFF = 0x01, | ||
57 | + SBSA_EC_CMD_REBOOT = 0x02, | ||
215 | +}; | 58 | +}; |
216 | + | 59 | + |
217 | +#define REG_INDEX(offset) (offset / sizeof(uint32_t)) | 60 | +static uint64_t sbsa_ec_read(void *opaque, hwaddr offset, unsigned size) |
218 | + | ||
219 | +/* System Control register reset values */ | ||
220 | +enum { | ||
221 | + REG_VER_RST = 0x0, | ||
222 | + REG_EMAC_PHY_CLK_RST = 0x58000, | ||
223 | +}; | ||
224 | + | ||
225 | +static uint64_t allwinner_h3_sysctrl_read(void *opaque, hwaddr offset, | ||
226 | + unsigned size) | ||
227 | +{ | 61 | +{ |
228 | + const AwH3SysCtrlState *s = AW_H3_SYSCTRL(opaque); | 62 | + /* No use for this currently */ |
229 | + const uint32_t idx = REG_INDEX(offset); | 63 | + qemu_log_mask(LOG_GUEST_ERROR, "sbsa-ec: no readable registers"); |
230 | + | 64 | + return 0; |
231 | + if (idx >= AW_H3_SYSCTRL_REGS_NUM) { | ||
232 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | ||
233 | + __func__, (uint32_t)offset); | ||
234 | + return 0; | ||
235 | + } | ||
236 | + | ||
237 | + return s->regs[idx]; | ||
238 | +} | 65 | +} |
239 | + | 66 | + |
240 | +static void allwinner_h3_sysctrl_write(void *opaque, hwaddr offset, | 67 | +static void sbsa_ec_write(void *opaque, hwaddr offset, |
241 | + uint64_t val, unsigned size) | 68 | + uint64_t value, unsigned size) |
242 | +{ | 69 | +{ |
243 | + AwH3SysCtrlState *s = AW_H3_SYSCTRL(opaque); | 70 | + if (offset == 0) { /* PSCI machine power command register */ |
244 | + const uint32_t idx = REG_INDEX(offset); | 71 | + switch (value) { |
245 | + | 72 | + case SBSA_EC_CMD_POWEROFF: |
246 | + if (idx >= AW_H3_SYSCTRL_REGS_NUM) { | 73 | + qemu_system_shutdown_request(SHUTDOWN_CAUSE_GUEST_SHUTDOWN); |
247 | + qemu_log_mask(LOG_GUEST_ERROR, "%s: out-of-bounds offset 0x%04x\n", | 74 | + break; |
248 | + __func__, (uint32_t)offset); | 75 | + case SBSA_EC_CMD_REBOOT: |
249 | + return; | 76 | + qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_RESET); |
250 | + } | 77 | + break; |
251 | + | 78 | + default: |
252 | + switch (offset) { | 79 | + qemu_log_mask(LOG_GUEST_ERROR, |
253 | + case REG_VER: /* Version */ | 80 | + "sbsa-ec: unknown power command"); |
254 | + break; | 81 | + } |
255 | + default: | 82 | + } else { |
256 | + s->regs[idx] = (uint32_t) val; | 83 | + qemu_log_mask(LOG_GUEST_ERROR, "sbsa-ec: unknown EC register"); |
257 | + break; | ||
258 | + } | 84 | + } |
259 | +} | 85 | +} |
260 | + | 86 | + |
261 | +static const MemoryRegionOps allwinner_h3_sysctrl_ops = { | 87 | +static const MemoryRegionOps sbsa_ec_ops = { |
262 | + .read = allwinner_h3_sysctrl_read, | 88 | + .read = sbsa_ec_read, |
263 | + .write = allwinner_h3_sysctrl_write, | 89 | + .write = sbsa_ec_write, |
264 | + .endianness = DEVICE_NATIVE_ENDIAN, | 90 | + .endianness = DEVICE_NATIVE_ENDIAN, |
265 | + .valid = { | 91 | + .valid.min_access_size = 4, |
266 | + .min_access_size = 4, | 92 | + .valid.max_access_size = 4, |
267 | + .max_access_size = 4, | ||
268 | + }, | ||
269 | + .impl.min_access_size = 4, | ||
270 | +}; | 93 | +}; |
271 | + | 94 | + |
272 | +static void allwinner_h3_sysctrl_reset(DeviceState *dev) | 95 | +static void sbsa_ec_init(Object *obj) |
273 | +{ | 96 | +{ |
274 | + AwH3SysCtrlState *s = AW_H3_SYSCTRL(dev); | 97 | + SECUREECState *s = SECURE_EC(obj); |
98 | + SysBusDevice *dev = SYS_BUS_DEVICE(obj); | ||
275 | + | 99 | + |
276 | + /* Set default values for registers */ | 100 | + memory_region_init_io(&s->iomem, obj, &sbsa_ec_ops, s, "sbsa-ec", |
277 | + s->regs[REG_INDEX(REG_VER)] = REG_VER_RST; | 101 | + 0x1000); |
278 | + s->regs[REG_INDEX(REG_EMAC_PHY_CLK)] = REG_EMAC_PHY_CLK_RST; | 102 | + sysbus_init_mmio(dev, &s->iomem); |
279 | +} | 103 | +} |
280 | + | 104 | + |
281 | +static void allwinner_h3_sysctrl_init(Object *obj) | 105 | +static void sbsa_ec_class_init(ObjectClass *klass, void *data) |
282 | +{ | ||
283 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
284 | + AwH3SysCtrlState *s = AW_H3_SYSCTRL(obj); | ||
285 | + | ||
286 | + /* Memory mapping */ | ||
287 | + memory_region_init_io(&s->iomem, OBJECT(s), &allwinner_h3_sysctrl_ops, s, | ||
288 | + TYPE_AW_H3_SYSCTRL, 4 * KiB); | ||
289 | + sysbus_init_mmio(sbd, &s->iomem); | ||
290 | +} | ||
291 | + | ||
292 | +static const VMStateDescription allwinner_h3_sysctrl_vmstate = { | ||
293 | + .name = "allwinner-h3-sysctrl", | ||
294 | + .version_id = 1, | ||
295 | + .minimum_version_id = 1, | ||
296 | + .fields = (VMStateField[]) { | ||
297 | + VMSTATE_UINT32_ARRAY(regs, AwH3SysCtrlState, AW_H3_SYSCTRL_REGS_NUM), | ||
298 | + VMSTATE_END_OF_LIST() | ||
299 | + } | ||
300 | +}; | ||
301 | + | ||
302 | +static void allwinner_h3_sysctrl_class_init(ObjectClass *klass, void *data) | ||
303 | +{ | 106 | +{ |
304 | + DeviceClass *dc = DEVICE_CLASS(klass); | 107 | + DeviceClass *dc = DEVICE_CLASS(klass); |
305 | + | 108 | + |
306 | + dc->reset = allwinner_h3_sysctrl_reset; | 109 | + /* No vmstate or reset required: device has no internal state */ |
307 | + dc->vmsd = &allwinner_h3_sysctrl_vmstate; | 110 | + dc->user_creatable = false; |
308 | +} | 111 | +} |
309 | + | 112 | + |
310 | +static const TypeInfo allwinner_h3_sysctrl_info = { | 113 | +static const TypeInfo sbsa_ec_info = { |
311 | + .name = TYPE_AW_H3_SYSCTRL, | 114 | + .name = TYPE_SBSA_EC, |
312 | + .parent = TYPE_SYS_BUS_DEVICE, | 115 | + .parent = TYPE_SYS_BUS_DEVICE, |
313 | + .instance_init = allwinner_h3_sysctrl_init, | 116 | + .instance_size = sizeof(SECUREECState), |
314 | + .instance_size = sizeof(AwH3SysCtrlState), | 117 | + .instance_init = sbsa_ec_init, |
315 | + .class_init = allwinner_h3_sysctrl_class_init, | 118 | + .class_init = sbsa_ec_class_init, |
316 | +}; | 119 | +}; |
317 | + | 120 | + |
318 | +static void allwinner_h3_sysctrl_register(void) | 121 | +static void sbsa_ec_register_type(void) |
319 | +{ | 122 | +{ |
320 | + type_register_static(&allwinner_h3_sysctrl_info); | 123 | + type_register_static(&sbsa_ec_info); |
321 | +} | 124 | +} |
322 | + | 125 | + |
323 | +type_init(allwinner_h3_sysctrl_register) | 126 | +type_init(sbsa_ec_register_type); |
127 | diff --git a/hw/misc/meson.build b/hw/misc/meson.build | ||
128 | index XXXXXXX..XXXXXXX 100644 | ||
129 | --- a/hw/misc/meson.build | ||
130 | +++ b/hw/misc/meson.build | ||
131 | @@ -XXX,XX +XXX,XX @@ specific_ss.add(when: 'CONFIG_MAC_VIA', if_true: files('mac_via.c')) | ||
132 | |||
133 | specific_ss.add(when: 'CONFIG_MIPS_CPS', if_true: files('mips_cmgcr.c', 'mips_cpc.c')) | ||
134 | specific_ss.add(when: 'CONFIG_MIPS_ITU', if_true: files('mips_itu.c')) | ||
135 | + | ||
136 | +specific_ss.add(when: 'CONFIG_SBSA_REF', if_true: files('sbsa_ec.c')) | ||
324 | -- | 137 | -- |
325 | 2.20.1 | 138 | 2.20.1 |
326 | 139 | ||
327 | 140 | diff view generated by jsdifflib |
1 | From: Richard Henderson <richard.henderson@linaro.org> | 1 | From: Graeme Gregory <graeme@nuviainc.com> |
---|---|---|---|
2 | 2 | ||
3 | We fail to validate the upper bits of a virtual address on a | 3 | Add the previously created sbsa-ec device to the sbsa-ref machine in |
4 | translation disabled regime, as per AArch64.TranslateAddressS1Off. | 4 | secure memory so the PSCI implementation in ARM-TF can access it, but |
5 | not expose it to non secure firmware or OS except by via ARM-TF. | ||
5 | 6 | ||
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Signed-off-by: Graeme Gregory <graeme@nuviainc.com> |
7 | Message-id: 20200308012946.16303-2-richard.henderson@linaro.org | 8 | Reviewed-by: Leif Lindholm <leif@nuviainc.com> |
9 | Tested-by: Leif Lindholm <leif@nuviainc.com> | ||
10 | Message-id: 20200826141952.136164-3-graeme@nuviainc.com | ||
8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 11 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 13 | --- |
11 | target/arm/helper.c | 35 ++++++++++++++++++++++++++++++++++- | 14 | hw/arm/sbsa-ref.c | 14 ++++++++++++++ |
12 | 1 file changed, 34 insertions(+), 1 deletion(-) | 15 | 1 file changed, 14 insertions(+) |
13 | 16 | ||
14 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 17 | diff --git a/hw/arm/sbsa-ref.c b/hw/arm/sbsa-ref.c |
15 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/helper.c | 19 | --- a/hw/arm/sbsa-ref.c |
17 | +++ b/target/arm/helper.c | 20 | +++ b/hw/arm/sbsa-ref.c |
18 | @@ -XXX,XX +XXX,XX @@ bool get_phys_addr(CPUARMState *env, target_ulong address, | 21 | @@ -XXX,XX +XXX,XX @@ enum { |
19 | /* Definitely a real MMU, not an MPU */ | 22 | SBSA_CPUPERIPHS, |
20 | 23 | SBSA_GIC_DIST, | |
21 | if (regime_translation_disabled(env, mmu_idx)) { | 24 | SBSA_GIC_REDIST, |
22 | - /* MMU disabled. */ | 25 | + SBSA_SECURE_EC, |
23 | + /* | 26 | SBSA_SMMU, |
24 | + * MMU disabled. S1 addresses within aa64 translation regimes are | 27 | SBSA_UART, |
25 | + * still checked for bounds -- see AArch64.TranslateAddressS1Off. | 28 | SBSA_RTC, |
26 | + */ | 29 | @@ -XXX,XX +XXX,XX @@ static const MemMapEntry sbsa_ref_memmap[] = { |
27 | + if (mmu_idx != ARMMMUIdx_Stage2) { | 30 | [SBSA_CPUPERIPHS] = { 0x40000000, 0x00040000 }, |
28 | + int r_el = regime_el(env, mmu_idx); | 31 | [SBSA_GIC_DIST] = { 0x40060000, 0x00010000 }, |
29 | + if (arm_el_is_aa64(env, r_el)) { | 32 | [SBSA_GIC_REDIST] = { 0x40080000, 0x04000000 }, |
30 | + int pamax = arm_pamax(env_archcpu(env)); | 33 | + [SBSA_SECURE_EC] = { 0x50000000, 0x00001000 }, |
31 | + uint64_t tcr = env->cp15.tcr_el[r_el].raw_tcr; | 34 | [SBSA_UART] = { 0x60000000, 0x00001000 }, |
32 | + int addrtop, tbi; | 35 | [SBSA_RTC] = { 0x60010000, 0x00001000 }, |
36 | [SBSA_GPIO] = { 0x60020000, 0x00001000 }, | ||
37 | @@ -XXX,XX +XXX,XX @@ static void *sbsa_ref_dtb(const struct arm_boot_info *binfo, int *fdt_size) | ||
38 | return board->fdt; | ||
39 | } | ||
40 | |||
41 | +static void create_secure_ec(MemoryRegion *mem) | ||
42 | +{ | ||
43 | + hwaddr base = sbsa_ref_memmap[SBSA_SECURE_EC].base; | ||
44 | + DeviceState *dev = qdev_new("sbsa-ec"); | ||
45 | + SysBusDevice *s = SYS_BUS_DEVICE(dev); | ||
33 | + | 46 | + |
34 | + tbi = aa64_va_parameter_tbi(tcr, mmu_idx); | 47 | + memory_region_add_subregion(mem, base, |
35 | + if (access_type == MMU_INST_FETCH) { | 48 | + sysbus_mmio_get_region(s, 0)); |
36 | + tbi &= ~aa64_va_parameter_tbid(tcr, mmu_idx); | 49 | +} |
37 | + } | ||
38 | + tbi = (tbi >> extract64(address, 55, 1)) & 1; | ||
39 | + addrtop = (tbi ? 55 : 63); | ||
40 | + | 50 | + |
41 | + if (extract64(address, pamax, addrtop - pamax + 1) != 0) { | 51 | static void sbsa_ref_init(MachineState *machine) |
42 | + fi->type = ARMFault_AddressSize; | 52 | { |
43 | + fi->level = 0; | 53 | unsigned int smp_cpus = machine->smp.cpus; |
44 | + fi->stage2 = false; | 54 | @@ -XXX,XX +XXX,XX @@ static void sbsa_ref_init(MachineState *machine) |
45 | + return 1; | 55 | |
46 | + } | 56 | create_pcie(sms); |
57 | |||
58 | + create_secure_ec(secure_sysmem); | ||
47 | + | 59 | + |
48 | + /* | 60 | sms->bootinfo.ram_size = machine->ram_size; |
49 | + * When TBI is disabled, we've just validated that all of the | 61 | sms->bootinfo.nb_cpus = smp_cpus; |
50 | + * bits above PAMax are zero, so logically we only need to | 62 | sms->bootinfo.board_id = -1; |
51 | + * clear the top byte for TBI. But it's clearer to follow | ||
52 | + * the pseudocode set of addrdesc.paddress. | ||
53 | + */ | ||
54 | + address = extract64(address, 0, 52); | ||
55 | + } | ||
56 | + } | ||
57 | *phys_ptr = address; | ||
58 | *prot = PAGE_READ | PAGE_WRITE | PAGE_EXEC; | ||
59 | *page_size = TARGET_PAGE_SIZE; | ||
60 | -- | 63 | -- |
61 | 2.20.1 | 64 | 2.20.1 |
62 | 65 | ||
63 | 66 | diff view generated by jsdifflib |