1 | Arm queue -- I have more stuff pending but I prefer to push | 1 | Second pull request of the week; mostly RTH's support for some |
---|---|---|---|
2 | this first lot out and keep the pull below 50 patches. | 2 | new-in-v8.1/v8.3 instructions, and my v8M board model. |
3 | Most of this is Alex's FP16 support work. | ||
4 | 3 | ||
4 | thanks | ||
5 | -- PMM | 5 | -- PMM |
6 | 6 | ||
7 | The following changes since commit 427cbc7e4136a061628cb4315cc8182ea36d772f: | ||
7 | 8 | ||
8 | The following changes since commit 6697439794f72b3501ee16bb95d16854f9981421: | 9 | Merge remote-tracking branch 'remotes/mst/tags/for_upstream' into staging (2018-03-01 18:46:41 +0000) |
9 | |||
10 | Merge remote-tracking branch 'remotes/kraxel/tags/usb-20180227-pull-request' into staging (2018-02-27 17:50:46 +0000) | ||
11 | 10 | ||
12 | are available in the Git repository at: | 11 | are available in the Git repository at: |
13 | 12 | ||
14 | git://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20180301 | 13 | git://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20180302 |
15 | 14 | ||
16 | for you to fetch changes up to c22e580c2ad1cccef582e1490e732f254d4ac064: | 15 | for you to fetch changes up to e66a67bf28e1b4fce2e3d72a2610dbd48d9d3078: |
17 | 16 | ||
18 | MAINTAINERS: Update my email address (2018-03-01 11:13:59 +0000) | 17 | target/arm: Enable ARM_FEATURE_V8_FCMA (2018-03-02 11:03:45 +0000) |
19 | 18 | ||
20 | ---------------------------------------------------------------- | 19 | ---------------------------------------------------------------- |
21 | target-arm queue: | 20 | target-arm queue: |
22 | * update MAINTAINERS for Alistair's new email address | 21 | * implement FCMA and RDM v8.1 and v8.3 instructions |
23 | * add Arm v8.2 FP16 arithmetic extension for linux-user | 22 | * enable Cortex-M33 v8M core, and provide new mps2-an505 board model |
24 | * implement display connector emulation for vexpress board | 23 | that uses it |
25 | * xilinx_spips: Enable only two slaves when reading/writing with stripe | 24 | * decodetree: Propagate return value from translate subroutines |
26 | * xilinx_spips: Use 8 dummy cycles with the QIOR/QIOR4 commands | 25 | * xlnx-zynqmp: Implement the RTC device |
27 | * hw: register: Run post_write hook on reset | ||
28 | 26 | ||
29 | ---------------------------------------------------------------- | 27 | ---------------------------------------------------------------- |
30 | Alex Bennée (31): | 28 | Alistair Francis (3): |
31 | include/exec/helper-head.h: support f16 in helper calls | 29 | xlnx-zynqmp-rtc: Initial commit |
32 | target/arm/cpu64: introduce ARM_V8_FP16 feature bit | 30 | xlnx-zynqmp-rtc: Add basic time support |
33 | target/arm/cpu.h: update comment for half-precision values | 31 | xlnx-zynqmp: Connect the RTC device |
34 | target/arm/cpu.h: add additional float_status flags | ||
35 | target/arm/helper: pass explicit fpst to set_rmode | ||
36 | arm/translate-a64: implement half-precision F(MIN|MAX)(V|NMV) | ||
37 | arm/translate-a64: handle_3same_64 comment fix | ||
38 | arm/translate-a64: initial decode for simd_three_reg_same_fp16 | ||
39 | arm/translate-a64: add FP16 FADD/FABD/FSUB/FMUL/FDIV to simd_three_reg_same_fp16 | ||
40 | arm/translate-a64: add FP16 F[A]C[EQ/GE/GT] to simd_three_reg_same_fp16 | ||
41 | arm/translate-a64: add FP16 FMULA/X/S to simd_three_reg_same_fp16 | ||
42 | arm/translate-a64: add FP16 FR[ECP/SQRT]S to simd_three_reg_same_fp16 | ||
43 | arm/translate-a64: add FP16 pairwise ops simd_three_reg_same_fp16 | ||
44 | arm/translate-a64: add FP16 FMULX/MLS/FMLA to simd_indexed | ||
45 | arm/translate-a64: add FP16 x2 ops for simd_indexed | ||
46 | arm/translate-a64: initial decode for simd_two_reg_misc_fp16 | ||
47 | arm/translate-a64: add FP16 FPRINTx to simd_two_reg_misc_fp16 | ||
48 | arm/translate-a64: add FCVTxx to simd_two_reg_misc_fp16 | ||
49 | arm/translate-a64: add FP16 FCMxx (zero) to simd_two_reg_misc_fp16 | ||
50 | arm/translate-a64: add FP16 SCVTF/UCVFT to simd_two_reg_misc_fp16 | ||
51 | arm/translate-a64: add FP16 FNEG/FABS to simd_two_reg_misc_fp16 | ||
52 | arm/helper.c: re-factor recpe and add recepe_f16 | ||
53 | arm/translate-a64: add FP16 FRECPE | ||
54 | arm/translate-a64: add FP16 FRCPX to simd_two_reg_misc_fp16 | ||
55 | arm/translate-a64: add FP16 FSQRT to simd_two_reg_misc_fp16 | ||
56 | arm/helper.c: re-factor rsqrte and add rsqrte_f16 | ||
57 | arm/translate-a64: add FP16 FRSQRTE to simd_two_reg_misc_fp16 | ||
58 | arm/translate-a64: add FP16 FMOV to simd_mod_imm | ||
59 | arm/translate-a64: add all FP16 ops in simd_scalar_pairwise | ||
60 | arm/translate-a64: implement simd_scalar_three_reg_same_fp16 | ||
61 | arm/translate-a64: add all single op FP16 to handle_fp_1src_half | ||
62 | 32 | ||
63 | Alistair Francis (2): | 33 | Peter Maydell (19): |
64 | hw: register: Run post_write hook on reset | 34 | loader: Add new load_ramdisk_as() |
65 | MAINTAINERS: Update my email address | 35 | hw/arm/boot: Honour CPU's address space for image loads |
36 | hw/arm/armv7m: Honour CPU's address space for image loads | ||
37 | target/arm: Define an IDAU interface | ||
38 | armv7m: Forward idau property to CPU object | ||
39 | target/arm: Define init-svtor property for the reset secure VTOR value | ||
40 | armv7m: Forward init-svtor property to CPU object | ||
41 | target/arm: Add Cortex-M33 | ||
42 | hw/misc/unimp: Move struct to header file | ||
43 | include/hw/or-irq.h: Add missing include guard | ||
44 | qdev: Add new qdev_init_gpio_in_named_with_opaque() | ||
45 | hw/core/split-irq: Device that splits IRQ lines | ||
46 | hw/misc/mps2-fpgaio: FPGA control block for MPS2 AN505 | ||
47 | hw/misc/tz-ppc: Model TrustZone peripheral protection controller | ||
48 | hw/misc/iotkit-secctl: Arm IoT Kit security controller initial skeleton | ||
49 | hw/misc/iotkit-secctl: Add handling for PPCs | ||
50 | hw/misc/iotkit-secctl: Add remaining simple registers | ||
51 | hw/arm/iotkit: Model Arm IOT Kit | ||
52 | mps2-an505: New board model: MPS2 with AN505 Cortex-M33 FPGA image | ||
66 | 53 | ||
67 | Corey Minyard (2): | 54 | Richard Henderson (17): |
68 | i2c: Fix some brace style issues | 55 | decodetree: Propagate return value from translate subroutines |
69 | i2c: Move the bus class to i2c.h | 56 | target/arm: Add ARM_FEATURE_V8_RDM |
57 | target/arm: Refactor disas_simd_indexed decode | ||
58 | target/arm: Refactor disas_simd_indexed size checks | ||
59 | target/arm: Decode aa64 armv8.1 scalar three same extra | ||
60 | target/arm: Decode aa64 armv8.1 three same extra | ||
61 | target/arm: Decode aa64 armv8.1 scalar/vector x indexed element | ||
62 | target/arm: Decode aa32 armv8.1 three same | ||
63 | target/arm: Decode aa32 armv8.1 two reg and a scalar | ||
64 | target/arm: Enable ARM_FEATURE_V8_RDM | ||
65 | target/arm: Add ARM_FEATURE_V8_FCMA | ||
66 | target/arm: Decode aa64 armv8.3 fcadd | ||
67 | target/arm: Decode aa64 armv8.3 fcmla | ||
68 | target/arm: Decode aa32 armv8.3 3-same | ||
69 | target/arm: Decode aa32 armv8.3 2-reg-index | ||
70 | target/arm: Decode t32 simd 3reg and 2reg_scalar extension | ||
71 | target/arm: Enable ARM_FEATURE_V8_FCMA | ||
70 | 72 | ||
71 | Francisco Iglesias (2): | 73 | hw/arm/Makefile.objs | 2 + |
72 | xilinx_spips: Enable only two slaves when reading/writing with stripe | 74 | hw/core/Makefile.objs | 1 + |
73 | xilinx_spips: Use 8 dummy cycles with the QIOR/QIOR4 commands | 75 | hw/misc/Makefile.objs | 4 + |
76 | hw/timer/Makefile.objs | 1 + | ||
77 | target/arm/Makefile.objs | 2 +- | ||
78 | include/hw/arm/armv7m.h | 5 + | ||
79 | include/hw/arm/iotkit.h | 109 ++++++ | ||
80 | include/hw/arm/xlnx-zynqmp.h | 2 + | ||
81 | include/hw/core/split-irq.h | 57 +++ | ||
82 | include/hw/irq.h | 4 +- | ||
83 | include/hw/loader.h | 12 +- | ||
84 | include/hw/misc/iotkit-secctl.h | 103 ++++++ | ||
85 | include/hw/misc/mps2-fpgaio.h | 43 +++ | ||
86 | include/hw/misc/tz-ppc.h | 101 ++++++ | ||
87 | include/hw/misc/unimp.h | 10 + | ||
88 | include/hw/or-irq.h | 5 + | ||
89 | include/hw/qdev-core.h | 30 +- | ||
90 | include/hw/timer/xlnx-zynqmp-rtc.h | 86 +++++ | ||
91 | target/arm/cpu.h | 8 + | ||
92 | target/arm/helper.h | 31 ++ | ||
93 | target/arm/idau.h | 61 ++++ | ||
94 | hw/arm/armv7m.c | 35 +- | ||
95 | hw/arm/boot.c | 119 ++++--- | ||
96 | hw/arm/iotkit.c | 598 +++++++++++++++++++++++++++++++ | ||
97 | hw/arm/mps2-tz.c | 503 ++++++++++++++++++++++++++ | ||
98 | hw/arm/xlnx-zynqmp.c | 14 + | ||
99 | hw/core/loader.c | 8 +- | ||
100 | hw/core/qdev.c | 8 +- | ||
101 | hw/core/split-irq.c | 89 +++++ | ||
102 | hw/misc/iotkit-secctl.c | 704 +++++++++++++++++++++++++++++++++++++ | ||
103 | hw/misc/mps2-fpgaio.c | 176 ++++++++++ | ||
104 | hw/misc/tz-ppc.c | 302 ++++++++++++++++ | ||
105 | hw/misc/unimp.c | 10 - | ||
106 | hw/timer/xlnx-zynqmp-rtc.c | 272 ++++++++++++++ | ||
107 | linux-user/elfload.c | 2 + | ||
108 | target/arm/cpu.c | 66 +++- | ||
109 | target/arm/cpu64.c | 2 + | ||
110 | target/arm/helper.c | 28 +- | ||
111 | target/arm/translate-a64.c | 514 +++++++++++++++++++++------ | ||
112 | target/arm/translate.c | 275 +++++++++++++-- | ||
113 | target/arm/vec_helper.c | 429 ++++++++++++++++++++++ | ||
114 | default-configs/arm-softmmu.mak | 5 + | ||
115 | hw/misc/trace-events | 24 ++ | ||
116 | hw/timer/trace-events | 3 + | ||
117 | scripts/decodetree.py | 5 +- | ||
118 | 45 files changed, 4668 insertions(+), 200 deletions(-) | ||
119 | create mode 100644 include/hw/arm/iotkit.h | ||
120 | create mode 100644 include/hw/core/split-irq.h | ||
121 | create mode 100644 include/hw/misc/iotkit-secctl.h | ||
122 | create mode 100644 include/hw/misc/mps2-fpgaio.h | ||
123 | create mode 100644 include/hw/misc/tz-ppc.h | ||
124 | create mode 100644 include/hw/timer/xlnx-zynqmp-rtc.h | ||
125 | create mode 100644 target/arm/idau.h | ||
126 | create mode 100644 hw/arm/iotkit.c | ||
127 | create mode 100644 hw/arm/mps2-tz.c | ||
128 | create mode 100644 hw/core/split-irq.c | ||
129 | create mode 100644 hw/misc/iotkit-secctl.c | ||
130 | create mode 100644 hw/misc/mps2-fpgaio.c | ||
131 | create mode 100644 hw/misc/tz-ppc.c | ||
132 | create mode 100644 hw/timer/xlnx-zynqmp-rtc.c | ||
133 | create mode 100644 target/arm/vec_helper.c | ||
74 | 134 | ||
75 | Linus Walleij (3): | ||
76 | hw/i2c-ddc: Do not fail writes | ||
77 | hw/sii9022: Add support for Silicon Image SII9022 | ||
78 | arm/vexpress: Add proper display connector emulation | ||
79 | |||
80 | Peter Maydell (2): | ||
81 | target/arm: Enable ARM_V8_FP16 feature bit for the AArch64 "any" CPU | ||
82 | linux-user: Report AArch64 FP16 support via hwcap bits | ||
83 | |||
84 | hw/display/Makefile.objs | 1 + | ||
85 | include/exec/helper-head.h | 3 + | ||
86 | include/fpu/softfloat.h | 18 +- | ||
87 | include/hw/i2c/i2c.h | 23 +- | ||
88 | include/hw/register.h | 6 +- | ||
89 | target/arm/cpu.h | 34 +- | ||
90 | target/arm/helper-a64.h | 33 + | ||
91 | target/arm/helper.h | 14 +- | ||
92 | hw/arm/vexpress.c | 6 +- | ||
93 | hw/core/register.c | 8 + | ||
94 | hw/display/sii9022.c | 191 ++++++ | ||
95 | hw/i2c/core.c | 18 - | ||
96 | hw/i2c/i2c-ddc.c | 4 +- | ||
97 | hw/ssi/xilinx_spips.c | 43 +- | ||
98 | linux-user/elfload.c | 2 + | ||
99 | target/arm/cpu64.c | 1 + | ||
100 | target/arm/helper-a64.c | 269 +++++++++ | ||
101 | target/arm/helper.c | 481 ++++++++------- | ||
102 | target/arm/translate-a64.c | 1266 +++++++++++++++++++++++++++++++++------ | ||
103 | target/arm/translate.c | 12 +- | ||
104 | MAINTAINERS | 12 +- | ||
105 | default-configs/arm-softmmu.mak | 2 + | ||
106 | hw/display/trace-events | 5 + | ||
107 | 23 files changed, 1981 insertions(+), 471 deletions(-) | ||
108 | create mode 100644 hw/display/sii9022.c | ||
109 | diff view generated by jsdifflib |
1 | From: Alistair Francis <alistair.francis@xilinx.com> | 1 | From: Alistair Francis <alistair.francis@xilinx.com> |
---|---|---|---|
2 | 2 | ||
3 | I am leaving Xilinx, so to avoid having an email address that bounces | 3 | Initial commit of the ZynqMP RTC device. |
4 | update my maintainer address to point to my personal email address. | ||
5 | 4 | ||
6 | Signed-off-by: Alistair Francis <alistair.francis@xilinx.com> | 5 | Signed-off-by: Alistair Francis <alistair.francis@xilinx.com> |
7 | Signed-off-by: Alistair Francis <alistair@alistair23.me> | ||
8 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | 6 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
9 | Message-id: 7bb690382e3370aa1c1e047a84e36603c787ec0e.1519749987.git.alistair.francis@xilinx.com | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 8 | --- |
12 | MAINTAINERS | 12 ++++++------ | 9 | hw/timer/Makefile.objs | 1 + |
13 | 1 file changed, 6 insertions(+), 6 deletions(-) | 10 | include/hw/timer/xlnx-zynqmp-rtc.h | 84 +++++++++++++++ |
14 | 11 | hw/timer/xlnx-zynqmp-rtc.c | 214 +++++++++++++++++++++++++++++++++++++ | |
15 | diff --git a/MAINTAINERS b/MAINTAINERS | 12 | 3 files changed, 299 insertions(+) |
13 | create mode 100644 include/hw/timer/xlnx-zynqmp-rtc.h | ||
14 | create mode 100644 hw/timer/xlnx-zynqmp-rtc.c | ||
15 | |||
16 | diff --git a/hw/timer/Makefile.objs b/hw/timer/Makefile.objs | ||
16 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/MAINTAINERS | 18 | --- a/hw/timer/Makefile.objs |
18 | +++ b/MAINTAINERS | 19 | +++ b/hw/timer/Makefile.objs |
19 | @@ -XXX,XX +XXX,XX @@ F: hw/misc/arm_sysctl.c | 20 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_IMX) += imx_epit.o |
20 | 21 | common-obj-$(CONFIG_IMX) += imx_gpt.o | |
21 | Xilinx Zynq | 22 | common-obj-$(CONFIG_LM32) += lm32_timer.o |
22 | M: Edgar E. Iglesias <edgar.iglesias@gmail.com> | 23 | common-obj-$(CONFIG_MILKYMIST) += milkymist-sysctl.o |
23 | -M: Alistair Francis <alistair.francis@xilinx.com> | 24 | +common-obj-$(CONFIG_XLNX_ZYNQMP) += xlnx-zynqmp-rtc.o |
24 | +M: Alistair Francis <alistair@alistair23.me> | 25 | |
25 | L: qemu-arm@nongnu.org | 26 | obj-$(CONFIG_ALTERA_TIMER) += altera_timer.o |
26 | S: Maintained | 27 | obj-$(CONFIG_EXYNOS4) += exynos4210_mct.o |
27 | F: hw/*/xilinx_* | 28 | diff --git a/include/hw/timer/xlnx-zynqmp-rtc.h b/include/hw/timer/xlnx-zynqmp-rtc.h |
28 | @@ -XXX,XX +XXX,XX @@ F: include/hw/misc/zynq* | 29 | new file mode 100644 |
29 | X: hw/ssi/xilinx_* | 30 | index XXXXXXX..XXXXXXX |
30 | 31 | --- /dev/null | |
31 | Xilinx ZynqMP | 32 | +++ b/include/hw/timer/xlnx-zynqmp-rtc.h |
32 | -M: Alistair Francis <alistair.francis@xilinx.com> | 33 | @@ -XXX,XX +XXX,XX @@ |
33 | +M: Alistair Francis <alistair@alistair23.me> | 34 | +/* |
34 | M: Edgar E. Iglesias <edgar.iglesias@gmail.com> | 35 | + * QEMU model of the Xilinx ZynqMP Real Time Clock (RTC). |
35 | L: qemu-arm@nongnu.org | 36 | + * |
36 | S: Maintained | 37 | + * Copyright (c) 2017 Xilinx Inc. |
37 | @@ -XXX,XX +XXX,XX @@ T: git git://github.com/bonzini/qemu.git scsi-next | 38 | + * |
38 | 39 | + * Written-by: Alistair Francis <alistair.francis@xilinx.com> | |
39 | SSI | 40 | + * |
40 | M: Peter Crosthwaite <crosthwaite.peter@gmail.com> | 41 | + * Permission is hereby granted, free of charge, to any person obtaining a copy |
41 | -M: Alistair Francis <alistair.francis@xilinx.com> | 42 | + * of this software and associated documentation files (the "Software"), to deal |
42 | +M: Alistair Francis <alistair@alistair23.me> | 43 | + * in the Software without restriction, including without limitation the rights |
43 | S: Maintained | 44 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell |
44 | F: hw/ssi/* | 45 | + * copies of the Software, and to permit persons to whom the Software is |
45 | F: hw/block/m25p80.c | 46 | + * furnished to do so, subject to the following conditions: |
46 | @@ -XXX,XX +XXX,XX @@ X: hw/ssi/xilinx_* | 47 | + * |
47 | F: tests/m25p80-test.c | 48 | + * The above copyright notice and this permission notice shall be included in |
48 | 49 | + * all copies or substantial portions of the Software. | |
49 | Xilinx SPI | 50 | + * |
50 | -M: Alistair Francis <alistair.francis@xilinx.com> | 51 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
51 | +M: Alistair Francis <alistair@alistair23.me> | 52 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
52 | M: Peter Crosthwaite <crosthwaite.peter@gmail.com> | 53 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
53 | S: Maintained | 54 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
54 | F: hw/ssi/xilinx_* | 55 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
55 | @@ -XXX,XX +XXX,XX @@ S: Maintained | 56 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN |
56 | F: hw/net/eepro100.c | 57 | + * THE SOFTWARE. |
57 | 58 | + */ | |
58 | Generic Loader | 59 | + |
59 | -M: Alistair Francis <alistair.francis@xilinx.com> | 60 | +#include "hw/register.h" |
60 | +M: Alistair Francis <alistair@alistair23.me> | 61 | + |
61 | S: Maintained | 62 | +#define TYPE_XLNX_ZYNQMP_RTC "xlnx-zynmp.rtc" |
62 | F: hw/core/generic-loader.c | 63 | + |
63 | F: include/hw/core/generic-loader.h | 64 | +#define XLNX_ZYNQMP_RTC(obj) \ |
64 | @@ -XXX,XX +XXX,XX @@ F: tests/qmp-test.c | 65 | + OBJECT_CHECK(XlnxZynqMPRTC, (obj), TYPE_XLNX_ZYNQMP_RTC) |
65 | T: git git://repo.or.cz/qemu/armbru.git qapi-next | 66 | + |
66 | 67 | +REG32(SET_TIME_WRITE, 0x0) | |
67 | Register API | 68 | +REG32(SET_TIME_READ, 0x4) |
68 | -M: Alistair Francis <alistair.francis@xilinx.com> | 69 | +REG32(CALIB_WRITE, 0x8) |
69 | +M: Alistair Francis <alistair@alistair23.me> | 70 | + FIELD(CALIB_WRITE, FRACTION_EN, 20, 1) |
70 | S: Maintained | 71 | + FIELD(CALIB_WRITE, FRACTION_DATA, 16, 4) |
71 | F: hw/core/register.c | 72 | + FIELD(CALIB_WRITE, MAX_TICK, 0, 16) |
72 | F: include/hw/register.h | 73 | +REG32(CALIB_READ, 0xc) |
74 | + FIELD(CALIB_READ, FRACTION_EN, 20, 1) | ||
75 | + FIELD(CALIB_READ, FRACTION_DATA, 16, 4) | ||
76 | + FIELD(CALIB_READ, MAX_TICK, 0, 16) | ||
77 | +REG32(CURRENT_TIME, 0x10) | ||
78 | +REG32(CURRENT_TICK, 0x14) | ||
79 | + FIELD(CURRENT_TICK, VALUE, 0, 16) | ||
80 | +REG32(ALARM, 0x18) | ||
81 | +REG32(RTC_INT_STATUS, 0x20) | ||
82 | + FIELD(RTC_INT_STATUS, ALARM, 1, 1) | ||
83 | + FIELD(RTC_INT_STATUS, SECONDS, 0, 1) | ||
84 | +REG32(RTC_INT_MASK, 0x24) | ||
85 | + FIELD(RTC_INT_MASK, ALARM, 1, 1) | ||
86 | + FIELD(RTC_INT_MASK, SECONDS, 0, 1) | ||
87 | +REG32(RTC_INT_EN, 0x28) | ||
88 | + FIELD(RTC_INT_EN, ALARM, 1, 1) | ||
89 | + FIELD(RTC_INT_EN, SECONDS, 0, 1) | ||
90 | +REG32(RTC_INT_DIS, 0x2c) | ||
91 | + FIELD(RTC_INT_DIS, ALARM, 1, 1) | ||
92 | + FIELD(RTC_INT_DIS, SECONDS, 0, 1) | ||
93 | +REG32(ADDR_ERROR, 0x30) | ||
94 | + FIELD(ADDR_ERROR, STATUS, 0, 1) | ||
95 | +REG32(ADDR_ERROR_INT_MASK, 0x34) | ||
96 | + FIELD(ADDR_ERROR_INT_MASK, MASK, 0, 1) | ||
97 | +REG32(ADDR_ERROR_INT_EN, 0x38) | ||
98 | + FIELD(ADDR_ERROR_INT_EN, MASK, 0, 1) | ||
99 | +REG32(ADDR_ERROR_INT_DIS, 0x3c) | ||
100 | + FIELD(ADDR_ERROR_INT_DIS, MASK, 0, 1) | ||
101 | +REG32(CONTROL, 0x40) | ||
102 | + FIELD(CONTROL, BATTERY_DISABLE, 31, 1) | ||
103 | + FIELD(CONTROL, OSC_CNTRL, 24, 4) | ||
104 | + FIELD(CONTROL, SLVERR_ENABLE, 0, 1) | ||
105 | +REG32(SAFETY_CHK, 0x50) | ||
106 | + | ||
107 | +#define XLNX_ZYNQMP_RTC_R_MAX (R_SAFETY_CHK + 1) | ||
108 | + | ||
109 | +typedef struct XlnxZynqMPRTC { | ||
110 | + SysBusDevice parent_obj; | ||
111 | + MemoryRegion iomem; | ||
112 | + qemu_irq irq_rtc_int; | ||
113 | + qemu_irq irq_addr_error_int; | ||
114 | + | ||
115 | + uint32_t regs[XLNX_ZYNQMP_RTC_R_MAX]; | ||
116 | + RegisterInfo regs_info[XLNX_ZYNQMP_RTC_R_MAX]; | ||
117 | +} XlnxZynqMPRTC; | ||
118 | diff --git a/hw/timer/xlnx-zynqmp-rtc.c b/hw/timer/xlnx-zynqmp-rtc.c | ||
119 | new file mode 100644 | ||
120 | index XXXXXXX..XXXXXXX | ||
121 | --- /dev/null | ||
122 | +++ b/hw/timer/xlnx-zynqmp-rtc.c | ||
123 | @@ -XXX,XX +XXX,XX @@ | ||
124 | +/* | ||
125 | + * QEMU model of the Xilinx ZynqMP Real Time Clock (RTC). | ||
126 | + * | ||
127 | + * Copyright (c) 2017 Xilinx Inc. | ||
128 | + * | ||
129 | + * Written-by: Alistair Francis <alistair.francis@xilinx.com> | ||
130 | + * | ||
131 | + * Permission is hereby granted, free of charge, to any person obtaining a copy | ||
132 | + * of this software and associated documentation files (the "Software"), to deal | ||
133 | + * in the Software without restriction, including without limitation the rights | ||
134 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
135 | + * copies of the Software, and to permit persons to whom the Software is | ||
136 | + * furnished to do so, subject to the following conditions: | ||
137 | + * | ||
138 | + * The above copyright notice and this permission notice shall be included in | ||
139 | + * all copies or substantial portions of the Software. | ||
140 | + * | ||
141 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
142 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
143 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | ||
144 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
145 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
146 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
147 | + * THE SOFTWARE. | ||
148 | + */ | ||
149 | + | ||
150 | +#include "qemu/osdep.h" | ||
151 | +#include "hw/sysbus.h" | ||
152 | +#include "hw/register.h" | ||
153 | +#include "qemu/bitops.h" | ||
154 | +#include "qemu/log.h" | ||
155 | +#include "hw/timer/xlnx-zynqmp-rtc.h" | ||
156 | + | ||
157 | +#ifndef XLNX_ZYNQMP_RTC_ERR_DEBUG | ||
158 | +#define XLNX_ZYNQMP_RTC_ERR_DEBUG 0 | ||
159 | +#endif | ||
160 | + | ||
161 | +static void rtc_int_update_irq(XlnxZynqMPRTC *s) | ||
162 | +{ | ||
163 | + bool pending = s->regs[R_RTC_INT_STATUS] & ~s->regs[R_RTC_INT_MASK]; | ||
164 | + qemu_set_irq(s->irq_rtc_int, pending); | ||
165 | +} | ||
166 | + | ||
167 | +static void addr_error_int_update_irq(XlnxZynqMPRTC *s) | ||
168 | +{ | ||
169 | + bool pending = s->regs[R_ADDR_ERROR] & ~s->regs[R_ADDR_ERROR_INT_MASK]; | ||
170 | + qemu_set_irq(s->irq_addr_error_int, pending); | ||
171 | +} | ||
172 | + | ||
173 | +static void rtc_int_status_postw(RegisterInfo *reg, uint64_t val64) | ||
174 | +{ | ||
175 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
176 | + rtc_int_update_irq(s); | ||
177 | +} | ||
178 | + | ||
179 | +static uint64_t rtc_int_en_prew(RegisterInfo *reg, uint64_t val64) | ||
180 | +{ | ||
181 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
182 | + | ||
183 | + s->regs[R_RTC_INT_MASK] &= (uint32_t) ~val64; | ||
184 | + rtc_int_update_irq(s); | ||
185 | + return 0; | ||
186 | +} | ||
187 | + | ||
188 | +static uint64_t rtc_int_dis_prew(RegisterInfo *reg, uint64_t val64) | ||
189 | +{ | ||
190 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
191 | + | ||
192 | + s->regs[R_RTC_INT_MASK] |= (uint32_t) val64; | ||
193 | + rtc_int_update_irq(s); | ||
194 | + return 0; | ||
195 | +} | ||
196 | + | ||
197 | +static void addr_error_postw(RegisterInfo *reg, uint64_t val64) | ||
198 | +{ | ||
199 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
200 | + addr_error_int_update_irq(s); | ||
201 | +} | ||
202 | + | ||
203 | +static uint64_t addr_error_int_en_prew(RegisterInfo *reg, uint64_t val64) | ||
204 | +{ | ||
205 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
206 | + | ||
207 | + s->regs[R_ADDR_ERROR_INT_MASK] &= (uint32_t) ~val64; | ||
208 | + addr_error_int_update_irq(s); | ||
209 | + return 0; | ||
210 | +} | ||
211 | + | ||
212 | +static uint64_t addr_error_int_dis_prew(RegisterInfo *reg, uint64_t val64) | ||
213 | +{ | ||
214 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); | ||
215 | + | ||
216 | + s->regs[R_ADDR_ERROR_INT_MASK] |= (uint32_t) val64; | ||
217 | + addr_error_int_update_irq(s); | ||
218 | + return 0; | ||
219 | +} | ||
220 | + | ||
221 | +static const RegisterAccessInfo rtc_regs_info[] = { | ||
222 | + { .name = "SET_TIME_WRITE", .addr = A_SET_TIME_WRITE, | ||
223 | + },{ .name = "SET_TIME_READ", .addr = A_SET_TIME_READ, | ||
224 | + .ro = 0xffffffff, | ||
225 | + },{ .name = "CALIB_WRITE", .addr = A_CALIB_WRITE, | ||
226 | + },{ .name = "CALIB_READ", .addr = A_CALIB_READ, | ||
227 | + .ro = 0x1fffff, | ||
228 | + },{ .name = "CURRENT_TIME", .addr = A_CURRENT_TIME, | ||
229 | + .ro = 0xffffffff, | ||
230 | + },{ .name = "CURRENT_TICK", .addr = A_CURRENT_TICK, | ||
231 | + .ro = 0xffff, | ||
232 | + },{ .name = "ALARM", .addr = A_ALARM, | ||
233 | + },{ .name = "RTC_INT_STATUS", .addr = A_RTC_INT_STATUS, | ||
234 | + .w1c = 0x3, | ||
235 | + .post_write = rtc_int_status_postw, | ||
236 | + },{ .name = "RTC_INT_MASK", .addr = A_RTC_INT_MASK, | ||
237 | + .reset = 0x3, | ||
238 | + .ro = 0x3, | ||
239 | + },{ .name = "RTC_INT_EN", .addr = A_RTC_INT_EN, | ||
240 | + .pre_write = rtc_int_en_prew, | ||
241 | + },{ .name = "RTC_INT_DIS", .addr = A_RTC_INT_DIS, | ||
242 | + .pre_write = rtc_int_dis_prew, | ||
243 | + },{ .name = "ADDR_ERROR", .addr = A_ADDR_ERROR, | ||
244 | + .w1c = 0x1, | ||
245 | + .post_write = addr_error_postw, | ||
246 | + },{ .name = "ADDR_ERROR_INT_MASK", .addr = A_ADDR_ERROR_INT_MASK, | ||
247 | + .reset = 0x1, | ||
248 | + .ro = 0x1, | ||
249 | + },{ .name = "ADDR_ERROR_INT_EN", .addr = A_ADDR_ERROR_INT_EN, | ||
250 | + .pre_write = addr_error_int_en_prew, | ||
251 | + },{ .name = "ADDR_ERROR_INT_DIS", .addr = A_ADDR_ERROR_INT_DIS, | ||
252 | + .pre_write = addr_error_int_dis_prew, | ||
253 | + },{ .name = "CONTROL", .addr = A_CONTROL, | ||
254 | + .reset = 0x1000000, | ||
255 | + .rsvd = 0x70fffffe, | ||
256 | + },{ .name = "SAFETY_CHK", .addr = A_SAFETY_CHK, | ||
257 | + } | ||
258 | +}; | ||
259 | + | ||
260 | +static void rtc_reset(DeviceState *dev) | ||
261 | +{ | ||
262 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(dev); | ||
263 | + unsigned int i; | ||
264 | + | ||
265 | + for (i = 0; i < ARRAY_SIZE(s->regs_info); ++i) { | ||
266 | + register_reset(&s->regs_info[i]); | ||
267 | + } | ||
268 | + | ||
269 | + rtc_int_update_irq(s); | ||
270 | + addr_error_int_update_irq(s); | ||
271 | +} | ||
272 | + | ||
273 | +static const MemoryRegionOps rtc_ops = { | ||
274 | + .read = register_read_memory, | ||
275 | + .write = register_write_memory, | ||
276 | + .endianness = DEVICE_LITTLE_ENDIAN, | ||
277 | + .valid = { | ||
278 | + .min_access_size = 4, | ||
279 | + .max_access_size = 4, | ||
280 | + }, | ||
281 | +}; | ||
282 | + | ||
283 | +static void rtc_init(Object *obj) | ||
284 | +{ | ||
285 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(obj); | ||
286 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
287 | + RegisterInfoArray *reg_array; | ||
288 | + | ||
289 | + memory_region_init(&s->iomem, obj, TYPE_XLNX_ZYNQMP_RTC, | ||
290 | + XLNX_ZYNQMP_RTC_R_MAX * 4); | ||
291 | + reg_array = | ||
292 | + register_init_block32(DEVICE(obj), rtc_regs_info, | ||
293 | + ARRAY_SIZE(rtc_regs_info), | ||
294 | + s->regs_info, s->regs, | ||
295 | + &rtc_ops, | ||
296 | + XLNX_ZYNQMP_RTC_ERR_DEBUG, | ||
297 | + XLNX_ZYNQMP_RTC_R_MAX * 4); | ||
298 | + memory_region_add_subregion(&s->iomem, | ||
299 | + 0x0, | ||
300 | + ®_array->mem); | ||
301 | + sysbus_init_mmio(sbd, &s->iomem); | ||
302 | + sysbus_init_irq(sbd, &s->irq_rtc_int); | ||
303 | + sysbus_init_irq(sbd, &s->irq_addr_error_int); | ||
304 | +} | ||
305 | + | ||
306 | +static const VMStateDescription vmstate_rtc = { | ||
307 | + .name = TYPE_XLNX_ZYNQMP_RTC, | ||
308 | + .version_id = 1, | ||
309 | + .minimum_version_id = 1, | ||
310 | + .fields = (VMStateField[]) { | ||
311 | + VMSTATE_UINT32_ARRAY(regs, XlnxZynqMPRTC, XLNX_ZYNQMP_RTC_R_MAX), | ||
312 | + VMSTATE_END_OF_LIST(), | ||
313 | + } | ||
314 | +}; | ||
315 | + | ||
316 | +static void rtc_class_init(ObjectClass *klass, void *data) | ||
317 | +{ | ||
318 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
319 | + | ||
320 | + dc->reset = rtc_reset; | ||
321 | + dc->vmsd = &vmstate_rtc; | ||
322 | +} | ||
323 | + | ||
324 | +static const TypeInfo rtc_info = { | ||
325 | + .name = TYPE_XLNX_ZYNQMP_RTC, | ||
326 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
327 | + .instance_size = sizeof(XlnxZynqMPRTC), | ||
328 | + .class_init = rtc_class_init, | ||
329 | + .instance_init = rtc_init, | ||
330 | +}; | ||
331 | + | ||
332 | +static void rtc_register_types(void) | ||
333 | +{ | ||
334 | + type_register_static(&rtc_info); | ||
335 | +} | ||
336 | + | ||
337 | +type_init(rtc_register_types) | ||
73 | -- | 338 | -- |
74 | 2.16.2 | 339 | 2.16.2 |
75 | 340 | ||
76 | 341 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Alistair Francis <alistair.francis@xilinx.com> |
---|---|---|---|
2 | 2 | ||
3 | These use the generic float16_compare functionality which in turn uses | 3 | Allow the guest to determine the time set from the QEMU command line. |
4 | the common float_compare code from the softfloat re-factor. | ||
5 | 4 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | This includes adding a trace event to debug the new time. |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 6 | |
8 | Message-id: 20180227143852.11175-11-alex.bennee@linaro.org | 7 | Signed-off-by: Alistair Francis <alistair.francis@xilinx.com> |
8 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
9 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 11 | --- |
11 | target/arm/helper-a64.h | 5 +++++ | 12 | include/hw/timer/xlnx-zynqmp-rtc.h | 2 ++ |
12 | target/arm/helper-a64.c | 49 ++++++++++++++++++++++++++++++++++++++++++++++ | 13 | hw/timer/xlnx-zynqmp-rtc.c | 58 ++++++++++++++++++++++++++++++++++++++ |
13 | target/arm/translate-a64.c | 15 ++++++++++++++ | 14 | hw/timer/trace-events | 3 ++ |
14 | 3 files changed, 69 insertions(+) | 15 | 3 files changed, 63 insertions(+) |
15 | 16 | ||
16 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 17 | diff --git a/include/hw/timer/xlnx-zynqmp-rtc.h b/include/hw/timer/xlnx-zynqmp-rtc.h |
17 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-a64.h | 19 | --- a/include/hw/timer/xlnx-zynqmp-rtc.h |
19 | +++ b/target/arm/helper-a64.h | 20 | +++ b/include/hw/timer/xlnx-zynqmp-rtc.h |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_addh, f16, f16, f16, ptr) | 21 | @@ -XXX,XX +XXX,XX @@ typedef struct XlnxZynqMPRTC { |
21 | DEF_HELPER_3(advsimd_subh, f16, f16, f16, ptr) | 22 | qemu_irq irq_rtc_int; |
22 | DEF_HELPER_3(advsimd_mulh, f16, f16, f16, ptr) | 23 | qemu_irq irq_addr_error_int; |
23 | DEF_HELPER_3(advsimd_divh, f16, f16, f16, ptr) | 24 | |
24 | +DEF_HELPER_3(advsimd_ceq_f16, i32, f16, f16, ptr) | 25 | + uint32_t tick_offset; |
25 | +DEF_HELPER_3(advsimd_cge_f16, i32, f16, f16, ptr) | 26 | + |
26 | +DEF_HELPER_3(advsimd_cgt_f16, i32, f16, f16, ptr) | 27 | uint32_t regs[XLNX_ZYNQMP_RTC_R_MAX]; |
27 | +DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr) | 28 | RegisterInfo regs_info[XLNX_ZYNQMP_RTC_R_MAX]; |
28 | +DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr) | 29 | } XlnxZynqMPRTC; |
29 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 30 | diff --git a/hw/timer/xlnx-zynqmp-rtc.c b/hw/timer/xlnx-zynqmp-rtc.c |
30 | index XXXXXXX..XXXXXXX 100644 | 31 | index XXXXXXX..XXXXXXX 100644 |
31 | --- a/target/arm/helper-a64.c | 32 | --- a/hw/timer/xlnx-zynqmp-rtc.c |
32 | +++ b/target/arm/helper-a64.c | 33 | +++ b/hw/timer/xlnx-zynqmp-rtc.c |
33 | @@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(min) | 34 | @@ -XXX,XX +XXX,XX @@ |
34 | ADVSIMD_HALFOP(max) | 35 | #include "hw/register.h" |
35 | ADVSIMD_HALFOP(minnum) | 36 | #include "qemu/bitops.h" |
36 | ADVSIMD_HALFOP(maxnum) | 37 | #include "qemu/log.h" |
37 | + | 38 | +#include "hw/ptimer.h" |
38 | +/* | 39 | +#include "qemu/cutils.h" |
39 | + * Floating point comparisons produce an integer result. Softfloat | 40 | +#include "sysemu/sysemu.h" |
40 | + * routines return float_relation types which we convert to the 0/-1 | 41 | +#include "trace.h" |
41 | + * Neon requires. | 42 | #include "hw/timer/xlnx-zynqmp-rtc.h" |
42 | + */ | 43 | |
43 | + | 44 | #ifndef XLNX_ZYNQMP_RTC_ERR_DEBUG |
44 | +#define ADVSIMD_CMPRES(test) (test) ? 0xffff : 0 | 45 | @@ -XXX,XX +XXX,XX @@ static void addr_error_int_update_irq(XlnxZynqMPRTC *s) |
45 | + | 46 | qemu_set_irq(s->irq_addr_error_int, pending); |
46 | +uint32_t HELPER(advsimd_ceq_f16)(float16 a, float16 b, void *fpstp) | 47 | } |
48 | |||
49 | +static uint32_t rtc_get_count(XlnxZynqMPRTC *s) | ||
47 | +{ | 50 | +{ |
48 | + float_status *fpst = fpstp; | 51 | + int64_t now = qemu_clock_get_ns(rtc_clock); |
49 | + int compare = float16_compare_quiet(a, b, fpst); | 52 | + return s->tick_offset + now / NANOSECONDS_PER_SECOND; |
50 | + return ADVSIMD_CMPRES(compare == float_relation_equal); | ||
51 | +} | 53 | +} |
52 | + | 54 | + |
53 | +uint32_t HELPER(advsimd_cge_f16)(float16 a, float16 b, void *fpstp) | 55 | +static uint64_t current_time_postr(RegisterInfo *reg, uint64_t val64) |
54 | +{ | 56 | +{ |
55 | + float_status *fpst = fpstp; | 57 | + XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); |
56 | + int compare = float16_compare(a, b, fpst); | 58 | + |
57 | + return ADVSIMD_CMPRES(compare == float_relation_greater || | 59 | + return rtc_get_count(s); |
58 | + compare == float_relation_equal); | ||
59 | +} | 60 | +} |
60 | + | 61 | + |
61 | +uint32_t HELPER(advsimd_cgt_f16)(float16 a, float16 b, void *fpstp) | 62 | static void rtc_int_status_postw(RegisterInfo *reg, uint64_t val64) |
62 | +{ | 63 | { |
63 | + float_status *fpst = fpstp; | 64 | XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque); |
64 | + int compare = float16_compare(a, b, fpst); | 65 | @@ -XXX,XX +XXX,XX @@ static uint64_t addr_error_int_dis_prew(RegisterInfo *reg, uint64_t val64) |
65 | + return ADVSIMD_CMPRES(compare == float_relation_greater); | 66 | |
67 | static const RegisterAccessInfo rtc_regs_info[] = { | ||
68 | { .name = "SET_TIME_WRITE", .addr = A_SET_TIME_WRITE, | ||
69 | + .unimp = MAKE_64BIT_MASK(0, 32), | ||
70 | },{ .name = "SET_TIME_READ", .addr = A_SET_TIME_READ, | ||
71 | .ro = 0xffffffff, | ||
72 | + .post_read = current_time_postr, | ||
73 | },{ .name = "CALIB_WRITE", .addr = A_CALIB_WRITE, | ||
74 | + .unimp = MAKE_64BIT_MASK(0, 32), | ||
75 | },{ .name = "CALIB_READ", .addr = A_CALIB_READ, | ||
76 | .ro = 0x1fffff, | ||
77 | },{ .name = "CURRENT_TIME", .addr = A_CURRENT_TIME, | ||
78 | .ro = 0xffffffff, | ||
79 | + .post_read = current_time_postr, | ||
80 | },{ .name = "CURRENT_TICK", .addr = A_CURRENT_TICK, | ||
81 | .ro = 0xffff, | ||
82 | },{ .name = "ALARM", .addr = A_ALARM, | ||
83 | @@ -XXX,XX +XXX,XX @@ static void rtc_init(Object *obj) | ||
84 | XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(obj); | ||
85 | SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
86 | RegisterInfoArray *reg_array; | ||
87 | + struct tm current_tm; | ||
88 | |||
89 | memory_region_init(&s->iomem, obj, TYPE_XLNX_ZYNQMP_RTC, | ||
90 | XLNX_ZYNQMP_RTC_R_MAX * 4); | ||
91 | @@ -XXX,XX +XXX,XX @@ static void rtc_init(Object *obj) | ||
92 | sysbus_init_mmio(sbd, &s->iomem); | ||
93 | sysbus_init_irq(sbd, &s->irq_rtc_int); | ||
94 | sysbus_init_irq(sbd, &s->irq_addr_error_int); | ||
95 | + | ||
96 | + qemu_get_timedate(¤t_tm, 0); | ||
97 | + s->tick_offset = mktimegm(¤t_tm) - | ||
98 | + qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND; | ||
99 | + | ||
100 | + trace_xlnx_zynqmp_rtc_gettime(current_tm.tm_year, current_tm.tm_mon, | ||
101 | + current_tm.tm_mday, current_tm.tm_hour, | ||
102 | + current_tm.tm_min, current_tm.tm_sec); | ||
66 | +} | 103 | +} |
67 | + | 104 | + |
68 | +uint32_t HELPER(advsimd_acge_f16)(float16 a, float16 b, void *fpstp) | 105 | +static int rtc_pre_save(void *opaque) |
69 | +{ | 106 | +{ |
70 | + float_status *fpst = fpstp; | 107 | + XlnxZynqMPRTC *s = opaque; |
71 | + float16 f0 = float16_abs(a); | 108 | + int64_t now = qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND; |
72 | + float16 f1 = float16_abs(b); | 109 | + |
73 | + int compare = float16_compare(f0, f1, fpst); | 110 | + /* Add the time at migration */ |
74 | + return ADVSIMD_CMPRES(compare == float_relation_greater || | 111 | + s->tick_offset = s->tick_offset + now; |
75 | + compare == float_relation_equal); | 112 | + |
113 | + return 0; | ||
76 | +} | 114 | +} |
77 | + | 115 | + |
78 | +uint32_t HELPER(advsimd_acgt_f16)(float16 a, float16 b, void *fpstp) | 116 | +static int rtc_post_load(void *opaque, int version_id) |
79 | +{ | 117 | +{ |
80 | + float_status *fpst = fpstp; | 118 | + XlnxZynqMPRTC *s = opaque; |
81 | + float16 f0 = float16_abs(a); | 119 | + int64_t now = qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND; |
82 | + float16 f1 = float16_abs(b); | 120 | + |
83 | + int compare = float16_compare(f0, f1, fpst); | 121 | + /* Subtract the time after migration. This combined with the pre_save |
84 | + return ADVSIMD_CMPRES(compare == float_relation_greater); | 122 | + * action results in us having subtracted the time that the guest was |
85 | +} | 123 | + * stopped to the offset. |
86 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 124 | + */ |
125 | + s->tick_offset = s->tick_offset - now; | ||
126 | + | ||
127 | + return 0; | ||
128 | } | ||
129 | |||
130 | static const VMStateDescription vmstate_rtc = { | ||
131 | .name = TYPE_XLNX_ZYNQMP_RTC, | ||
132 | .version_id = 1, | ||
133 | .minimum_version_id = 1, | ||
134 | + .pre_save = rtc_pre_save, | ||
135 | + .post_load = rtc_post_load, | ||
136 | .fields = (VMStateField[]) { | ||
137 | VMSTATE_UINT32_ARRAY(regs, XlnxZynqMPRTC, XLNX_ZYNQMP_RTC_R_MAX), | ||
138 | + VMSTATE_UINT32(tick_offset, XlnxZynqMPRTC), | ||
139 | VMSTATE_END_OF_LIST(), | ||
140 | } | ||
141 | }; | ||
142 | diff --git a/hw/timer/trace-events b/hw/timer/trace-events | ||
87 | index XXXXXXX..XXXXXXX 100644 | 143 | index XXXXXXX..XXXXXXX 100644 |
88 | --- a/target/arm/translate-a64.c | 144 | --- a/hw/timer/trace-events |
89 | +++ b/target/arm/translate-a64.c | 145 | +++ b/hw/timer/trace-events |
90 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 146 | @@ -XXX,XX +XXX,XX @@ systick_write(uint64_t addr, uint32_t value, unsigned size) "systick write addr |
91 | case 0x2: /* FADD */ | 147 | cmsdk_apb_timer_read(uint64_t offset, uint64_t data, unsigned size) "CMSDK APB timer read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" |
92 | gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | 148 | cmsdk_apb_timer_write(uint64_t offset, uint64_t data, unsigned size) "CMSDK APB timer write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" |
93 | break; | 149 | cmsdk_apb_timer_reset(void) "CMSDK APB timer: reset" |
94 | + case 0x4: /* FCMEQ */ | 150 | + |
95 | + gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 151 | +# hw/timer/xlnx-zynqmp-rtc.c |
96 | + break; | 152 | +xlnx_zynqmp_rtc_gettime(int year, int month, int day, int hour, int min, int sec) "Get time from host: %d-%d-%d %2d:%02d:%02d" |
97 | case 0x6: /* FMAX */ | ||
98 | gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
99 | break; | ||
100 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
101 | case 0x13: /* FMUL */ | ||
102 | gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
103 | break; | ||
104 | + case 0x14: /* FCMGE */ | ||
105 | + gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
106 | + break; | ||
107 | + case 0x15: /* FACGE */ | ||
108 | + gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
109 | + break; | ||
110 | case 0x17: /* FDIV */ | ||
111 | gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
112 | break; | ||
113 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
114 | gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
115 | tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff); | ||
116 | break; | ||
117 | + case 0x1c: /* FCMGT */ | ||
118 | + gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
119 | + break; | ||
120 | + case 0x1d: /* FACGT */ | ||
121 | + gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
122 | + break; | ||
123 | default: | ||
124 | fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n", | ||
125 | __func__, insn, fpopcode, s->pc); | ||
126 | -- | 153 | -- |
127 | 2.16.2 | 154 | 2.16.2 |
128 | 155 | ||
129 | 156 | diff view generated by jsdifflib |
1 | From: Alistair Francis <alistair.francis@xilinx.com> | 1 | From: Alistair Francis <alistair.francis@xilinx.com> |
---|---|---|---|
2 | 2 | ||
3 | Ensure that the post write hook is called during reset. This allows us | ||
4 | to rely on the post write functions instead of having to call them from | ||
5 | the reset() function. | ||
6 | |||
7 | Signed-off-by: Alistair Francis <alistair.francis@xilinx.com> | 3 | Signed-off-by: Alistair Francis <alistair.francis@xilinx.com> |
4 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
8 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | 5 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
9 | Message-id: d131e24b911653a945e46ca2d8f90f572469e1dd.1517856214.git.alistair.francis@xilinx.com | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 7 | --- |
12 | include/hw/register.h | 6 +++--- | 8 | include/hw/arm/xlnx-zynqmp.h | 2 ++ |
13 | hw/core/register.c | 8 ++++++++ | 9 | hw/arm/xlnx-zynqmp.c | 14 ++++++++++++++ |
14 | 2 files changed, 11 insertions(+), 3 deletions(-) | 10 | 2 files changed, 16 insertions(+) |
15 | 11 | ||
16 | diff --git a/include/hw/register.h b/include/hw/register.h | 12 | diff --git a/include/hw/arm/xlnx-zynqmp.h b/include/hw/arm/xlnx-zynqmp.h |
17 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/include/hw/register.h | 14 | --- a/include/hw/arm/xlnx-zynqmp.h |
19 | +++ b/include/hw/register.h | 15 | +++ b/include/hw/arm/xlnx-zynqmp.h |
20 | @@ -XXX,XX +XXX,XX @@ typedef struct RegisterInfoArray RegisterInfoArray; | 16 | @@ -XXX,XX +XXX,XX @@ |
21 | * immediately before the actual write. The returned value is what is written, | 17 | #include "hw/dma/xlnx_dpdma.h" |
22 | * giving the handler a chance to modify the written value. | 18 | #include "hw/display/xlnx_dp.h" |
23 | * @post_write: Post write callback. Passed the written value. Most write side | 19 | #include "hw/intc/xlnx-zynqmp-ipi.h" |
24 | - * effects should be implemented here. | 20 | +#include "hw/timer/xlnx-zynqmp-rtc.h" |
25 | + * effects should be implemented here. This is called during device reset. | 21 | |
26 | * | 22 | #define TYPE_XLNX_ZYNQMP "xlnx,zynqmp" |
27 | * @post_read: Post read callback. Passes the value that is about to be returned | 23 | #define XLNX_ZYNQMP(obj) OBJECT_CHECK(XlnxZynqMPState, (obj), \ |
28 | * for a read. The return value from this function is what is ultimately read, | 24 | @@ -XXX,XX +XXX,XX @@ typedef struct XlnxZynqMPState { |
29 | @@ -XXX,XX +XXX,XX @@ uint64_t register_read(RegisterInfo *reg, uint64_t re, const char* prefix, | 25 | XlnxDPState dp; |
30 | bool debug); | 26 | XlnxDPDMAState dpdma; |
31 | 27 | XlnxZynqMPIPI ipi; | |
32 | /** | 28 | + XlnxZynqMPRTC rtc; |
33 | - * reset a register | 29 | |
34 | - * @reg: register to reset | 30 | char *boot_cpu; |
35 | + * Resets a register. This will also call the post_write hook if it exists. | 31 | ARMCPU *boot_cpu_ptr; |
36 | + * @reg: The register to reset. | 32 | diff --git a/hw/arm/xlnx-zynqmp.c b/hw/arm/xlnx-zynqmp.c |
37 | */ | ||
38 | |||
39 | void register_reset(RegisterInfo *reg); | ||
40 | diff --git a/hw/core/register.c b/hw/core/register.c | ||
41 | index XXXXXXX..XXXXXXX 100644 | 33 | index XXXXXXX..XXXXXXX 100644 |
42 | --- a/hw/core/register.c | 34 | --- a/hw/arm/xlnx-zynqmp.c |
43 | +++ b/hw/core/register.c | 35 | +++ b/hw/arm/xlnx-zynqmp.c |
44 | @@ -XXX,XX +XXX,XX @@ uint64_t register_read(RegisterInfo *reg, uint64_t re, const char* prefix, | 36 | @@ -XXX,XX +XXX,XX @@ |
45 | 37 | #define IPI_ADDR 0xFF300000 | |
46 | void register_reset(RegisterInfo *reg) | 38 | #define IPI_IRQ 64 |
47 | { | 39 | |
48 | + const RegisterAccessInfo *ac; | 40 | +#define RTC_ADDR 0xffa60000 |
41 | +#define RTC_IRQ 26 | ||
49 | + | 42 | + |
50 | g_assert(reg); | 43 | #define SDHCI_CAPABILITIES 0x280737ec6481 /* Datasheet: UG1085 (v1.7) */ |
51 | 44 | ||
52 | if (!reg->data || !reg->access) { | 45 | static const uint64_t gem_addr[XLNX_ZYNQMP_NUM_GEMS] = { |
53 | return; | 46 | @@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_init(Object *obj) |
47 | |||
48 | object_initialize(&s->ipi, sizeof(s->ipi), TYPE_XLNX_ZYNQMP_IPI); | ||
49 | qdev_set_parent_bus(DEVICE(&s->ipi), sysbus_get_default()); | ||
50 | + | ||
51 | + object_initialize(&s->rtc, sizeof(s->rtc), TYPE_XLNX_ZYNQMP_RTC); | ||
52 | + qdev_set_parent_bus(DEVICE(&s->rtc), sysbus_get_default()); | ||
53 | } | ||
54 | |||
55 | static void xlnx_zynqmp_realize(DeviceState *dev, Error **errp) | ||
56 | @@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_realize(DeviceState *dev, Error **errp) | ||
54 | } | 57 | } |
55 | 58 | sysbus_mmio_map(SYS_BUS_DEVICE(&s->ipi), 0, IPI_ADDR); | |
56 | + ac = reg->access; | 59 | sysbus_connect_irq(SYS_BUS_DEVICE(&s->ipi), 0, gic_spi[IPI_IRQ]); |
57 | + | 60 | + |
58 | register_write_val(reg, reg->access->reset); | 61 | + object_property_set_bool(OBJECT(&s->rtc), true, "realized", &err); |
59 | + | 62 | + if (err) { |
60 | + if (ac->post_write) { | 63 | + error_propagate(errp, err); |
61 | + ac->post_write(reg, reg->access->reset); | 64 | + return; |
62 | + } | 65 | + } |
66 | + sysbus_mmio_map(SYS_BUS_DEVICE(&s->rtc), 0, RTC_ADDR); | ||
67 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->rtc), 0, gic_spi[RTC_IRQ]); | ||
63 | } | 68 | } |
64 | 69 | ||
65 | void register_init(RegisterInfo *reg) | 70 | static Property xlnx_zynqmp_props[] = { |
66 | -- | 71 | -- |
67 | 2.16.2 | 72 | 2.16.2 |
68 | 73 | ||
69 | 74 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Francisco Iglesias <frasse.iglesias@gmail.com> | ||
2 | 1 | ||
3 | Assert only the lower cs on bus 0 and upper cs on bus 1 when both buses and | ||
4 | chip selects are enabled (e.g reading/writing with stripe). | ||
5 | |||
6 | Signed-off-by: Francisco Iglesias <frasse.iglesias@gmail.com> | ||
7 | Reviewed-by: Alistair Francis <alistair.francis@xilinx.com> | ||
8 | Tested-by: Alistair Francis <alistair.francis@xilinx.com> | ||
9 | Message-id: 20180223232233.31482-2-frasse.iglesias@gmail.com | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | --- | ||
12 | hw/ssi/xilinx_spips.c | 41 +++++++++++++++++++++++++++++++++++++---- | ||
13 | 1 file changed, 37 insertions(+), 4 deletions(-) | ||
14 | |||
15 | diff --git a/hw/ssi/xilinx_spips.c b/hw/ssi/xilinx_spips.c | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/hw/ssi/xilinx_spips.c | ||
18 | +++ b/hw/ssi/xilinx_spips.c | ||
19 | @@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs(XilinxSPIPS *s, int field) | ||
20 | { | ||
21 | int i; | ||
22 | |||
23 | - for (i = 0; i < s->num_cs; i++) { | ||
24 | + for (i = 0; i < s->num_cs * s->num_busses; i++) { | ||
25 | bool old_state = s->cs_lines_state[i]; | ||
26 | bool new_state = field & (1 << i); | ||
27 | |||
28 | @@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs(XilinxSPIPS *s, int field) | ||
29 | } | ||
30 | qemu_set_irq(s->cs_lines[i], !new_state); | ||
31 | } | ||
32 | - if (!(field & ((1 << s->num_cs) - 1))) { | ||
33 | + if (!(field & ((1 << (s->num_cs * s->num_busses)) - 1))) { | ||
34 | s->snoop_state = SNOOP_CHECKING; | ||
35 | s->cmd_dummies = 0; | ||
36 | s->link_state = 1; | ||
37 | @@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_qspips_update_cs_lines(XlnxZynqMPQSPIPS *s) | ||
38 | { | ||
39 | if (s->regs[R_GQSPI_GF_SNAPSHOT]) { | ||
40 | int field = ARRAY_FIELD_EX32(s->regs, GQSPI_GF_SNAPSHOT, CHIP_SELECT); | ||
41 | - xilinx_spips_update_cs(XILINX_SPIPS(s), field); | ||
42 | + bool upper_cs_sel = field & (1 << 1); | ||
43 | + bool lower_cs_sel = field & 1; | ||
44 | + bool bus0_enabled; | ||
45 | + bool bus1_enabled; | ||
46 | + uint8_t buses; | ||
47 | + int cs = 0; | ||
48 | + | ||
49 | + buses = ARRAY_FIELD_EX32(s->regs, GQSPI_GF_SNAPSHOT, DATA_BUS_SELECT); | ||
50 | + bus0_enabled = buses & 1; | ||
51 | + bus1_enabled = buses & (1 << 1); | ||
52 | + | ||
53 | + if (bus0_enabled && bus1_enabled) { | ||
54 | + if (lower_cs_sel) { | ||
55 | + cs |= 1; | ||
56 | + } | ||
57 | + if (upper_cs_sel) { | ||
58 | + cs |= 1 << 3; | ||
59 | + } | ||
60 | + } else if (bus0_enabled) { | ||
61 | + if (lower_cs_sel) { | ||
62 | + cs |= 1; | ||
63 | + } | ||
64 | + if (upper_cs_sel) { | ||
65 | + cs |= 1 << 1; | ||
66 | + } | ||
67 | + } else if (bus1_enabled) { | ||
68 | + if (lower_cs_sel) { | ||
69 | + cs |= 1 << 2; | ||
70 | + } | ||
71 | + if (upper_cs_sel) { | ||
72 | + cs |= 1 << 3; | ||
73 | + } | ||
74 | + } | ||
75 | + xilinx_spips_update_cs(XILINX_SPIPS(s), cs); | ||
76 | } | ||
77 | } | ||
78 | |||
79 | @@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs_lines(XilinxSPIPS *s) | ||
80 | if (num_effective_busses(s) == 2) { | ||
81 | /* Single bit chip-select for qspi */ | ||
82 | field &= 0x1; | ||
83 | - field |= field << 1; | ||
84 | + field |= field << 3; | ||
85 | /* Dual stack U-Page */ | ||
86 | } else if (s->regs[R_LQSPI_CFG] & LQSPI_CFG_TWO_MEM && | ||
87 | s->regs[R_LQSPI_STS] & LQSPI_CFG_U_PAGE) { | ||
88 | -- | ||
89 | 2.16.2 | ||
90 | |||
91 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Francisco Iglesias <frasse.iglesias@gmail.com> | ||
2 | 1 | ||
3 | Use 8 dummy cycles (4 dummy bytes) with the QIOR/QIOR4 commands in legacy mode | ||
4 | for matching what is expected by Micron (Numonyx) flashes (the default target | ||
5 | flash type of the QSPI). | ||
6 | |||
7 | Signed-off-by: Francisco Iglesias <frasse.iglesias@gmail.com> | ||
8 | Tested-by: Alistair Francis <alistair.francis@xilinx.com> | ||
9 | Reviewed-by: Alistair Francis <alistair.francis@xilinx.com> | ||
10 | Message-id: 20180223232233.31482-3-frasse.iglesias@gmail.com | ||
11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
12 | --- | ||
13 | hw/ssi/xilinx_spips.c | 2 +- | ||
14 | 1 file changed, 1 insertion(+), 1 deletion(-) | ||
15 | |||
16 | diff --git a/hw/ssi/xilinx_spips.c b/hw/ssi/xilinx_spips.c | ||
17 | index XXXXXXX..XXXXXXX 100644 | ||
18 | --- a/hw/ssi/xilinx_spips.c | ||
19 | +++ b/hw/ssi/xilinx_spips.c | ||
20 | @@ -XXX,XX +XXX,XX @@ static int xilinx_spips_num_dummies(XilinxQSPIPS *qs, uint8_t command) | ||
21 | return 2; | ||
22 | case QIOR: | ||
23 | case QIOR_4: | ||
24 | - return 5; | ||
25 | + return 4; | ||
26 | default: | ||
27 | return -1; | ||
28 | } | ||
29 | -- | ||
30 | 2.16.2 | ||
31 | |||
32 | diff view generated by jsdifflib |
Deleted patch | |||
---|---|---|---|
1 | From: Corey Minyard <cminyard@mvista.com> | ||
2 | 1 | ||
3 | Signed-off-by: Corey Minyard <cminyard@mvista.com> | ||
4 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
5 | Signed-off-by: Linus Walleij <linus.walleij@linaro.org> | ||
6 | Message-id: 20180227104903.21353-2-linus.walleij@linaro.org | ||
7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
8 | --- | ||
9 | include/hw/i2c/i2c.h | 6 ++---- | ||
10 | hw/i2c/core.c | 3 +-- | ||
11 | 2 files changed, 3 insertions(+), 6 deletions(-) | ||
12 | |||
13 | diff --git a/include/hw/i2c/i2c.h b/include/hw/i2c/i2c.h | ||
14 | index XXXXXXX..XXXXXXX 100644 | ||
15 | --- a/include/hw/i2c/i2c.h | ||
16 | +++ b/include/hw/i2c/i2c.h | ||
17 | @@ -XXX,XX +XXX,XX @@ typedef struct I2CSlave I2CSlave; | ||
18 | #define I2C_SLAVE_GET_CLASS(obj) \ | ||
19 | OBJECT_GET_CLASS(I2CSlaveClass, (obj), TYPE_I2C_SLAVE) | ||
20 | |||
21 | -typedef struct I2CSlaveClass | ||
22 | -{ | ||
23 | +typedef struct I2CSlaveClass { | ||
24 | DeviceClass parent_class; | ||
25 | |||
26 | /* Callbacks provided by the device. */ | ||
27 | @@ -XXX,XX +XXX,XX @@ typedef struct I2CSlaveClass | ||
28 | int (*event)(I2CSlave *s, enum i2c_event event); | ||
29 | } I2CSlaveClass; | ||
30 | |||
31 | -struct I2CSlave | ||
32 | -{ | ||
33 | +struct I2CSlave { | ||
34 | DeviceState qdev; | ||
35 | |||
36 | /* Remaining fields for internal use by the I2C code. */ | ||
37 | diff --git a/hw/i2c/core.c b/hw/i2c/core.c | ||
38 | index XXXXXXX..XXXXXXX 100644 | ||
39 | --- a/hw/i2c/core.c | ||
40 | +++ b/hw/i2c/core.c | ||
41 | @@ -XXX,XX +XXX,XX @@ struct I2CNode { | ||
42 | |||
43 | #define I2C_BROADCAST 0x00 | ||
44 | |||
45 | -struct I2CBus | ||
46 | -{ | ||
47 | +struct I2CBus { | ||
48 | BusState qbus; | ||
49 | QLIST_HEAD(, I2CNode) current_devs; | ||
50 | uint8_t saved_address; | ||
51 | -- | ||
52 | 2.16.2 | ||
53 | |||
54 | diff view generated by jsdifflib |
1 | From: Linus Walleij <linus.walleij@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | The tx function of the DDC I2C slave emulation was returning 1 | 3 | Allow the translate subroutines to return false for invalid insns. |
4 | on all writes resulting in NACK in the I2C bus. Changing it to | ||
5 | 0 makes the DDC I2C work fine with bit-banged I2C such as the | ||
6 | versatile I2C. | ||
7 | 4 | ||
8 | I guess it was not affecting whatever I2C controller this was | 5 | At present we can of course invoke an invalid insn exception from within |
9 | used with until now, but with the Versatile I2C it surely | 6 | the translate subroutine, but in the short term this consolidates code. |
10 | does not work. | 7 | In the long term it would allow the decodetree language to support |
8 | overlapping patterns for ISA extensions. | ||
11 | 9 | ||
10 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20180227232618.2908-1-richard.henderson@linaro.org | ||
12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
13 | Signed-off-by: Linus Walleij <linus.walleij@linaro.org> | ||
14 | Message-id: 20180227104903.21353-4-linus.walleij@linaro.org | ||
15 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
16 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
17 | --- | 14 | --- |
18 | hw/i2c/i2c-ddc.c | 4 ++-- | 15 | scripts/decodetree.py | 5 ++--- |
19 | 1 file changed, 2 insertions(+), 2 deletions(-) | 16 | 1 file changed, 2 insertions(+), 3 deletions(-) |
20 | 17 | ||
21 | diff --git a/hw/i2c/i2c-ddc.c b/hw/i2c/i2c-ddc.c | 18 | diff --git a/scripts/decodetree.py b/scripts/decodetree.py |
22 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100755 |
23 | --- a/hw/i2c/i2c-ddc.c | 20 | --- a/scripts/decodetree.py |
24 | +++ b/hw/i2c/i2c-ddc.c | 21 | +++ b/scripts/decodetree.py |
25 | @@ -XXX,XX +XXX,XX @@ static int i2c_ddc_tx(I2CSlave *i2c, uint8_t data) | 22 | @@ -XXX,XX +XXX,XX @@ class Pattern(General): |
26 | s->reg = data; | 23 | global translate_prefix |
27 | s->firstbyte = false; | 24 | output('typedef ', self.base.base.struct_name(), |
28 | DPRINTF("[EDID] Written new pointer: %u\n", data); | 25 | ' arg_', self.name, ';\n') |
29 | - return 1; | 26 | - output(translate_scope, 'void ', translate_prefix, '_', self.name, |
30 | + return 0; | 27 | + output(translate_scope, 'bool ', translate_prefix, '_', self.name, |
31 | } | 28 | '(DisasContext *ctx, arg_', self.name, |
32 | 29 | ' *a, ', insntype, ' insn);\n') | |
33 | /* Ignore all writes */ | 30 | |
34 | s->reg++; | 31 | @@ -XXX,XX +XXX,XX @@ class Pattern(General): |
35 | - return 1; | 32 | output(ind, self.base.extract_name(), '(&u.f_', arg, ', insn);\n') |
36 | + return 0; | 33 | for n, f in self.fields.items(): |
37 | } | 34 | output(ind, 'u.f_', arg, '.', n, ' = ', f.str_extract(), ';\n') |
38 | 35 | - output(ind, translate_prefix, '_', self.name, | |
39 | static void i2c_ddc_init(Object *obj) | 36 | + output(ind, 'return ', translate_prefix, '_', self.name, |
37 | '(ctx, &u.f_', arg, ', insn);\n') | ||
38 | - output(ind, 'return true;\n') | ||
39 | # end Pattern | ||
40 | |||
41 | |||
40 | -- | 42 | -- |
41 | 2.16.2 | 43 | 2.16.2 |
42 | 44 | ||
43 | 45 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Add a function load_ramdisk_as() which behaves like the existing |
---|---|---|---|
2 | load_ramdisk() but allows the caller to specify the AddressSpace | ||
3 | to use. This matches the pattern we have already for various | ||
4 | other loader functions. | ||
2 | 5 | ||
3 | A bunch of the vectorised bitwise operations just operate on larger | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | chunks at a time. We can do the same for the new half-precision | 7 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
5 | operations by introducing some TWOHALFOP helpers which work on each | 8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
6 | half of a pair of half-precision operations at once. | 9 | Message-id: 20180220180325.29818-2-peter.maydell@linaro.org |
10 | --- | ||
11 | include/hw/loader.h | 12 +++++++++++- | ||
12 | hw/core/loader.c | 8 +++++++- | ||
13 | 2 files changed, 18 insertions(+), 2 deletions(-) | ||
7 | 14 | ||
8 | Hopefully all this hoop jumping will get simpler once we have | 15 | diff --git a/include/hw/loader.h b/include/hw/loader.h |
9 | generically vectorised helpers here. | ||
10 | |||
11 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | ||
12 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
13 | Message-id: 20180227143852.11175-16-alex.bennee@linaro.org | ||
14 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
15 | --- | ||
16 | target/arm/helper-a64.h | 10 ++++++++++ | ||
17 | target/arm/helper-a64.c | 46 +++++++++++++++++++++++++++++++++++++++++++++- | ||
18 | target/arm/translate-a64.c | 26 +++++++++++++++++++++----- | ||
19 | 3 files changed, 76 insertions(+), 6 deletions(-) | ||
20 | |||
21 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | ||
22 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
23 | --- a/target/arm/helper-a64.h | 17 | --- a/include/hw/loader.h |
24 | +++ b/target/arm/helper-a64.h | 18 | +++ b/include/hw/loader.h |
25 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr) | 19 | @@ -XXX,XX +XXX,XX @@ int load_uimage(const char *filename, hwaddr *ep, |
26 | DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr) | 20 | void *translate_opaque); |
27 | DEF_HELPER_3(advsimd_mulxh, f16, f16, f16, ptr) | 21 | |
28 | DEF_HELPER_4(advsimd_muladdh, f16, f16, f16, f16, ptr) | 22 | /** |
29 | +DEF_HELPER_3(advsimd_add2h, i32, i32, i32, ptr) | 23 | - * load_ramdisk: |
30 | +DEF_HELPER_3(advsimd_sub2h, i32, i32, i32, ptr) | 24 | + * load_ramdisk_as: |
31 | +DEF_HELPER_3(advsimd_mul2h, i32, i32, i32, ptr) | 25 | * @filename: Path to the ramdisk image |
32 | +DEF_HELPER_3(advsimd_div2h, i32, i32, i32, ptr) | 26 | * @addr: Memory address to load the ramdisk to |
33 | +DEF_HELPER_3(advsimd_max2h, i32, i32, i32, ptr) | 27 | * @max_sz: Maximum allowed ramdisk size (for non-u-boot ramdisks) |
34 | +DEF_HELPER_3(advsimd_min2h, i32, i32, i32, ptr) | 28 | + * @as: The AddressSpace to load the ELF to. The value of address_space_memory |
35 | +DEF_HELPER_3(advsimd_maxnum2h, i32, i32, i32, ptr) | 29 | + * is used if nothing is supplied here. |
36 | +DEF_HELPER_3(advsimd_minnum2h, i32, i32, i32, ptr) | 30 | * |
37 | +DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr) | 31 | * Load a ramdisk image with U-Boot header to the specified memory |
38 | +DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr) | 32 | * address. |
39 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 33 | * |
34 | * Returns the size of the loaded image on success, -1 otherwise. | ||
35 | */ | ||
36 | +int load_ramdisk_as(const char *filename, hwaddr addr, uint64_t max_sz, | ||
37 | + AddressSpace *as); | ||
38 | + | ||
39 | +/** | ||
40 | + * load_ramdisk: | ||
41 | + * Same as load_ramdisk_as(), but doesn't allow the caller to specify | ||
42 | + * an AddressSpace. | ||
43 | + */ | ||
44 | int load_ramdisk(const char *filename, hwaddr addr, uint64_t max_sz); | ||
45 | |||
46 | ssize_t gunzip(void *dst, size_t dstlen, uint8_t *src, size_t srclen); | ||
47 | diff --git a/hw/core/loader.c b/hw/core/loader.c | ||
40 | index XXXXXXX..XXXXXXX 100644 | 48 | index XXXXXXX..XXXXXXX 100644 |
41 | --- a/target/arm/helper-a64.c | 49 | --- a/hw/core/loader.c |
42 | +++ b/target/arm/helper-a64.c | 50 | +++ b/hw/core/loader.c |
43 | @@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(max) | 51 | @@ -XXX,XX +XXX,XX @@ int load_uimage_as(const char *filename, hwaddr *ep, hwaddr *loadaddr, |
44 | ADVSIMD_HALFOP(minnum) | 52 | |
45 | ADVSIMD_HALFOP(maxnum) | 53 | /* Load a ramdisk. */ |
46 | 54 | int load_ramdisk(const char *filename, hwaddr addr, uint64_t max_sz) | |
47 | +#define ADVSIMD_TWOHALFOP(name) \ | 55 | +{ |
48 | +uint32_t ADVSIMD_HELPER(name, 2h)(uint32_t two_a, uint32_t two_b, void *fpstp) \ | 56 | + return load_ramdisk_as(filename, addr, max_sz, NULL); |
49 | +{ \ | ||
50 | + float16 a1, a2, b1, b2; \ | ||
51 | + uint32_t r1, r2; \ | ||
52 | + float_status *fpst = fpstp; \ | ||
53 | + a1 = extract32(two_a, 0, 16); \ | ||
54 | + a2 = extract32(two_a, 16, 16); \ | ||
55 | + b1 = extract32(two_b, 0, 16); \ | ||
56 | + b2 = extract32(two_b, 16, 16); \ | ||
57 | + r1 = float16_ ## name(a1, b1, fpst); \ | ||
58 | + r2 = float16_ ## name(a2, b2, fpst); \ | ||
59 | + return deposit32(r1, 16, 16, r2); \ | ||
60 | +} | 57 | +} |
61 | + | 58 | + |
62 | +ADVSIMD_TWOHALFOP(add) | 59 | +int load_ramdisk_as(const char *filename, hwaddr addr, uint64_t max_sz, |
63 | +ADVSIMD_TWOHALFOP(sub) | 60 | + AddressSpace *as) |
64 | +ADVSIMD_TWOHALFOP(mul) | ||
65 | +ADVSIMD_TWOHALFOP(div) | ||
66 | +ADVSIMD_TWOHALFOP(min) | ||
67 | +ADVSIMD_TWOHALFOP(max) | ||
68 | +ADVSIMD_TWOHALFOP(minnum) | ||
69 | +ADVSIMD_TWOHALFOP(maxnum) | ||
70 | + | ||
71 | /* Data processing - scalar floating-point and advanced SIMD */ | ||
72 | -float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp) | ||
73 | +static float16 float16_mulx(float16 a, float16 b, void *fpstp) | ||
74 | { | 61 | { |
75 | float_status *fpst = fpstp; | 62 | return load_uboot_image(filename, NULL, &addr, NULL, IH_TYPE_RAMDISK, |
76 | 63 | - NULL, NULL, NULL); | |
77 | @@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp) | 64 | + NULL, NULL, as); |
78 | return float16_mul(a, b, fpst); | ||
79 | } | 65 | } |
80 | 66 | ||
81 | +ADVSIMD_HALFOP(mulx) | 67 | /* Load a gzip-compressed kernel to a dynamically allocated buffer. */ |
82 | +ADVSIMD_TWOHALFOP(mulx) | ||
83 | + | ||
84 | /* fused multiply-accumulate */ | ||
85 | float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp) | ||
86 | { | ||
87 | @@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp) | ||
88 | return float16_muladd(a, b, c, 0, fpst); | ||
89 | } | ||
90 | |||
91 | +uint32_t HELPER(advsimd_muladd2h)(uint32_t two_a, uint32_t two_b, | ||
92 | + uint32_t two_c, void *fpstp) | ||
93 | +{ | ||
94 | + float_status *fpst = fpstp; | ||
95 | + float16 a1, a2, b1, b2, c1, c2; | ||
96 | + uint32_t r1, r2; | ||
97 | + a1 = extract32(two_a, 0, 16); | ||
98 | + a2 = extract32(two_a, 16, 16); | ||
99 | + b1 = extract32(two_b, 0, 16); | ||
100 | + b2 = extract32(two_b, 16, 16); | ||
101 | + c1 = extract32(two_c, 0, 16); | ||
102 | + c2 = extract32(two_c, 16, 16); | ||
103 | + r1 = float16_muladd(a1, b1, c1, 0, fpst); | ||
104 | + r2 = float16_muladd(a2, b2, c2, 0, fpst); | ||
105 | + return deposit32(r1, 16, 16, r2); | ||
106 | +} | ||
107 | + | ||
108 | /* | ||
109 | * Floating point comparisons produce an integer result. Softfloat | ||
110 | * routines return float_relation types which we convert to the 0/-1 | ||
111 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
112 | index XXXXXXX..XXXXXXX 100644 | ||
113 | --- a/target/arm/translate-a64.c | ||
114 | +++ b/target/arm/translate-a64.c | ||
115 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
116 | * multiply-add */ | ||
117 | tcg_gen_xori_i32(tcg_op, tcg_op, 0x80008000); | ||
118 | } | ||
119 | - gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx, | ||
120 | - tcg_res, fpst); | ||
121 | + if (is_scalar) { | ||
122 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx, | ||
123 | + tcg_res, fpst); | ||
124 | + } else { | ||
125 | + gen_helper_advsimd_muladd2h(tcg_res, tcg_op, tcg_idx, | ||
126 | + tcg_res, fpst); | ||
127 | + } | ||
128 | break; | ||
129 | case 2: | ||
130 | if (opcode == 0x5) { | ||
131 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
132 | switch (size) { | ||
133 | case 1: | ||
134 | if (u) { | ||
135 | - gen_helper_advsimd_mulxh(tcg_res, tcg_op, tcg_idx, | ||
136 | - fpst); | ||
137 | + if (is_scalar) { | ||
138 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op, | ||
139 | + tcg_idx, fpst); | ||
140 | + } else { | ||
141 | + gen_helper_advsimd_mulx2h(tcg_res, tcg_op, | ||
142 | + tcg_idx, fpst); | ||
143 | + } | ||
144 | } else { | ||
145 | - g_assert_not_reached(); | ||
146 | + if (is_scalar) { | ||
147 | + gen_helper_advsimd_mulh(tcg_res, tcg_op, | ||
148 | + tcg_idx, fpst); | ||
149 | + } else { | ||
150 | + gen_helper_advsimd_mul2h(tcg_res, tcg_op, | ||
151 | + tcg_idx, fpst); | ||
152 | + } | ||
153 | } | ||
154 | break; | ||
155 | case 2: | ||
156 | -- | 68 | -- |
157 | 2.16.2 | 69 | 2.16.2 |
158 | 70 | ||
159 | 71 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Instead of loading kernels, device trees, and the like to |
---|---|---|---|
2 | the system address space, use the CPU's address space. This | ||
3 | is important if we're trying to load the file to memory or | ||
4 | via an alias memory region that is provided by an SoC | ||
5 | object and thus not mapped into the system address space. | ||
2 | 6 | ||
3 | Much like recpe the ARM ARM has simplified the pseudo code for the | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | calculation which is done on a fixed point 9 bit integer maths. So | 8 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
5 | while adding f16 we can also clean this up to be a little less heavy | 9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
6 | on the floating point and just return the fractional part and leave | 10 | Message-id: 20180220180325.29818-3-peter.maydell@linaro.org |
7 | the calle's to do the final packing of the result. | 11 | --- |
12 | hw/arm/boot.c | 119 +++++++++++++++++++++++++++++++++++++--------------------- | ||
13 | 1 file changed, 76 insertions(+), 43 deletions(-) | ||
8 | 14 | ||
9 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 15 | diff --git a/hw/arm/boot.c b/hw/arm/boot.c |
10 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20180227143852.11175-27-alex.bennee@linaro.org | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | --- | ||
14 | target/arm/helper.h | 1 + | ||
15 | target/arm/helper.c | 221 ++++++++++++++++++++++++---------------------------- | ||
16 | 2 files changed, 104 insertions(+), 118 deletions(-) | ||
17 | |||
18 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
19 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/helper.h | 17 | --- a/hw/arm/boot.c |
21 | +++ b/target/arm/helper.h | 18 | +++ b/hw/arm/boot.c |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(rsqrts_f32, f32, f32, f32, env) | 19 | @@ -XXX,XX +XXX,XX @@ |
23 | DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr) | 20 | #define ARM64_TEXT_OFFSET_OFFSET 8 |
24 | DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr) | 21 | #define ARM64_MAGIC_OFFSET 56 |
25 | DEF_HELPER_FLAGS_2(recpe_f64, TCG_CALL_NO_RWG, f64, f64, ptr) | 22 | |
26 | +DEF_HELPER_FLAGS_2(rsqrte_f16, TCG_CALL_NO_RWG, f16, f16, ptr) | 23 | +static AddressSpace *arm_boot_address_space(ARMCPU *cpu, |
27 | DEF_HELPER_FLAGS_2(rsqrte_f32, TCG_CALL_NO_RWG, f32, f32, ptr) | 24 | + const struct arm_boot_info *info) |
28 | DEF_HELPER_FLAGS_2(rsqrte_f64, TCG_CALL_NO_RWG, f64, f64, ptr) | 25 | +{ |
29 | DEF_HELPER_2(recpe_u32, i32, i32, ptr) | 26 | + /* Return the address space to use for bootloader reads and writes. |
30 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 27 | + * We prefer the secure address space if the CPU has it and we're |
31 | index XXXXXXX..XXXXXXX 100644 | 28 | + * going to boot the guest into it. |
32 | --- a/target/arm/helper.c | 29 | + */ |
33 | +++ b/target/arm/helper.c | 30 | + int asidx; |
34 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp) | 31 | + CPUState *cs = CPU(cpu); |
35 | /* The algorithm that must be used to calculate the estimate | ||
36 | * is specified by the ARM ARM. | ||
37 | */ | ||
38 | -static float64 recip_sqrt_estimate(float64 a, float_status *real_fp_status) | ||
39 | + | 32 | + |
40 | +static int do_recip_sqrt_estimate(int a) | 33 | + if (arm_feature(&cpu->env, ARM_FEATURE_EL3) && info->secure_boot) { |
41 | { | 34 | + asidx = ARMASIdx_S; |
42 | - /* These calculations mustn't set any fp exception flags, | 35 | + } else { |
43 | - * so we use a local copy of the fp_status. | 36 | + asidx = ARMASIdx_NS; |
44 | - */ | ||
45 | - float_status dummy_status = *real_fp_status; | ||
46 | - float_status *s = &dummy_status; | ||
47 | - float64 q; | ||
48 | - int64_t q_int; | ||
49 | + int b, estimate; | ||
50 | |||
51 | - if (float64_lt(a, float64_half, s)) { | ||
52 | - /* range 0.25 <= a < 0.5 */ | ||
53 | - | ||
54 | - /* a in units of 1/512 rounded down */ | ||
55 | - /* q0 = (int)(a * 512.0); */ | ||
56 | - q = float64_mul(float64_512, a, s); | ||
57 | - q_int = float64_to_int64_round_to_zero(q, s); | ||
58 | - | ||
59 | - /* reciprocal root r */ | ||
60 | - /* r = 1.0 / sqrt(((double)q0 + 0.5) / 512.0); */ | ||
61 | - q = int64_to_float64(q_int, s); | ||
62 | - q = float64_add(q, float64_half, s); | ||
63 | - q = float64_div(q, float64_512, s); | ||
64 | - q = float64_sqrt(q, s); | ||
65 | - q = float64_div(float64_one, q, s); | ||
66 | + assert(128 <= a && a < 512); | ||
67 | + if (a < 256) { | ||
68 | + a = a * 2 + 1; | ||
69 | } else { | ||
70 | - /* range 0.5 <= a < 1.0 */ | ||
71 | - | ||
72 | - /* a in units of 1/256 rounded down */ | ||
73 | - /* q1 = (int)(a * 256.0); */ | ||
74 | - q = float64_mul(float64_256, a, s); | ||
75 | - int64_t q_int = float64_to_int64_round_to_zero(q, s); | ||
76 | - | ||
77 | - /* reciprocal root r */ | ||
78 | - /* r = 1.0 /sqrt(((double)q1 + 0.5) / 256); */ | ||
79 | - q = int64_to_float64(q_int, s); | ||
80 | - q = float64_add(q, float64_half, s); | ||
81 | - q = float64_div(q, float64_256, s); | ||
82 | - q = float64_sqrt(q, s); | ||
83 | - q = float64_div(float64_one, q, s); | ||
84 | + a = (a >> 1) << 1; | ||
85 | + a = (a + 1) * 2; | ||
86 | } | ||
87 | - /* r in units of 1/256 rounded to nearest */ | ||
88 | - /* s = (int)(256.0 * r + 0.5); */ | ||
89 | + b = 512; | ||
90 | + while (a * (b + 1) * (b + 1) < (1 << 28)) { | ||
91 | + b += 1; | ||
92 | + } | ||
93 | + estimate = (b + 1) / 2; | ||
94 | + assert(256 <= estimate && estimate < 512); | ||
95 | |||
96 | - q = float64_mul(q, float64_256,s ); | ||
97 | - q = float64_add(q, float64_half, s); | ||
98 | - q_int = float64_to_int64_round_to_zero(q, s); | ||
99 | + return estimate; | ||
100 | +} | ||
101 | |||
102 | - /* return (double)s / 256.0;*/ | ||
103 | - return float64_div(int64_to_float64(q_int, s), float64_256, s); | ||
104 | + | ||
105 | +static uint64_t recip_sqrt_estimate(int *exp , int exp_off, uint64_t frac) | ||
106 | +{ | ||
107 | + int estimate; | ||
108 | + uint32_t scaled; | ||
109 | + | ||
110 | + if (*exp == 0) { | ||
111 | + while (extract64(frac, 51, 1) == 0) { | ||
112 | + frac = frac << 1; | ||
113 | + *exp -= 1; | ||
114 | + } | ||
115 | + frac = extract64(frac, 0, 51) << 1; | ||
116 | + } | 37 | + } |
117 | + | 38 | + |
118 | + if (*exp & 1) { | 39 | + return cpu_get_address_space(cs, asidx); |
119 | + /* scaled = UInt('01':fraction<51:45>) */ | ||
120 | + scaled = deposit32(1 << 7, 0, 7, extract64(frac, 45, 7)); | ||
121 | + } else { | ||
122 | + /* scaled = UInt('1':fraction<51:44>) */ | ||
123 | + scaled = deposit32(1 << 8, 0, 8, extract64(frac, 44, 8)); | ||
124 | + } | ||
125 | + estimate = do_recip_sqrt_estimate(scaled); | ||
126 | + | ||
127 | + *exp = (exp_off - *exp) / 2; | ||
128 | + return extract64(estimate, 0, 8) << 44; | ||
129 | +} | 40 | +} |
130 | + | 41 | + |
131 | +float16 HELPER(rsqrte_f16)(float16 input, void *fpstp) | 42 | typedef enum { |
132 | +{ | 43 | FIXUP_NONE = 0, /* do nothing */ |
133 | + float_status *s = fpstp; | 44 | FIXUP_TERMINATOR, /* end of insns */ |
134 | + float16 f16 = float16_squash_input_denormal(input, s); | 45 | @@ -XXX,XX +XXX,XX @@ static const ARMInsnFixup smpboot[] = { |
135 | + uint16_t val = float16_val(f16); | 46 | }; |
136 | + bool f16_sign = float16_is_neg(f16); | 47 | |
137 | + int f16_exp = extract32(val, 10, 5); | 48 | static void write_bootloader(const char *name, hwaddr addr, |
138 | + uint16_t f16_frac = extract32(val, 0, 10); | 49 | - const ARMInsnFixup *insns, uint32_t *fixupcontext) |
139 | + uint64_t f64_frac; | 50 | + const ARMInsnFixup *insns, uint32_t *fixupcontext, |
51 | + AddressSpace *as) | ||
52 | { | ||
53 | /* Fix up the specified bootloader fragment and write it into | ||
54 | * guest memory using rom_add_blob_fixed(). fixupcontext is | ||
55 | @@ -XXX,XX +XXX,XX @@ static void write_bootloader(const char *name, hwaddr addr, | ||
56 | code[i] = tswap32(insn); | ||
57 | } | ||
58 | |||
59 | - rom_add_blob_fixed(name, code, len * sizeof(uint32_t), addr); | ||
60 | + rom_add_blob_fixed_as(name, code, len * sizeof(uint32_t), addr, as); | ||
61 | |||
62 | g_free(code); | ||
63 | } | ||
64 | @@ -XXX,XX +XXX,XX @@ static void default_write_secondary(ARMCPU *cpu, | ||
65 | const struct arm_boot_info *info) | ||
66 | { | ||
67 | uint32_t fixupcontext[FIXUP_MAX]; | ||
68 | + AddressSpace *as = arm_boot_address_space(cpu, info); | ||
69 | |||
70 | fixupcontext[FIXUP_GIC_CPU_IF] = info->gic_cpu_if_addr; | ||
71 | fixupcontext[FIXUP_BOOTREG] = info->smp_bootreg_addr; | ||
72 | @@ -XXX,XX +XXX,XX @@ static void default_write_secondary(ARMCPU *cpu, | ||
73 | } | ||
74 | |||
75 | write_bootloader("smpboot", info->smp_loader_start, | ||
76 | - smpboot, fixupcontext); | ||
77 | + smpboot, fixupcontext, as); | ||
78 | } | ||
79 | |||
80 | void arm_write_secure_board_setup_dummy_smc(ARMCPU *cpu, | ||
81 | const struct arm_boot_info *info, | ||
82 | hwaddr mvbar_addr) | ||
83 | { | ||
84 | + AddressSpace *as = arm_boot_address_space(cpu, info); | ||
85 | int n; | ||
86 | uint32_t mvbar_blob[] = { | ||
87 | /* mvbar_addr: secure monitor vectors | ||
88 | @@ -XXX,XX +XXX,XX @@ void arm_write_secure_board_setup_dummy_smc(ARMCPU *cpu, | ||
89 | for (n = 0; n < ARRAY_SIZE(mvbar_blob); n++) { | ||
90 | mvbar_blob[n] = tswap32(mvbar_blob[n]); | ||
91 | } | ||
92 | - rom_add_blob_fixed("board-setup-mvbar", mvbar_blob, sizeof(mvbar_blob), | ||
93 | - mvbar_addr); | ||
94 | + rom_add_blob_fixed_as("board-setup-mvbar", mvbar_blob, sizeof(mvbar_blob), | ||
95 | + mvbar_addr, as); | ||
96 | |||
97 | for (n = 0; n < ARRAY_SIZE(board_setup_blob); n++) { | ||
98 | board_setup_blob[n] = tswap32(board_setup_blob[n]); | ||
99 | } | ||
100 | - rom_add_blob_fixed("board-setup", board_setup_blob, | ||
101 | - sizeof(board_setup_blob), info->board_setup_addr); | ||
102 | + rom_add_blob_fixed_as("board-setup", board_setup_blob, | ||
103 | + sizeof(board_setup_blob), info->board_setup_addr, as); | ||
104 | } | ||
105 | |||
106 | static void default_reset_secondary(ARMCPU *cpu, | ||
107 | const struct arm_boot_info *info) | ||
108 | { | ||
109 | + AddressSpace *as = arm_boot_address_space(cpu, info); | ||
110 | CPUState *cs = CPU(cpu); | ||
111 | |||
112 | - address_space_stl_notdirty(&address_space_memory, info->smp_bootreg_addr, | ||
113 | + address_space_stl_notdirty(as, info->smp_bootreg_addr, | ||
114 | 0, MEMTXATTRS_UNSPECIFIED, NULL); | ||
115 | cpu_set_pc(cs, info->smp_loader_start); | ||
116 | } | ||
117 | @@ -XXX,XX +XXX,XX @@ static inline bool have_dtb(const struct arm_boot_info *info) | ||
118 | } | ||
119 | |||
120 | #define WRITE_WORD(p, value) do { \ | ||
121 | - address_space_stl_notdirty(&address_space_memory, p, value, \ | ||
122 | + address_space_stl_notdirty(as, p, value, \ | ||
123 | MEMTXATTRS_UNSPECIFIED, NULL); \ | ||
124 | p += 4; \ | ||
125 | } while (0) | ||
126 | |||
127 | -static void set_kernel_args(const struct arm_boot_info *info) | ||
128 | +static void set_kernel_args(const struct arm_boot_info *info, AddressSpace *as) | ||
129 | { | ||
130 | int initrd_size = info->initrd_size; | ||
131 | hwaddr base = info->loader_start; | ||
132 | @@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info) | ||
133 | int cmdline_size; | ||
134 | |||
135 | cmdline_size = strlen(info->kernel_cmdline); | ||
136 | - cpu_physical_memory_write(p + 8, info->kernel_cmdline, | ||
137 | - cmdline_size + 1); | ||
138 | + address_space_write(as, p + 8, MEMTXATTRS_UNSPECIFIED, | ||
139 | + (const uint8_t *)info->kernel_cmdline, | ||
140 | + cmdline_size + 1); | ||
141 | cmdline_size = (cmdline_size >> 2) + 1; | ||
142 | WRITE_WORD(p, cmdline_size + 2); | ||
143 | WRITE_WORD(p, 0x54410009); | ||
144 | @@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info) | ||
145 | atag_board_len = (info->atag_board(info, atag_board_buf) + 3) & ~3; | ||
146 | WRITE_WORD(p, (atag_board_len + 8) >> 2); | ||
147 | WRITE_WORD(p, 0x414f4d50); | ||
148 | - cpu_physical_memory_write(p, atag_board_buf, atag_board_len); | ||
149 | + address_space_write(as, p, MEMTXATTRS_UNSPECIFIED, | ||
150 | + atag_board_buf, atag_board_len); | ||
151 | p += atag_board_len; | ||
152 | } | ||
153 | /* ATAG_END */ | ||
154 | @@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info) | ||
155 | WRITE_WORD(p, 0); | ||
156 | } | ||
157 | |||
158 | -static void set_kernel_args_old(const struct arm_boot_info *info) | ||
159 | +static void set_kernel_args_old(const struct arm_boot_info *info, | ||
160 | + AddressSpace *as) | ||
161 | { | ||
162 | hwaddr p; | ||
163 | const char *s; | ||
164 | @@ -XXX,XX +XXX,XX @@ static void set_kernel_args_old(const struct arm_boot_info *info) | ||
165 | } | ||
166 | s = info->kernel_cmdline; | ||
167 | if (s) { | ||
168 | - cpu_physical_memory_write(p, s, strlen(s) + 1); | ||
169 | + address_space_write(as, p, MEMTXATTRS_UNSPECIFIED, | ||
170 | + (const uint8_t *)s, strlen(s) + 1); | ||
171 | } else { | ||
172 | WRITE_WORD(p, 0); | ||
173 | } | ||
174 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt) | ||
175 | * @addr: the address to load the image at | ||
176 | * @binfo: struct describing the boot environment | ||
177 | * @addr_limit: upper limit of the available memory area at @addr | ||
178 | + * @as: address space to load image to | ||
179 | * | ||
180 | * Load a device tree supplied by the machine or by the user with the | ||
181 | * '-dtb' command line option, and put it at offset @addr in target | ||
182 | @@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt) | ||
183 | * Note: Must not be called unless have_dtb(binfo) is true. | ||
184 | */ | ||
185 | static int load_dtb(hwaddr addr, const struct arm_boot_info *binfo, | ||
186 | - hwaddr addr_limit) | ||
187 | + hwaddr addr_limit, AddressSpace *as) | ||
188 | { | ||
189 | void *fdt = NULL; | ||
190 | int size, rc; | ||
191 | @@ -XXX,XX +XXX,XX @@ static int load_dtb(hwaddr addr, const struct arm_boot_info *binfo, | ||
192 | /* Put the DTB into the memory map as a ROM image: this will ensure | ||
193 | * the DTB is copied again upon reset, even if addr points into RAM. | ||
194 | */ | ||
195 | - rom_add_blob_fixed("dtb", fdt, size, addr); | ||
196 | + rom_add_blob_fixed_as("dtb", fdt, size, addr, as); | ||
197 | |||
198 | g_free(fdt); | ||
199 | |||
200 | @@ -XXX,XX +XXX,XX @@ static void do_cpu_reset(void *opaque) | ||
201 | } | ||
202 | |||
203 | if (cs == first_cpu) { | ||
204 | + AddressSpace *as = arm_boot_address_space(cpu, info); | ||
140 | + | 205 | + |
141 | + if (float16_is_any_nan(f16)) { | 206 | cpu_set_pc(cs, info->loader_start); |
142 | + float16 nan = f16; | 207 | |
143 | + if (float16_is_signaling_nan(f16, s)) { | 208 | if (!have_dtb(info)) { |
144 | + float_raise(float_flag_invalid, s); | 209 | if (old_param) { |
145 | + nan = float16_maybe_silence_nan(f16, s); | 210 | - set_kernel_args_old(info); |
146 | + } | 211 | + set_kernel_args_old(info, as); |
147 | + if (s->default_nan_mode) { | 212 | } else { |
148 | + nan = float16_default_nan(s); | 213 | - set_kernel_args(info); |
149 | + } | 214 | + set_kernel_args(info, as); |
150 | + return nan; | 215 | } |
151 | + } else if (float16_is_zero(f16)) { | 216 | } |
152 | + float_raise(float_flag_divbyzero, s); | 217 | } else { |
153 | + return float16_set_sign(float16_infinity, f16_sign); | 218 | @@ -XXX,XX +XXX,XX @@ static int do_arm_linux_init(Object *obj, void *opaque) |
154 | + } else if (f16_sign) { | 219 | |
155 | + float_raise(float_flag_invalid, s); | 220 | static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry, |
156 | + return float16_default_nan(s); | 221 | uint64_t *lowaddr, uint64_t *highaddr, |
157 | + } else if (float16_is_infinity(f16)) { | 222 | - int elf_machine) |
158 | + return float16_zero; | 223 | + int elf_machine, AddressSpace *as) |
159 | + } | 224 | { |
160 | + | 225 | bool elf_is64; |
161 | + /* Scale and normalize to a double-precision value between 0.25 and 1.0, | 226 | union { |
162 | + * preserving the parity of the exponent. */ | 227 | @@ -XXX,XX +XXX,XX @@ static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry, |
163 | + | 228 | } |
164 | + f64_frac = ((uint64_t) f16_frac) << (52 - 10); | 229 | } |
165 | + | 230 | |
166 | + f64_frac = recip_sqrt_estimate(&f16_exp, 44, f64_frac); | 231 | - ret = load_elf(info->kernel_filename, NULL, NULL, |
167 | + | 232 | - pentry, lowaddr, highaddr, big_endian, elf_machine, |
168 | + /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(2) */ | 233 | - 1, data_swab); |
169 | + val = deposit32(0, 15, 1, f16_sign); | 234 | + ret = load_elf_as(info->kernel_filename, NULL, NULL, |
170 | + val = deposit32(val, 10, 5, f16_exp); | 235 | + pentry, lowaddr, highaddr, big_endian, elf_machine, |
171 | + val = deposit32(val, 2, 8, extract64(f64_frac, 52 - 8, 8)); | 236 | + 1, data_swab, as); |
172 | + return make_float16(val); | 237 | if (ret <= 0) { |
173 | } | 238 | /* The header loaded but the image didn't */ |
174 | 239 | exit(1); | |
175 | float32 HELPER(rsqrte_f32)(float32 input, void *fpstp) | 240 | @@ -XXX,XX +XXX,XX @@ static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry, |
176 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrte_f32)(float32 input, void *fpstp) | 241 | } |
177 | float_status *s = fpstp; | 242 | |
178 | float32 f32 = float32_squash_input_denormal(input, s); | 243 | static uint64_t load_aarch64_image(const char *filename, hwaddr mem_base, |
179 | uint32_t val = float32_val(f32); | 244 | - hwaddr *entry) |
180 | - uint32_t f32_sbit = 0x80000000 & val; | 245 | + hwaddr *entry, AddressSpace *as) |
181 | - int32_t f32_exp = extract32(val, 23, 8); | 246 | { |
182 | + uint32_t f32_sign = float32_is_neg(f32); | 247 | hwaddr kernel_load_offset = KERNEL64_LOAD_ADDR; |
183 | + int f32_exp = extract32(val, 23, 8); | 248 | uint8_t *buffer; |
184 | uint32_t f32_frac = extract32(val, 0, 23); | 249 | @@ -XXX,XX +XXX,XX @@ static uint64_t load_aarch64_image(const char *filename, hwaddr mem_base, |
185 | uint64_t f64_frac; | 250 | } |
186 | - uint64_t val64; | 251 | |
187 | - int result_exp; | 252 | *entry = mem_base + kernel_load_offset; |
188 | - float64 f64; | 253 | - rom_add_blob_fixed(filename, buffer, size, *entry); |
189 | 254 | + rom_add_blob_fixed_as(filename, buffer, size, *entry, as); | |
190 | if (float32_is_any_nan(f32)) { | 255 | |
191 | float32 nan = f32; | 256 | g_free(buffer); |
192 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrte_f32)(float32 input, void *fpstp) | 257 | |
193 | * preserving the parity of the exponent. */ | 258 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
194 | 259 | ARMCPU *cpu = n->cpu; | |
195 | f64_frac = ((uint64_t) f32_frac) << 29; | 260 | struct arm_boot_info *info = |
196 | - if (f32_exp == 0) { | 261 | container_of(n, struct arm_boot_info, load_kernel_notifier); |
197 | - while (extract64(f64_frac, 51, 1) == 0) { | 262 | + AddressSpace *as = arm_boot_address_space(cpu, info); |
198 | - f64_frac = f64_frac << 1; | 263 | |
199 | - f32_exp = f32_exp-1; | 264 | /* The board code is not supposed to set secure_board_setup unless |
200 | - } | 265 | * running its code in secure mode is actually possible, and KVM |
201 | - f64_frac = extract64(f64_frac, 0, 51) << 1; | 266 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
202 | - } | 267 | * the kernel is supposed to be loaded by the bootloader), copy the |
203 | 268 | * DTB to the base of RAM for the bootloader to pick up. | |
204 | - if (extract64(f32_exp, 0, 1) == 0) { | 269 | */ |
205 | - f64 = make_float64(((uint64_t) f32_sbit) << 32 | 270 | - if (load_dtb(info->loader_start, info, 0) < 0) { |
206 | - | (0x3feULL << 52) | 271 | + if (load_dtb(info->loader_start, info, 0, as) < 0) { |
207 | - | f64_frac); | 272 | exit(1); |
208 | - } else { | 273 | } |
209 | - f64 = make_float64(((uint64_t) f32_sbit) << 32 | 274 | } |
210 | - | (0x3fdULL << 52) | 275 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
211 | - | f64_frac); | 276 | |
212 | - } | 277 | /* Assume that raw images are linux kernels, and ELF images are not. */ |
213 | + f64_frac = recip_sqrt_estimate(&f32_exp, 380, f64_frac); | 278 | kernel_size = arm_load_elf(info, &elf_entry, &elf_low_addr, |
214 | 279 | - &elf_high_addr, elf_machine); | |
215 | - result_exp = (380 - f32_exp) / 2; | 280 | + &elf_high_addr, elf_machine, as); |
216 | - | 281 | if (kernel_size > 0 && have_dtb(info)) { |
217 | - f64 = recip_sqrt_estimate(f64, s); | 282 | /* If there is still some room left at the base of RAM, try and put |
218 | - | 283 | * the DTB there like we do for images loaded with -bios or -pflash. |
219 | - val64 = float64_val(f64); | 284 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
220 | - | 285 | if (elf_low_addr < info->loader_start) { |
221 | - val = ((result_exp & 0xff) << 23) | 286 | elf_low_addr = 0; |
222 | - | ((val64 >> 29) & 0x7fffff); | 287 | } |
223 | + /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(15) */ | 288 | - if (load_dtb(info->loader_start, info, elf_low_addr) < 0) { |
224 | + val = deposit32(0, 31, 1, f32_sign); | 289 | + if (load_dtb(info->loader_start, info, elf_low_addr, as) < 0) { |
225 | + val = deposit32(val, 23, 8, f32_exp); | 290 | exit(1); |
226 | + val = deposit32(val, 15, 8, extract64(f64_frac, 52 - 8, 8)); | 291 | } |
227 | return make_float32(val); | 292 | } |
228 | } | 293 | } |
229 | 294 | entry = elf_entry; | |
230 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp) | 295 | if (kernel_size < 0) { |
231 | float_status *s = fpstp; | 296 | - kernel_size = load_uimage(info->kernel_filename, &entry, NULL, |
232 | float64 f64 = float64_squash_input_denormal(input, s); | 297 | - &is_linux, NULL, NULL); |
233 | uint64_t val = float64_val(f64); | 298 | + kernel_size = load_uimage_as(info->kernel_filename, &entry, NULL, |
234 | - uint64_t f64_sbit = 0x8000000000000000ULL & val; | 299 | + &is_linux, NULL, NULL, as); |
235 | - int64_t f64_exp = extract64(val, 52, 11); | 300 | } |
236 | + bool f64_sign = float64_is_neg(f64); | 301 | if (arm_feature(&cpu->env, ARM_FEATURE_AARCH64) && kernel_size < 0) { |
237 | + int f64_exp = extract64(val, 52, 11); | 302 | kernel_size = load_aarch64_image(info->kernel_filename, |
238 | uint64_t f64_frac = extract64(val, 0, 52); | 303 | - info->loader_start, &entry); |
239 | - int64_t result_exp; | 304 | + info->loader_start, &entry, as); |
240 | - uint64_t result_frac; | 305 | is_linux = 1; |
241 | 306 | } else if (kernel_size < 0) { | |
242 | if (float64_is_any_nan(f64)) { | 307 | /* 32-bit ARM */ |
243 | float64 nan = f64; | 308 | entry = info->loader_start + KERNEL_LOAD_ADDR; |
244 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp) | 309 | - kernel_size = load_image_targphys(info->kernel_filename, entry, |
245 | return float64_zero; | 310 | - info->ram_size - KERNEL_LOAD_ADDR); |
246 | } | 311 | + kernel_size = load_image_targphys_as(info->kernel_filename, entry, |
247 | 312 | + info->ram_size - KERNEL_LOAD_ADDR, | |
248 | - /* Scale and normalize to a double-precision value between 0.25 and 1.0, | 313 | + as); |
249 | - * preserving the parity of the exponent. */ | 314 | is_linux = 1; |
250 | + f64_frac = recip_sqrt_estimate(&f64_exp, 3068, f64_frac); | 315 | } |
251 | 316 | if (kernel_size < 0) { | |
252 | - if (f64_exp == 0) { | 317 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
253 | - while (extract64(f64_frac, 51, 1) == 0) { | 318 | uint32_t fixupcontext[FIXUP_MAX]; |
254 | - f64_frac = f64_frac << 1; | 319 | |
255 | - f64_exp = f64_exp - 1; | 320 | if (info->initrd_filename) { |
256 | - } | 321 | - initrd_size = load_ramdisk(info->initrd_filename, |
257 | - f64_frac = extract64(f64_frac, 0, 51) << 1; | 322 | - info->initrd_start, |
258 | - } | 323 | - info->ram_size - |
259 | - | 324 | - info->initrd_start); |
260 | - if (extract64(f64_exp, 0, 1) == 0) { | 325 | + initrd_size = load_ramdisk_as(info->initrd_filename, |
261 | - f64 = make_float64(f64_sbit | 326 | + info->initrd_start, |
262 | - | (0x3feULL << 52) | 327 | + info->ram_size - info->initrd_start, |
263 | - | f64_frac); | 328 | + as); |
264 | - } else { | 329 | if (initrd_size < 0) { |
265 | - f64 = make_float64(f64_sbit | 330 | - initrd_size = load_image_targphys(info->initrd_filename, |
266 | - | (0x3fdULL << 52) | 331 | - info->initrd_start, |
267 | - | f64_frac); | 332 | - info->ram_size - |
268 | - } | 333 | - info->initrd_start); |
269 | - | 334 | + initrd_size = load_image_targphys_as(info->initrd_filename, |
270 | - result_exp = (3068 - f64_exp) / 2; | 335 | + info->initrd_start, |
271 | - | 336 | + info->ram_size - |
272 | - f64 = recip_sqrt_estimate(f64, s); | 337 | + info->initrd_start, |
273 | - | 338 | + as); |
274 | - result_frac = extract64(float64_val(f64), 0, 52); | 339 | } |
275 | - | 340 | if (initrd_size < 0) { |
276 | - return make_float64(f64_sbit | | 341 | error_report("could not load initrd '%s'", |
277 | - ((result_exp & 0x7ff) << 52) | | 342 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
278 | - result_frac); | 343 | |
279 | + /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(44) */ | 344 | /* Place the DTB after the initrd in memory with alignment. */ |
280 | + val = deposit64(0, 61, 1, f64_sign); | 345 | dtb_start = QEMU_ALIGN_UP(info->initrd_start + initrd_size, align); |
281 | + val = deposit64(val, 52, 11, f64_exp); | 346 | - if (load_dtb(dtb_start, info, 0) < 0) { |
282 | + val = deposit64(val, 44, 8, extract64(f64_frac, 52 - 8, 8)); | 347 | + if (load_dtb(dtb_start, info, 0, as) < 0) { |
283 | + return make_float64(val); | 348 | exit(1); |
284 | } | 349 | } |
285 | 350 | fixupcontext[FIXUP_ARGPTR] = dtb_start; | |
286 | uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp) | 351 | @@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data) |
287 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp) | 352 | fixupcontext[FIXUP_ENTRYPOINT] = entry; |
288 | 353 | ||
289 | uint32_t HELPER(rsqrte_u32)(uint32_t a, void *fpstp) | 354 | write_bootloader("bootloader", info->loader_start, |
290 | { | 355 | - primary_loader, fixupcontext); |
291 | - float_status *fpst = fpstp; | 356 | + primary_loader, fixupcontext, as); |
292 | - float64 f64; | 357 | |
293 | + int estimate; | 358 | if (info->nb_cpus > 1) { |
294 | 359 | info->write_secondary_boot(cpu, info); | |
295 | if ((a & 0xc0000000) == 0) { | ||
296 | return 0xffffffff; | ||
297 | } | ||
298 | |||
299 | - if (a & 0x80000000) { | ||
300 | - f64 = make_float64((0x3feULL << 52) | ||
301 | - | ((uint64_t)(a & 0x7fffffff) << 21)); | ||
302 | - } else { /* bits 31-30 == '01' */ | ||
303 | - f64 = make_float64((0x3fdULL << 52) | ||
304 | - | ((uint64_t)(a & 0x3fffffff) << 22)); | ||
305 | - } | ||
306 | + estimate = do_recip_sqrt_estimate(extract32(a, 23, 9)); | ||
307 | |||
308 | - f64 = recip_sqrt_estimate(f64, fpst); | ||
309 | - | ||
310 | - return 0x80000000 | ((float64_val(f64) >> 21) & 0x7fffffff); | ||
311 | + return deposit32(0, 23, 9, estimate); | ||
312 | } | ||
313 | |||
314 | /* VFPv4 fused multiply-accumulate */ | ||
315 | -- | 360 | -- |
316 | 2.16.2 | 361 | 2.16.2 |
317 | 362 | ||
318 | 363 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Instead of loading guest images to the system address space, use the |
---|---|---|---|
2 | CPU's address space. This is important if we're trying to load the | ||
3 | file to memory or via an alias memory region that is provided by an | ||
4 | SoC object and thus not mapped into the system address space. | ||
2 | 5 | ||
3 | I re-use the existing handle_2misc_fcmp_zero handler and tweak it | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | slightly to deal with the half-precision case. | 7 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20180220180325.29818-4-peter.maydell@linaro.org | ||
10 | --- | ||
11 | hw/arm/armv7m.c | 17 ++++++++++++++--- | ||
12 | 1 file changed, 14 insertions(+), 3 deletions(-) | ||
5 | 13 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 14 | diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180227143852.11175-20-alex.bennee@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/translate-a64.c | 80 +++++++++++++++++++++++++++++++++------------- | ||
12 | 1 file changed, 57 insertions(+), 23 deletions(-) | ||
13 | |||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 16 | --- a/hw/arm/armv7m.c |
17 | +++ b/target/arm/translate-a64.c | 17 | +++ b/hw/arm/armv7m.c |
18 | @@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode, | 18 | @@ -XXX,XX +XXX,XX @@ void armv7m_load_kernel(ARMCPU *cpu, const char *kernel_filename, int mem_size) |
19 | bool is_scalar, bool is_u, bool is_q, | 19 | uint64_t entry; |
20 | int size, int rn, int rd) | 20 | uint64_t lowaddr; |
21 | { | 21 | int big_endian; |
22 | - bool is_double = (size == 3); | 22 | + AddressSpace *as; |
23 | + bool is_double = (size == MO_64); | 23 | + int asidx; |
24 | TCGv_ptr fpst; | 24 | + CPUState *cs = CPU(cpu); |
25 | 25 | ||
26 | if (!fp_access_check(s)) { | 26 | #ifdef TARGET_WORDS_BIGENDIAN |
27 | return; | 27 | big_endian = 1; |
28 | @@ -XXX,XX +XXX,XX @@ void armv7m_load_kernel(ARMCPU *cpu, const char *kernel_filename, int mem_size) | ||
29 | exit(1); | ||
28 | } | 30 | } |
29 | 31 | ||
30 | - fpst = get_fpstatus_ptr(false); | 32 | + if (arm_feature(&cpu->env, ARM_FEATURE_EL3)) { |
31 | + fpst = get_fpstatus_ptr(size == MO_16); | 33 | + asidx = ARMASIdx_S; |
32 | 34 | + } else { | |
33 | if (is_double) { | 35 | + asidx = ARMASIdx_NS; |
34 | TCGv_i64 tcg_op = tcg_temp_new_i64(); | 36 | + } |
35 | @@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode, | 37 | + as = cpu_get_address_space(cs, asidx); |
36 | bool swap = false; | 38 | + |
37 | int pass, maxpasses; | 39 | if (kernel_filename) { |
38 | 40 | - image_size = load_elf(kernel_filename, NULL, NULL, &entry, &lowaddr, | |
39 | - switch (opcode) { | 41 | - NULL, big_endian, EM_ARM, 1, 0); |
40 | - case 0x2e: /* FCMLT (zero) */ | 42 | + image_size = load_elf_as(kernel_filename, NULL, NULL, &entry, &lowaddr, |
41 | - swap = true; | 43 | + NULL, big_endian, EM_ARM, 1, 0, as); |
42 | - /* fall through */ | 44 | if (image_size < 0) { |
43 | - case 0x2c: /* FCMGT (zero) */ | 45 | - image_size = load_image_targphys(kernel_filename, 0, mem_size); |
44 | - genfn = gen_helper_neon_cgt_f32; | 46 | + image_size = load_image_targphys_as(kernel_filename, 0, |
45 | - break; | 47 | + mem_size, as); |
46 | - case 0x2d: /* FCMEQ (zero) */ | 48 | lowaddr = 0; |
47 | - genfn = gen_helper_neon_ceq_f32; | ||
48 | - break; | ||
49 | - case 0x6d: /* FCMLE (zero) */ | ||
50 | - swap = true; | ||
51 | - /* fall through */ | ||
52 | - case 0x6c: /* FCMGE (zero) */ | ||
53 | - genfn = gen_helper_neon_cge_f32; | ||
54 | - break; | ||
55 | - default: | ||
56 | - g_assert_not_reached(); | ||
57 | + if (size == MO_16) { | ||
58 | + switch (opcode) { | ||
59 | + case 0x2e: /* FCMLT (zero) */ | ||
60 | + swap = true; | ||
61 | + /* fall through */ | ||
62 | + case 0x2c: /* FCMGT (zero) */ | ||
63 | + genfn = gen_helper_advsimd_cgt_f16; | ||
64 | + break; | ||
65 | + case 0x2d: /* FCMEQ (zero) */ | ||
66 | + genfn = gen_helper_advsimd_ceq_f16; | ||
67 | + break; | ||
68 | + case 0x6d: /* FCMLE (zero) */ | ||
69 | + swap = true; | ||
70 | + /* fall through */ | ||
71 | + case 0x6c: /* FCMGE (zero) */ | ||
72 | + genfn = gen_helper_advsimd_cge_f16; | ||
73 | + break; | ||
74 | + default: | ||
75 | + g_assert_not_reached(); | ||
76 | + } | ||
77 | + } else { | ||
78 | + switch (opcode) { | ||
79 | + case 0x2e: /* FCMLT (zero) */ | ||
80 | + swap = true; | ||
81 | + /* fall through */ | ||
82 | + case 0x2c: /* FCMGT (zero) */ | ||
83 | + genfn = gen_helper_neon_cgt_f32; | ||
84 | + break; | ||
85 | + case 0x2d: /* FCMEQ (zero) */ | ||
86 | + genfn = gen_helper_neon_ceq_f32; | ||
87 | + break; | ||
88 | + case 0x6d: /* FCMLE (zero) */ | ||
89 | + swap = true; | ||
90 | + /* fall through */ | ||
91 | + case 0x6c: /* FCMGE (zero) */ | ||
92 | + genfn = gen_helper_neon_cge_f32; | ||
93 | + break; | ||
94 | + default: | ||
95 | + g_assert_not_reached(); | ||
96 | + } | ||
97 | } | 49 | } |
98 | 50 | if (image_size < 0) { | |
99 | if (is_scalar) { | ||
100 | maxpasses = 1; | ||
101 | } else { | ||
102 | - maxpasses = is_q ? 4 : 2; | ||
103 | + int vector_size = 8 << is_q; | ||
104 | + maxpasses = vector_size >> size; | ||
105 | } | ||
106 | |||
107 | for (pass = 0; pass < maxpasses; pass++) { | ||
108 | - read_vec_element_i32(s, tcg_op, rn, pass, MO_32); | ||
109 | + read_vec_element_i32(s, tcg_op, rn, pass, size); | ||
110 | if (swap) { | ||
111 | genfn(tcg_res, tcg_zero, tcg_op, fpst); | ||
112 | } else { | ||
113 | @@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode, | ||
114 | if (is_scalar) { | ||
115 | write_fp_sreg(s, rd, tcg_res); | ||
116 | } else { | ||
117 | - write_vec_element_i32(s, tcg_res, rd, pass, MO_32); | ||
118 | + write_vec_element_i32(s, tcg_res, rd, pass, size); | ||
119 | } | ||
120 | } | ||
121 | tcg_temp_free_i32(tcg_res); | ||
122 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | ||
123 | fpop = deposit32(opcode, 5, 1, a); | ||
124 | fpop = deposit32(fpop, 6, 1, u); | ||
125 | |||
126 | + rd = extract32(insn, 0, 5); | ||
127 | + rn = extract32(insn, 5, 5); | ||
128 | + | ||
129 | switch (fpop) { | ||
130 | + break; | ||
131 | + case 0x2c: /* FCMGT (zero) */ | ||
132 | + case 0x2d: /* FCMEQ (zero) */ | ||
133 | + case 0x2e: /* FCMLT (zero) */ | ||
134 | + case 0x6c: /* FCMGE (zero) */ | ||
135 | + case 0x6d: /* FCMLE (zero) */ | ||
136 | + handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd); | ||
137 | + return; | ||
138 | case 0x18: /* FRINTN */ | ||
139 | need_rmode = true; | ||
140 | only_in_vector = true; | ||
141 | -- | 51 | -- |
142 | 2.16.2 | 52 | 2.16.2 |
143 | 53 | ||
144 | 54 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | In v8M, the Implementation Defined Attribution Unit (IDAU) is |
---|---|---|---|
2 | 2 | a small piece of hardware typically implemented in the SoC | |
3 | Half-precision flush to zero behaviour is controlled by a separate | 3 | which provides board or SoC specific security attribution |
4 | FZ16 bit in the FPCR. To handle this we pass a pointer to | 4 | information for each address that the CPU performs MPU/SAU |
5 | fp_status_fp16 when working on half-precision operations. The value of | 5 | checks on. For QEMU, we model this with a QOM interface which |
6 | the presented FPCR is calculated from an amalgam of the two when read. | 6 | is implemented by the board or SoC object and connected to |
7 | 7 | the CPU using a link property. | |
8 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 8 | |
9 | This commit defines the new interface class, adds the link | ||
10 | property to the CPU object, and makes the SAU checking | ||
11 | code call the IDAU interface if one is present. | ||
12 | |||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 14 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
10 | Message-id: 20180227143852.11175-5-alex.bennee@linaro.org | 15 | Message-id: 20180220180325.29818-5-peter.maydell@linaro.org |
11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
12 | --- | 16 | --- |
13 | target/arm/cpu.h | 32 ++++++++++++++++++++++------ | 17 | target/arm/cpu.h | 3 +++ |
14 | target/arm/helper.c | 26 ++++++++++++++++++----- | 18 | target/arm/idau.h | 61 +++++++++++++++++++++++++++++++++++++++++++++++++++++ |
15 | target/arm/translate-a64.c | 53 +++++++++++++++++++++++++--------------------- | 19 | target/arm/cpu.c | 15 +++++++++++++ |
16 | 3 files changed, 75 insertions(+), 36 deletions(-) | 20 | target/arm/helper.c | 28 +++++++++++++++++++++--- |
21 | 4 files changed, 104 insertions(+), 3 deletions(-) | ||
22 | create mode 100644 target/arm/idau.h | ||
17 | 23 | ||
18 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | 24 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
19 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/cpu.h | 26 | --- a/target/arm/cpu.h |
21 | +++ b/target/arm/cpu.h | 27 | +++ b/target/arm/cpu.h |
22 | @@ -XXX,XX +XXX,XX @@ typedef struct CPUARMState { | 28 | @@ -XXX,XX +XXX,XX @@ struct ARMCPU { |
23 | /* scratch space when Tn are not sufficient. */ | 29 | /* MemoryRegion to use for secure physical accesses */ |
24 | uint32_t scratch[8]; | 30 | MemoryRegion *secure_memory; |
25 | 31 | ||
26 | - /* fp_status is the "normal" fp status. standard_fp_status retains | 32 | + /* For v8M, pointer to the IDAU interface provided by board/SoC */ |
27 | - * values corresponding to the ARM "Standard FPSCR Value", ie | 33 | + Object *idau; |
28 | - * default-NaN, flush-to-zero, round-to-nearest and is used by | 34 | + |
29 | - * any operations (generally Neon) which the architecture defines | 35 | /* 'compatible' string for this CPU for Linux device trees */ |
30 | - * as controlled by the standard FPSCR value rather than the FPSCR. | 36 | const char *dtb_compatible; |
31 | + /* There are a number of distinct float control structures: | 37 | |
32 | + * | 38 | diff --git a/target/arm/idau.h b/target/arm/idau.h |
33 | + * fp_status: is the "normal" fp status. | 39 | new file mode 100644 |
34 | + * fp_status_fp16: used for half-precision calculations | 40 | index XXXXXXX..XXXXXXX |
35 | + * standard_fp_status : the ARM "Standard FPSCR Value" | 41 | --- /dev/null |
36 | + * | 42 | +++ b/target/arm/idau.h |
37 | + * Half-precision operations are governed by a separate | 43 | @@ -XXX,XX +XXX,XX @@ |
38 | + * flush-to-zero control bit in FPSCR:FZ16. We pass a separate | 44 | +/* |
39 | + * status structure to control this. | 45 | + * QEMU ARM CPU -- interface for the Arm v8M IDAU |
40 | + * | 46 | + * |
41 | + * The "Standard FPSCR", ie default-NaN, flush-to-zero, | 47 | + * Copyright (c) 2018 Linaro Ltd |
42 | + * round-to-nearest and is used by any operations (generally | 48 | + * |
43 | + * Neon) which the architecture defines as controlled by the | 49 | + * This program is free software; you can redistribute it and/or |
44 | + * standard FPSCR value rather than the FPSCR. | 50 | + * modify it under the terms of the GNU General Public License |
45 | * | 51 | + * as published by the Free Software Foundation; either version 2 |
46 | * To avoid having to transfer exception bits around, we simply | 52 | + * of the License, or (at your option) any later version. |
47 | * say that the FPSCR cumulative exception flags are the logical | 53 | + * |
48 | - * OR of the flags in the two fp statuses. This relies on the | 54 | + * This program is distributed in the hope that it will be useful, |
49 | + * OR of the flags in the three fp statuses. This relies on the | 55 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of |
50 | * only thing which needs to read the exception flags being | 56 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
51 | * an explicit FPSCR read. | 57 | + * GNU General Public License for more details. |
52 | */ | 58 | + * |
53 | float_status fp_status; | 59 | + * You should have received a copy of the GNU General Public License |
54 | + float_status fp_status_f16; | 60 | + * along with this program; if not, see |
55 | float_status standard_fp_status; | 61 | + * <http://www.gnu.org/licenses/gpl-2.0.html> |
56 | 62 | + * | |
57 | /* ZCR_EL[1-3] */ | 63 | + * In the v8M architecture, the IDAU is a small piece of hardware |
58 | @@ -XXX,XX +XXX,XX @@ static inline void xpsr_write(CPUARMState *env, uint32_t val, uint32_t mask) | 64 | + * typically implemented in the SoC which provides board or SoC |
59 | uint32_t vfp_get_fpscr(CPUARMState *env); | 65 | + * specific security attribution information for each address that |
60 | void vfp_set_fpscr(CPUARMState *env, uint32_t val); | 66 | + * the CPU performs MPU/SAU checks on. For QEMU, we model this with a |
61 | 67 | + * QOM interface which is implemented by the board or SoC object and | |
62 | -/* For A64 the FPSCR is split into two logically distinct registers, | 68 | + * connected to the CPU using a link property. |
63 | +/* FPCR, Floating Point Control Register | 69 | + */ |
64 | + * FPSR, Floating Poiht Status Register | 70 | + |
65 | + * | 71 | +#ifndef TARGET_ARM_IDAU_H |
66 | + * For A64 the FPSCR is split into two logically distinct registers, | 72 | +#define TARGET_ARM_IDAU_H |
67 | * FPCR and FPSR. However since they still use non-overlapping bits | 73 | + |
68 | * we store the underlying state in fpscr and just mask on read/write. | 74 | +#include "qom/object.h" |
75 | + | ||
76 | +#define TYPE_IDAU_INTERFACE "idau-interface" | ||
77 | +#define IDAU_INTERFACE(obj) \ | ||
78 | + INTERFACE_CHECK(IDAUInterface, (obj), TYPE_IDAU_INTERFACE) | ||
79 | +#define IDAU_INTERFACE_CLASS(class) \ | ||
80 | + OBJECT_CLASS_CHECK(IDAUInterfaceClass, (class), TYPE_IDAU_INTERFACE) | ||
81 | +#define IDAU_INTERFACE_GET_CLASS(obj) \ | ||
82 | + OBJECT_GET_CLASS(IDAUInterfaceClass, (obj), TYPE_IDAU_INTERFACE) | ||
83 | + | ||
84 | +typedef struct IDAUInterface { | ||
85 | + Object parent; | ||
86 | +} IDAUInterface; | ||
87 | + | ||
88 | +#define IREGION_NOTVALID -1 | ||
89 | + | ||
90 | +typedef struct IDAUInterfaceClass { | ||
91 | + InterfaceClass parent; | ||
92 | + | ||
93 | + /* Check the specified address and return the IDAU security information | ||
94 | + * for it by filling in iregion, exempt, ns and nsc: | ||
95 | + * iregion: IDAU region number, or IREGION_NOTVALID if not valid | ||
96 | + * exempt: true if address is exempt from security attribution | ||
97 | + * ns: true if the address is NonSecure | ||
98 | + * nsc: true if the address is NonSecure-callable | ||
99 | + */ | ||
100 | + void (*check)(IDAUInterface *ii, uint32_t address, int *iregion, | ||
101 | + bool *exempt, bool *ns, bool *nsc); | ||
102 | +} IDAUInterfaceClass; | ||
103 | + | ||
104 | +#endif | ||
105 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | ||
106 | index XXXXXXX..XXXXXXX 100644 | ||
107 | --- a/target/arm/cpu.c | ||
108 | +++ b/target/arm/cpu.c | ||
109 | @@ -XXX,XX +XXX,XX @@ | ||
69 | */ | 110 | */ |
70 | #define FPSR_MASK 0xf800009f | 111 | |
71 | #define FPCR_MASK 0x07f79f00 | 112 | #include "qemu/osdep.h" |
72 | + | 113 | +#include "target/arm/idau.h" |
73 | +#define FPCR_FZ16 (1 << 19) /* ARMv8.2+, FP16 flush-to-zero */ | 114 | #include "qemu/error-report.h" |
74 | +#define FPCR_FZ (1 << 24) /* Flush-to-zero enable bit */ | 115 | #include "qapi/error.h" |
75 | +#define FPCR_DN (1 << 25) /* Default NaN enable bit */ | 116 | #include "cpu.h" |
76 | + | 117 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_post_init(Object *obj) |
77 | static inline uint32_t vfp_get_fpsr(CPUARMState *env) | 118 | } |
119 | } | ||
120 | |||
121 | + if (arm_feature(&cpu->env, ARM_FEATURE_M_SECURITY)) { | ||
122 | + object_property_add_link(obj, "idau", TYPE_IDAU_INTERFACE, &cpu->idau, | ||
123 | + qdev_prop_allow_set_link_before_realize, | ||
124 | + OBJ_PROP_LINK_UNREF_ON_RELEASE, | ||
125 | + &error_abort); | ||
126 | + } | ||
127 | + | ||
128 | qdev_property_add_static(DEVICE(obj), &arm_cpu_cfgend_property, | ||
129 | &error_abort); | ||
130 | } | ||
131 | @@ -XXX,XX +XXX,XX @@ static const TypeInfo arm_cpu_type_info = { | ||
132 | .class_init = arm_cpu_class_init, | ||
133 | }; | ||
134 | |||
135 | +static const TypeInfo idau_interface_type_info = { | ||
136 | + .name = TYPE_IDAU_INTERFACE, | ||
137 | + .parent = TYPE_INTERFACE, | ||
138 | + .class_size = sizeof(IDAUInterfaceClass), | ||
139 | +}; | ||
140 | + | ||
141 | static void arm_cpu_register_types(void) | ||
78 | { | 142 | { |
79 | return vfp_get_fpscr(env) & FPSR_MASK; | 143 | const ARMCPUInfo *info = arm_cpus; |
144 | |||
145 | type_register_static(&arm_cpu_type_info); | ||
146 | + type_register_static(&idau_interface_type_info); | ||
147 | |||
148 | while (info->name) { | ||
149 | cpu_register(info); | ||
80 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 150 | diff --git a/target/arm/helper.c b/target/arm/helper.c |
81 | index XXXXXXX..XXXXXXX 100644 | 151 | index XXXXXXX..XXXXXXX 100644 |
82 | --- a/target/arm/helper.c | 152 | --- a/target/arm/helper.c |
83 | +++ b/target/arm/helper.c | 153 | +++ b/target/arm/helper.c |
84 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(vfp_get_fpscr)(CPUARMState *env) | 154 | @@ -XXX,XX +XXX,XX @@ |
85 | | (env->vfp.vec_stride << 20); | 155 | #include "qemu/osdep.h" |
86 | i = get_float_exception_flags(&env->vfp.fp_status); | 156 | +#include "target/arm/idau.h" |
87 | i |= get_float_exception_flags(&env->vfp.standard_fp_status); | 157 | #include "trace.h" |
88 | + i |= get_float_exception_flags(&env->vfp.fp_status_f16); | 158 | #include "cpu.h" |
89 | fpscr |= vfp_exceptbits_from_host(i); | 159 | #include "internals.h" |
90 | return fpscr; | 160 | @@ -XXX,XX +XXX,XX @@ static void v8m_security_lookup(CPUARMState *env, uint32_t address, |
161 | */ | ||
162 | ARMCPU *cpu = arm_env_get_cpu(env); | ||
163 | int r; | ||
164 | + bool idau_exempt = false, idau_ns = true, idau_nsc = true; | ||
165 | + int idau_region = IREGION_NOTVALID; | ||
166 | |||
167 | - /* TODO: implement IDAU */ | ||
168 | + if (cpu->idau) { | ||
169 | + IDAUInterfaceClass *iic = IDAU_INTERFACE_GET_CLASS(cpu->idau); | ||
170 | + IDAUInterface *ii = IDAU_INTERFACE(cpu->idau); | ||
171 | + | ||
172 | + iic->check(ii, address, &idau_region, &idau_exempt, &idau_ns, | ||
173 | + &idau_nsc); | ||
174 | + } | ||
175 | |||
176 | if (access_type == MMU_INST_FETCH && extract32(address, 28, 4) == 0xf) { | ||
177 | /* 0xf0000000..0xffffffff is always S for insn fetches */ | ||
178 | return; | ||
179 | } | ||
180 | |||
181 | - if (v8m_is_sau_exempt(env, address, access_type)) { | ||
182 | + if (idau_exempt || v8m_is_sau_exempt(env, address, access_type)) { | ||
183 | sattrs->ns = !regime_is_secure(env, mmu_idx); | ||
184 | return; | ||
185 | } | ||
186 | |||
187 | + if (idau_region != IREGION_NOTVALID) { | ||
188 | + sattrs->irvalid = true; | ||
189 | + sattrs->iregion = idau_region; | ||
190 | + } | ||
191 | + | ||
192 | switch (env->sau.ctrl & 3) { | ||
193 | case 0: /* SAU.ENABLE == 0, SAU.ALLNS == 0 */ | ||
194 | break; | ||
195 | @@ -XXX,XX +XXX,XX @@ static void v8m_security_lookup(CPUARMState *env, uint32_t address, | ||
196 | } | ||
197 | } | ||
198 | |||
199 | - /* TODO when we support the IDAU then it may override the result here */ | ||
200 | + /* The IDAU will override the SAU lookup results if it specifies | ||
201 | + * higher security than the SAU does. | ||
202 | + */ | ||
203 | + if (!idau_ns) { | ||
204 | + if (sattrs->ns || (!idau_nsc && sattrs->nsc)) { | ||
205 | + sattrs->ns = false; | ||
206 | + sattrs->nsc = idau_nsc; | ||
207 | + } | ||
208 | + } | ||
209 | break; | ||
210 | } | ||
91 | } | 211 | } |
92 | @@ -XXX,XX +XXX,XX @@ void HELPER(vfp_set_fpscr)(CPUARMState *env, uint32_t val) | ||
93 | break; | ||
94 | } | ||
95 | set_float_rounding_mode(i, &env->vfp.fp_status); | ||
96 | + set_float_rounding_mode(i, &env->vfp.fp_status_f16); | ||
97 | } | ||
98 | - if (changed & (1 << 24)) { | ||
99 | - set_flush_to_zero((val & (1 << 24)) != 0, &env->vfp.fp_status); | ||
100 | - set_flush_inputs_to_zero((val & (1 << 24)) != 0, &env->vfp.fp_status); | ||
101 | + if (changed & FPCR_FZ16) { | ||
102 | + bool ftz_enabled = val & FPCR_FZ16; | ||
103 | + set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16); | ||
104 | + set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16); | ||
105 | + } | ||
106 | + if (changed & FPCR_FZ) { | ||
107 | + bool ftz_enabled = val & FPCR_FZ; | ||
108 | + set_flush_to_zero(ftz_enabled, &env->vfp.fp_status); | ||
109 | + set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status); | ||
110 | + } | ||
111 | + if (changed & FPCR_DN) { | ||
112 | + bool dnan_enabled = val & FPCR_DN; | ||
113 | + set_default_nan_mode(dnan_enabled, &env->vfp.fp_status); | ||
114 | + set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16); | ||
115 | } | ||
116 | - if (changed & (1 << 25)) | ||
117 | - set_default_nan_mode((val & (1 << 25)) != 0, &env->vfp.fp_status); | ||
118 | |||
119 | + /* The exception flags are ORed together when we read fpscr so we | ||
120 | + * only need to preserve the current state in one of our | ||
121 | + * float_status values. | ||
122 | + */ | ||
123 | i = vfp_exceptbits_to_host(val); | ||
124 | set_float_exception_flags(i, &env->vfp.fp_status); | ||
125 | + set_float_exception_flags(0, &env->vfp.fp_status_f16); | ||
126 | set_float_exception_flags(0, &env->vfp.standard_fp_status); | ||
127 | } | ||
128 | |||
129 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
130 | index XXXXXXX..XXXXXXX 100644 | ||
131 | --- a/target/arm/translate-a64.c | ||
132 | +++ b/target/arm/translate-a64.c | ||
133 | @@ -XXX,XX +XXX,XX @@ static void write_fp_sreg(DisasContext *s, int reg, TCGv_i32 v) | ||
134 | tcg_temp_free_i64(tmp); | ||
135 | } | ||
136 | |||
137 | -static TCGv_ptr get_fpstatus_ptr(void) | ||
138 | +static TCGv_ptr get_fpstatus_ptr(bool is_f16) | ||
139 | { | ||
140 | TCGv_ptr statusptr = tcg_temp_new_ptr(); | ||
141 | int offset; | ||
142 | |||
143 | - /* In A64 all instructions (both FP and Neon) use the FPCR; | ||
144 | - * there is no equivalent of the A32 Neon "standard FPSCR value" | ||
145 | - * and all operations use vfp.fp_status. | ||
146 | + /* In A64 all instructions (both FP and Neon) use the FPCR; there | ||
147 | + * is no equivalent of the A32 Neon "standard FPSCR value". | ||
148 | + * However half-precision operations operate under a different | ||
149 | + * FZ16 flag and use vfp.fp_status_f16 instead of vfp.fp_status. | ||
150 | */ | ||
151 | - offset = offsetof(CPUARMState, vfp.fp_status); | ||
152 | + if (is_f16) { | ||
153 | + offset = offsetof(CPUARMState, vfp.fp_status_f16); | ||
154 | + } else { | ||
155 | + offset = offsetof(CPUARMState, vfp.fp_status); | ||
156 | + } | ||
157 | tcg_gen_addi_ptr(statusptr, cpu_env, offset); | ||
158 | return statusptr; | ||
159 | } | ||
160 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_compare(DisasContext *s, bool is_double, | ||
161 | bool cmp_with_zero, bool signal_all_nans) | ||
162 | { | ||
163 | TCGv_i64 tcg_flags = tcg_temp_new_i64(); | ||
164 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
165 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
166 | |||
167 | if (is_double) { | ||
168 | TCGv_i64 tcg_vn, tcg_vm; | ||
169 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn) | ||
170 | TCGv_i32 tcg_op; | ||
171 | TCGv_i32 tcg_res; | ||
172 | |||
173 | - fpst = get_fpstatus_ptr(); | ||
174 | + fpst = get_fpstatus_ptr(false); | ||
175 | tcg_op = read_fp_sreg(s, rn); | ||
176 | tcg_res = tcg_temp_new_i32(); | ||
177 | |||
178 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_double(DisasContext *s, int opcode, int rd, int rn) | ||
179 | return; | ||
180 | } | ||
181 | |||
182 | - fpst = get_fpstatus_ptr(); | ||
183 | + fpst = get_fpstatus_ptr(false); | ||
184 | tcg_op = read_fp_dreg(s, rn); | ||
185 | tcg_res = tcg_temp_new_i64(); | ||
186 | |||
187 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_2src_single(DisasContext *s, int opcode, | ||
188 | TCGv_ptr fpst; | ||
189 | |||
190 | tcg_res = tcg_temp_new_i32(); | ||
191 | - fpst = get_fpstatus_ptr(); | ||
192 | + fpst = get_fpstatus_ptr(false); | ||
193 | tcg_op1 = read_fp_sreg(s, rn); | ||
194 | tcg_op2 = read_fp_sreg(s, rm); | ||
195 | |||
196 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_2src_double(DisasContext *s, int opcode, | ||
197 | TCGv_ptr fpst; | ||
198 | |||
199 | tcg_res = tcg_temp_new_i64(); | ||
200 | - fpst = get_fpstatus_ptr(); | ||
201 | + fpst = get_fpstatus_ptr(false); | ||
202 | tcg_op1 = read_fp_dreg(s, rn); | ||
203 | tcg_op2 = read_fp_dreg(s, rm); | ||
204 | |||
205 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_3src_single(DisasContext *s, bool o0, bool o1, | ||
206 | { | ||
207 | TCGv_i32 tcg_op1, tcg_op2, tcg_op3; | ||
208 | TCGv_i32 tcg_res = tcg_temp_new_i32(); | ||
209 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
210 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
211 | |||
212 | tcg_op1 = read_fp_sreg(s, rn); | ||
213 | tcg_op2 = read_fp_sreg(s, rm); | ||
214 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_3src_double(DisasContext *s, bool o0, bool o1, | ||
215 | { | ||
216 | TCGv_i64 tcg_op1, tcg_op2, tcg_op3; | ||
217 | TCGv_i64 tcg_res = tcg_temp_new_i64(); | ||
218 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
219 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
220 | |||
221 | tcg_op1 = read_fp_dreg(s, rn); | ||
222 | tcg_op2 = read_fp_dreg(s, rm); | ||
223 | @@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode, | ||
224 | TCGv_ptr tcg_fpstatus; | ||
225 | TCGv_i32 tcg_shift; | ||
226 | |||
227 | - tcg_fpstatus = get_fpstatus_ptr(); | ||
228 | + tcg_fpstatus = get_fpstatus_ptr(false); | ||
229 | |||
230 | tcg_shift = tcg_const_i32(64 - scale); | ||
231 | |||
232 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn) | ||
233 | TCGv_i32 tcg_elt1 = tcg_temp_new_i32(); | ||
234 | TCGv_i32 tcg_elt2 = tcg_temp_new_i32(); | ||
235 | TCGv_i32 tcg_elt3 = tcg_temp_new_i32(); | ||
236 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
237 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
238 | |||
239 | assert(esize == 32); | ||
240 | assert(elements == 4); | ||
241 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn) | ||
242 | } | ||
243 | |||
244 | size = extract32(size, 0, 1) ? 3 : 2; | ||
245 | - fpst = get_fpstatus_ptr(); | ||
246 | + fpst = get_fpstatus_ptr(false); | ||
247 | break; | ||
248 | default: | ||
249 | unallocated_encoding(s); | ||
250 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn, | ||
251 | int fracbits, int size) | ||
252 | { | ||
253 | bool is_double = size == 3 ? true : false; | ||
254 | - TCGv_ptr tcg_fpst = get_fpstatus_ptr(); | ||
255 | + TCGv_ptr tcg_fpst = get_fpstatus_ptr(false); | ||
256 | TCGv_i32 tcg_shift = tcg_const_i32(fracbits); | ||
257 | TCGv_i64 tcg_int = tcg_temp_new_i64(); | ||
258 | TCGMemOp mop = size | (is_signed ? MO_SIGN : 0); | ||
259 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar, | ||
260 | |||
261 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(FPROUNDING_ZERO)); | ||
262 | gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
263 | - tcg_fpstatus = get_fpstatus_ptr(); | ||
264 | + tcg_fpstatus = get_fpstatus_ptr(false); | ||
265 | tcg_shift = tcg_const_i32(fracbits); | ||
266 | |||
267 | if (is_double) { | ||
268 | @@ -XXX,XX +XXX,XX @@ static void handle_3same_float(DisasContext *s, int size, int elements, | ||
269 | int fpopcode, int rd, int rn, int rm) | ||
270 | { | ||
271 | int pass; | ||
272 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
273 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
274 | |||
275 | for (pass = 0; pass < elements; pass++) { | ||
276 | if (size) { | ||
277 | @@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode, | ||
278 | return; | ||
279 | } | ||
280 | |||
281 | - fpst = get_fpstatus_ptr(); | ||
282 | + fpst = get_fpstatus_ptr(false); | ||
283 | |||
284 | if (is_double) { | ||
285 | TCGv_i64 tcg_op = tcg_temp_new_i64(); | ||
286 | @@ -XXX,XX +XXX,XX @@ static void handle_2misc_reciprocal(DisasContext *s, int opcode, | ||
287 | int size, int rn, int rd) | ||
288 | { | ||
289 | bool is_double = (size == 3); | ||
290 | - TCGv_ptr fpst = get_fpstatus_ptr(); | ||
291 | + TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
292 | |||
293 | if (is_double) { | ||
294 | TCGv_i64 tcg_op = tcg_temp_new_i64(); | ||
295 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn) | ||
296 | if (is_fcvt) { | ||
297 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
298 | gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
299 | - tcg_fpstatus = get_fpstatus_ptr(); | ||
300 | + tcg_fpstatus = get_fpstatus_ptr(false); | ||
301 | } else { | ||
302 | tcg_rmode = NULL; | ||
303 | tcg_fpstatus = NULL; | ||
304 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_3same_pair(DisasContext *s, int is_q, int u, int opcode, | ||
305 | |||
306 | /* Floating point operations need fpst */ | ||
307 | if (opcode >= 0x58) { | ||
308 | - fpst = get_fpstatus_ptr(); | ||
309 | + fpst = get_fpstatus_ptr(false); | ||
310 | } else { | ||
311 | fpst = NULL; | ||
312 | } | ||
313 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn) | ||
314 | } | ||
315 | |||
316 | if (need_fpstatus) { | ||
317 | - tcg_fpstatus = get_fpstatus_ptr(); | ||
318 | + tcg_fpstatus = get_fpstatus_ptr(false); | ||
319 | } else { | ||
320 | tcg_fpstatus = NULL; | ||
321 | } | ||
322 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
323 | } | ||
324 | |||
325 | if (is_fp) { | ||
326 | - fpst = get_fpstatus_ptr(); | ||
327 | + fpst = get_fpstatus_ptr(false); | ||
328 | } else { | ||
329 | fpst = NULL; | ||
330 | } | ||
331 | -- | 212 | -- |
332 | 2.16.2 | 213 | 2.16.2 |
333 | 214 | ||
334 | 215 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Create an "idau" property on the armv7m container object which |
---|---|---|---|
2 | we can forward to the CPU object. Annoyingly, we can't use | ||
3 | object_property_add_alias() because the CPU object we want to | ||
4 | forward to doesn't exist until the armv7m container is realized. | ||
2 | 5 | ||
3 | We do implement all the opcodes. | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180220180325.29818-6-peter.maydell@linaro.org | ||
9 | --- | ||
10 | include/hw/arm/armv7m.h | 3 +++ | ||
11 | hw/arm/armv7m.c | 9 +++++++++ | ||
12 | 2 files changed, 12 insertions(+) | ||
4 | 13 | ||
5 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 14 | diff --git a/include/hw/arm/armv7m.h b/include/hw/arm/armv7m.h |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20180227143852.11175-8-alex.bennee@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | --- | ||
10 | target/arm/translate-a64.c | 3 +-- | ||
11 | 1 file changed, 1 insertion(+), 2 deletions(-) | ||
12 | |||
13 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
14 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/translate-a64.c | 16 | --- a/include/hw/arm/armv7m.h |
16 | +++ b/target/arm/translate-a64.c | 17 | +++ b/include/hw/arm/armv7m.h |
17 | @@ -XXX,XX +XXX,XX @@ static void handle_3same_64(DisasContext *s, int opcode, bool u, | 18 | @@ -XXX,XX +XXX,XX @@ |
18 | /* Handle 64x64->64 opcodes which are shared between the scalar | 19 | |
19 | * and vector 3-same groups. We cover every opcode where size == 3 | 20 | #include "hw/sysbus.h" |
20 | * is valid in either the three-reg-same (integer, not pairwise) | 21 | #include "hw/intc/armv7m_nvic.h" |
21 | - * or scalar-three-reg-same groups. (Some opcodes are not yet | 22 | +#include "target/arm/idau.h" |
22 | - * implemented.) | 23 | |
23 | + * or scalar-three-reg-same groups. | 24 | #define TYPE_BITBAND "ARM,bitband-memory" |
24 | */ | 25 | #define BITBAND(obj) OBJECT_CHECK(BitBandState, (obj), TYPE_BITBAND) |
25 | TCGCond cond; | 26 | @@ -XXX,XX +XXX,XX @@ typedef struct { |
27 | * + Property "memory": MemoryRegion defining the physical address space | ||
28 | * that CPU accesses see. (The NVIC, bitbanding and other CPU-internal | ||
29 | * devices will be automatically layered on top of this view.) | ||
30 | + * + Property "idau": IDAU interface (forwarded to CPU object) | ||
31 | */ | ||
32 | typedef struct ARMv7MState { | ||
33 | /*< private >*/ | ||
34 | @@ -XXX,XX +XXX,XX @@ typedef struct ARMv7MState { | ||
35 | char *cpu_type; | ||
36 | /* MemoryRegion the board provides to us (with its devices, RAM, etc) */ | ||
37 | MemoryRegion *board_memory; | ||
38 | + Object *idau; | ||
39 | } ARMv7MState; | ||
40 | |||
41 | #endif | ||
42 | diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c | ||
43 | index XXXXXXX..XXXXXXX 100644 | ||
44 | --- a/hw/arm/armv7m.c | ||
45 | +++ b/hw/arm/armv7m.c | ||
46 | @@ -XXX,XX +XXX,XX @@ | ||
47 | #include "sysemu/qtest.h" | ||
48 | #include "qemu/error-report.h" | ||
49 | #include "exec/address-spaces.h" | ||
50 | +#include "target/arm/idau.h" | ||
51 | |||
52 | /* Bitbanded IO. Each word corresponds to a single bit. */ | ||
53 | |||
54 | @@ -XXX,XX +XXX,XX @@ static void armv7m_realize(DeviceState *dev, Error **errp) | ||
55 | |||
56 | object_property_set_link(OBJECT(s->cpu), OBJECT(&s->container), "memory", | ||
57 | &error_abort); | ||
58 | + if (object_property_find(OBJECT(s->cpu), "idau", NULL)) { | ||
59 | + object_property_set_link(OBJECT(s->cpu), s->idau, "idau", &err); | ||
60 | + if (err != NULL) { | ||
61 | + error_propagate(errp, err); | ||
62 | + return; | ||
63 | + } | ||
64 | + } | ||
65 | object_property_set_bool(OBJECT(s->cpu), true, "realized", &err); | ||
66 | if (err != NULL) { | ||
67 | error_propagate(errp, err); | ||
68 | @@ -XXX,XX +XXX,XX @@ static Property armv7m_properties[] = { | ||
69 | DEFINE_PROP_STRING("cpu-type", ARMv7MState, cpu_type), | ||
70 | DEFINE_PROP_LINK("memory", ARMv7MState, board_memory, TYPE_MEMORY_REGION, | ||
71 | MemoryRegion *), | ||
72 | + DEFINE_PROP_LINK("idau", ARMv7MState, idau, TYPE_IDAU_INTERFACE, Object *), | ||
73 | DEFINE_PROP_END_OF_LIST(), | ||
74 | }; | ||
26 | 75 | ||
27 | -- | 76 | -- |
28 | 2.16.2 | 77 | 2.16.2 |
29 | 78 | ||
30 | 79 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | The Cortex-M33 allows the system to specify the reset value of the |
---|---|---|---|
2 | secure Vector Table Offset Register (VTOR) by asserting config | ||
3 | signals. In particular, guest images for the MPS2 AN505 board rely | ||
4 | on the MPS2's initial VTOR being correct for that board. | ||
5 | Implement a QEMU property so board and SoC code can set the reset | ||
6 | value to the correct value. | ||
2 | 7 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20180227143852.11175-4-alex.bennee@linaro.org | 10 | Message-id: 20180220180325.29818-7-peter.maydell@linaro.org |
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | --- | 11 | --- |
8 | target/arm/cpu.h | 1 + | 12 | target/arm/cpu.h | 3 +++ |
9 | 1 file changed, 1 insertion(+) | 13 | target/arm/cpu.c | 18 ++++++++++++++---- |
14 | 2 files changed, 17 insertions(+), 4 deletions(-) | ||
10 | 15 | ||
11 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | 16 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
12 | index XXXXXXX..XXXXXXX 100644 | 17 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/target/arm/cpu.h | 18 | --- a/target/arm/cpu.h |
14 | +++ b/target/arm/cpu.h | 19 | +++ b/target/arm/cpu.h |
15 | @@ -XXX,XX +XXX,XX @@ typedef struct { | 20 | @@ -XXX,XX +XXX,XX @@ struct ARMCPU { |
16 | * Qn = regs[n].d[1]:regs[n].d[0] | 21 | */ |
17 | * Dn = regs[n].d[0] | 22 | uint32_t psci_conduit; |
18 | * Sn = regs[n].d[0] bits 31..0 | 23 | |
19 | + * Hn = regs[n].d[0] bits 15..0 | 24 | + /* For v8M, initial value of the Secure VTOR */ |
20 | * | 25 | + uint32_t init_svtor; |
21 | * This corresponds to the architecturally defined mapping between | 26 | + |
22 | * the two execution states, and means we do not need to explicitly | 27 | /* [QEMU_]KVM_ARM_TARGET_* constant for this CPU, or |
28 | * QEMU_KVM_ARM_TARGET_NONE if the kernel doesn't support this CPU type. | ||
29 | */ | ||
30 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | ||
31 | index XXXXXXX..XXXXXXX 100644 | ||
32 | --- a/target/arm/cpu.c | ||
33 | +++ b/target/arm/cpu.c | ||
34 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s) | ||
35 | uint32_t initial_msp; /* Loaded from 0x0 */ | ||
36 | uint32_t initial_pc; /* Loaded from 0x4 */ | ||
37 | uint8_t *rom; | ||
38 | + uint32_t vecbase; | ||
39 | |||
40 | if (arm_feature(env, ARM_FEATURE_M_SECURITY)) { | ||
41 | env->v7m.secure = true; | ||
42 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s) | ||
43 | /* Unlike A/R profile, M profile defines the reset LR value */ | ||
44 | env->regs[14] = 0xffffffff; | ||
45 | |||
46 | - /* Load the initial SP and PC from the vector table at address 0 */ | ||
47 | - rom = rom_ptr(0); | ||
48 | + env->v7m.vecbase[M_REG_S] = cpu->init_svtor & 0xffffff80; | ||
49 | + | ||
50 | + /* Load the initial SP and PC from offset 0 and 4 in the vector table */ | ||
51 | + vecbase = env->v7m.vecbase[env->v7m.secure]; | ||
52 | + rom = rom_ptr(vecbase); | ||
53 | if (rom) { | ||
54 | /* Address zero is covered by ROM which hasn't yet been | ||
55 | * copied into physical memory. | ||
56 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s) | ||
57 | * it got copied into memory. In the latter case, rom_ptr | ||
58 | * will return a NULL pointer and we should use ldl_phys instead. | ||
59 | */ | ||
60 | - initial_msp = ldl_phys(s->as, 0); | ||
61 | - initial_pc = ldl_phys(s->as, 4); | ||
62 | + initial_msp = ldl_phys(s->as, vecbase); | ||
63 | + initial_pc = ldl_phys(s->as, vecbase + 4); | ||
64 | } | ||
65 | |||
66 | env->regs[13] = initial_msp & 0xFFFFFFFC; | ||
67 | @@ -XXX,XX +XXX,XX @@ static Property arm_cpu_pmsav7_dregion_property = | ||
68 | pmsav7_dregion, | ||
69 | qdev_prop_uint32, uint32_t); | ||
70 | |||
71 | +/* M profile: initial value of the Secure VTOR */ | ||
72 | +static Property arm_cpu_initsvtor_property = | ||
73 | + DEFINE_PROP_UINT32("init-svtor", ARMCPU, init_svtor, 0); | ||
74 | + | ||
75 | static void arm_cpu_post_init(Object *obj) | ||
76 | { | ||
77 | ARMCPU *cpu = ARM_CPU(obj); | ||
78 | @@ -XXX,XX +XXX,XX @@ static void arm_cpu_post_init(Object *obj) | ||
79 | qdev_prop_allow_set_link_before_realize, | ||
80 | OBJ_PROP_LINK_UNREF_ON_RELEASE, | ||
81 | &error_abort); | ||
82 | + qdev_property_add_static(DEVICE(obj), &arm_cpu_initsvtor_property, | ||
83 | + &error_abort); | ||
84 | } | ||
85 | |||
86 | qdev_property_add_static(DEVICE(obj), &arm_cpu_cfgend_property, | ||
23 | -- | 87 | -- |
24 | 2.16.2 | 88 | 2.16.2 |
25 | 89 | ||
26 | 90 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Create an "init-svtor" property on the armv7m container |
---|---|---|---|
2 | object which we can forward to the CPU object. | ||
2 | 3 | ||
3 | I only needed to do a little light re-factoring to support the | 4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | half-precision helpers. | 5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
6 | Message-id: 20180220180325.29818-8-peter.maydell@linaro.org | ||
7 | --- | ||
8 | include/hw/arm/armv7m.h | 2 ++ | ||
9 | hw/arm/armv7m.c | 9 +++++++++ | ||
10 | 2 files changed, 11 insertions(+) | ||
5 | 11 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 12 | diff --git a/include/hw/arm/armv7m.h b/include/hw/arm/armv7m.h |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180227143852.11175-30-alex.bennee@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/translate-a64.c | 80 +++++++++++++++++++++++++++++++--------------- | ||
12 | 1 file changed, 54 insertions(+), 26 deletions(-) | ||
13 | |||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 14 | --- a/include/hw/arm/armv7m.h |
17 | +++ b/target/arm/translate-a64.c | 15 | +++ b/include/hw/arm/armv7m.h |
18 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn) | 16 | @@ -XXX,XX +XXX,XX @@ typedef struct { |
19 | case 0xf: /* FMAXP */ | 17 | * that CPU accesses see. (The NVIC, bitbanding and other CPU-internal |
20 | case 0x2c: /* FMINNMP */ | 18 | * devices will be automatically layered on top of this view.) |
21 | case 0x2f: /* FMINP */ | 19 | * + Property "idau": IDAU interface (forwarded to CPU object) |
22 | - /* FP op, size[0] is 32 or 64 bit */ | 20 | + * + Property "init-svtor": secure VTOR reset value (forwarded to CPU object) |
23 | + /* FP op, size[0] is 32 or 64 bit*/ | 21 | */ |
24 | if (!u) { | 22 | typedef struct ARMv7MState { |
25 | - unallocated_encoding(s); | 23 | /*< private >*/ |
26 | - return; | 24 | @@ -XXX,XX +XXX,XX @@ typedef struct ARMv7MState { |
27 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 25 | /* MemoryRegion the board provides to us (with its devices, RAM, etc) */ |
28 | + unallocated_encoding(s); | 26 | MemoryRegion *board_memory; |
29 | + return; | 27 | Object *idau; |
30 | + } else { | 28 | + uint32_t init_svtor; |
31 | + size = MO_16; | 29 | } ARMv7MState; |
32 | + } | 30 | |
33 | + } else { | 31 | #endif |
34 | + size = extract32(size, 0, 1) ? MO_64 : MO_32; | 32 | diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c |
35 | } | 33 | index XXXXXXX..XXXXXXX 100644 |
36 | + | 34 | --- a/hw/arm/armv7m.c |
37 | if (!fp_access_check(s)) { | 35 | +++ b/hw/arm/armv7m.c |
36 | @@ -XXX,XX +XXX,XX @@ static void armv7m_realize(DeviceState *dev, Error **errp) | ||
38 | return; | 37 | return; |
39 | } | 38 | } |
40 | |||
41 | - size = extract32(size, 0, 1) ? 3 : 2; | ||
42 | - fpst = get_fpstatus_ptr(false); | ||
43 | + fpst = get_fpstatus_ptr(size == MO_16); | ||
44 | break; | ||
45 | default: | ||
46 | unallocated_encoding(s); | ||
47 | return; | ||
48 | } | 39 | } |
49 | 40 | + if (object_property_find(OBJECT(s->cpu), "init-svtor", NULL)) { | |
50 | - if (size == 3) { | 41 | + object_property_set_uint(OBJECT(s->cpu), s->init_svtor, |
51 | + if (size == MO_64) { | 42 | + "init-svtor", &err); |
52 | TCGv_i64 tcg_op1 = tcg_temp_new_i64(); | 43 | + if (err != NULL) { |
53 | TCGv_i64 tcg_op2 = tcg_temp_new_i64(); | 44 | + error_propagate(errp, err); |
54 | TCGv_i64 tcg_res = tcg_temp_new_i64(); | 45 | + return; |
55 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn) | 46 | + } |
56 | TCGv_i32 tcg_op2 = tcg_temp_new_i32(); | 47 | + } |
57 | TCGv_i32 tcg_res = tcg_temp_new_i32(); | 48 | object_property_set_bool(OBJECT(s->cpu), true, "realized", &err); |
58 | 49 | if (err != NULL) { | |
59 | - read_vec_element_i32(s, tcg_op1, rn, 0, MO_32); | 50 | error_propagate(errp, err); |
60 | - read_vec_element_i32(s, tcg_op2, rn, 1, MO_32); | 51 | @@ -XXX,XX +XXX,XX @@ static Property armv7m_properties[] = { |
61 | + read_vec_element_i32(s, tcg_op1, rn, 0, size); | 52 | DEFINE_PROP_LINK("memory", ARMv7MState, board_memory, TYPE_MEMORY_REGION, |
62 | + read_vec_element_i32(s, tcg_op2, rn, 1, size); | 53 | MemoryRegion *), |
63 | 54 | DEFINE_PROP_LINK("idau", ARMv7MState, idau, TYPE_IDAU_INTERFACE, Object *), | |
64 | - switch (opcode) { | 55 | + DEFINE_PROP_UINT32("init-svtor", ARMv7MState, init_svtor, 0), |
65 | - case 0xc: /* FMAXNMP */ | 56 | DEFINE_PROP_END_OF_LIST(), |
66 | - gen_helper_vfp_maxnums(tcg_res, tcg_op1, tcg_op2, fpst); | 57 | }; |
67 | - break; | 58 | |
68 | - case 0xd: /* FADDP */ | ||
69 | - gen_helper_vfp_adds(tcg_res, tcg_op1, tcg_op2, fpst); | ||
70 | - break; | ||
71 | - case 0xf: /* FMAXP */ | ||
72 | - gen_helper_vfp_maxs(tcg_res, tcg_op1, tcg_op2, fpst); | ||
73 | - break; | ||
74 | - case 0x2c: /* FMINNMP */ | ||
75 | - gen_helper_vfp_minnums(tcg_res, tcg_op1, tcg_op2, fpst); | ||
76 | - break; | ||
77 | - case 0x2f: /* FMINP */ | ||
78 | - gen_helper_vfp_mins(tcg_res, tcg_op1, tcg_op2, fpst); | ||
79 | - break; | ||
80 | - default: | ||
81 | - g_assert_not_reached(); | ||
82 | + if (size == MO_16) { | ||
83 | + switch (opcode) { | ||
84 | + case 0xc: /* FMAXNMP */ | ||
85 | + gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
86 | + break; | ||
87 | + case 0xd: /* FADDP */ | ||
88 | + gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
89 | + break; | ||
90 | + case 0xf: /* FMAXP */ | ||
91 | + gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
92 | + break; | ||
93 | + case 0x2c: /* FMINNMP */ | ||
94 | + gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
95 | + break; | ||
96 | + case 0x2f: /* FMINP */ | ||
97 | + gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
98 | + break; | ||
99 | + default: | ||
100 | + g_assert_not_reached(); | ||
101 | + } | ||
102 | + } else { | ||
103 | + switch (opcode) { | ||
104 | + case 0xc: /* FMAXNMP */ | ||
105 | + gen_helper_vfp_maxnums(tcg_res, tcg_op1, tcg_op2, fpst); | ||
106 | + break; | ||
107 | + case 0xd: /* FADDP */ | ||
108 | + gen_helper_vfp_adds(tcg_res, tcg_op1, tcg_op2, fpst); | ||
109 | + break; | ||
110 | + case 0xf: /* FMAXP */ | ||
111 | + gen_helper_vfp_maxs(tcg_res, tcg_op1, tcg_op2, fpst); | ||
112 | + break; | ||
113 | + case 0x2c: /* FMINNMP */ | ||
114 | + gen_helper_vfp_minnums(tcg_res, tcg_op1, tcg_op2, fpst); | ||
115 | + break; | ||
116 | + case 0x2f: /* FMINP */ | ||
117 | + gen_helper_vfp_mins(tcg_res, tcg_op1, tcg_op2, fpst); | ||
118 | + break; | ||
119 | + default: | ||
120 | + g_assert_not_reached(); | ||
121 | + } | ||
122 | } | ||
123 | |||
124 | write_fp_sreg(s, rd, tcg_res); | ||
125 | -- | 59 | -- |
126 | 2.16.2 | 60 | 2.16.2 |
127 | 61 | ||
128 | 62 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Add a Cortex-M33 definition. The M33 is an M profile CPU |
---|---|---|---|
2 | which implements the ARM v8M architecture, including the | ||
3 | M profile Security Extension. | ||
2 | 4 | ||
3 | This includes FMOV, FABS, FNEG, FSQRT and FRINT[NPMZAXI]. We re-use | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | existing helpers to achieve this. | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
7 | Message-id: 20180220180325.29818-9-peter.maydell@linaro.org | ||
8 | --- | ||
9 | target/arm/cpu.c | 31 +++++++++++++++++++++++++++++++ | ||
10 | 1 file changed, 31 insertions(+) | ||
5 | 11 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 12 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180227143852.11175-32-alex.bennee@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/translate-a64.c | 71 ++++++++++++++++++++++++++++++++++++++++++++++ | ||
12 | 1 file changed, 71 insertions(+) | ||
13 | |||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 14 | --- a/target/arm/cpu.c |
17 | +++ b/target/arm/translate-a64.c | 15 | +++ b/target/arm/cpu.c |
18 | @@ -XXX,XX +XXX,XX @@ static void disas_fp_csel(DisasContext *s, uint32_t insn) | 16 | @@ -XXX,XX +XXX,XX @@ static void cortex_m4_initfn(Object *obj) |
19 | tcg_temp_free_i64(t_true); | 17 | cpu->id_isar5 = 0x00000000; |
20 | } | 18 | } |
21 | 19 | ||
22 | +/* Floating-point data-processing (1 source) - half precision */ | 20 | +static void cortex_m33_initfn(Object *obj) |
23 | +static void handle_fp_1src_half(DisasContext *s, int opcode, int rd, int rn) | ||
24 | +{ | 21 | +{ |
25 | + TCGv_ptr fpst = NULL; | 22 | + ARMCPU *cpu = ARM_CPU(obj); |
26 | + TCGv_i32 tcg_op = tcg_temp_new_i32(); | ||
27 | + TCGv_i32 tcg_res = tcg_temp_new_i32(); | ||
28 | + | 23 | + |
29 | + read_vec_element_i32(s, tcg_op, rn, 0, MO_16); | 24 | + set_feature(&cpu->env, ARM_FEATURE_V8); |
30 | + | 25 | + set_feature(&cpu->env, ARM_FEATURE_M); |
31 | + switch (opcode) { | 26 | + set_feature(&cpu->env, ARM_FEATURE_M_SECURITY); |
32 | + case 0x0: /* FMOV */ | 27 | + set_feature(&cpu->env, ARM_FEATURE_THUMB_DSP); |
33 | + tcg_gen_mov_i32(tcg_res, tcg_op); | 28 | + cpu->midr = 0x410fd213; /* r0p3 */ |
34 | + break; | 29 | + cpu->pmsav7_dregion = 16; |
35 | + case 0x1: /* FABS */ | 30 | + cpu->sau_sregion = 8; |
36 | + tcg_gen_andi_i32(tcg_res, tcg_op, 0x7fff); | 31 | + cpu->id_pfr0 = 0x00000030; |
37 | + break; | 32 | + cpu->id_pfr1 = 0x00000210; |
38 | + case 0x2: /* FNEG */ | 33 | + cpu->id_dfr0 = 0x00200000; |
39 | + tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | 34 | + cpu->id_afr0 = 0x00000000; |
40 | + break; | 35 | + cpu->id_mmfr0 = 0x00101F40; |
41 | + case 0x3: /* FSQRT */ | 36 | + cpu->id_mmfr1 = 0x00000000; |
42 | + gen_helper_sqrt_f16(tcg_res, tcg_op, cpu_env); | 37 | + cpu->id_mmfr2 = 0x01000000; |
43 | + break; | 38 | + cpu->id_mmfr3 = 0x00000000; |
44 | + case 0x8: /* FRINTN */ | 39 | + cpu->id_isar0 = 0x01101110; |
45 | + case 0x9: /* FRINTP */ | 40 | + cpu->id_isar1 = 0x02212000; |
46 | + case 0xa: /* FRINTM */ | 41 | + cpu->id_isar2 = 0x20232232; |
47 | + case 0xb: /* FRINTZ */ | 42 | + cpu->id_isar3 = 0x01111131; |
48 | + case 0xc: /* FRINTA */ | 43 | + cpu->id_isar4 = 0x01310132; |
49 | + { | 44 | + cpu->id_isar5 = 0x00000000; |
50 | + TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7)); | 45 | + cpu->clidr = 0x00000000; |
51 | + fpst = get_fpstatus_ptr(true); | 46 | + cpu->ctr = 0x8000c000; |
52 | + | ||
53 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
54 | + gen_helper_advsimd_rinth(tcg_res, tcg_op, fpst); | ||
55 | + | ||
56 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
57 | + tcg_temp_free_i32(tcg_rmode); | ||
58 | + break; | ||
59 | + } | ||
60 | + case 0xe: /* FRINTX */ | ||
61 | + fpst = get_fpstatus_ptr(true); | ||
62 | + gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, fpst); | ||
63 | + break; | ||
64 | + case 0xf: /* FRINTI */ | ||
65 | + fpst = get_fpstatus_ptr(true); | ||
66 | + gen_helper_advsimd_rinth(tcg_res, tcg_op, fpst); | ||
67 | + break; | ||
68 | + default: | ||
69 | + abort(); | ||
70 | + } | ||
71 | + | ||
72 | + write_fp_sreg(s, rd, tcg_res); | ||
73 | + | ||
74 | + if (fpst) { | ||
75 | + tcg_temp_free_ptr(fpst); | ||
76 | + } | ||
77 | + tcg_temp_free_i32(tcg_op); | ||
78 | + tcg_temp_free_i32(tcg_res); | ||
79 | +} | 47 | +} |
80 | + | 48 | + |
81 | /* Floating-point data-processing (1 source) - single precision */ | 49 | static void arm_v7m_class_init(ObjectClass *oc, void *data) |
82 | static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn) | ||
83 | { | 50 | { |
84 | @@ -XXX,XX +XXX,XX @@ static void disas_fp_1src(DisasContext *s, uint32_t insn) | 51 | CPUClass *cc = CPU_CLASS(oc); |
85 | 52 | @@ -XXX,XX +XXX,XX @@ static const ARMCPUInfo arm_cpus[] = { | |
86 | handle_fp_1src_double(s, opcode, rd, rn); | 53 | .class_init = arm_v7m_class_init }, |
87 | break; | 54 | { .name = "cortex-m4", .initfn = cortex_m4_initfn, |
88 | + case 3: | 55 | .class_init = arm_v7m_class_init }, |
89 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 56 | + { .name = "cortex-m33", .initfn = cortex_m33_initfn, |
90 | + unallocated_encoding(s); | 57 | + .class_init = arm_v7m_class_init }, |
91 | + return; | 58 | { .name = "cortex-r5", .initfn = cortex_r5_initfn }, |
92 | + } | 59 | { .name = "cortex-a7", .initfn = cortex_a7_initfn }, |
93 | + | 60 | { .name = "cortex-a8", .initfn = cortex_a8_initfn }, |
94 | + if (!fp_access_check(s)) { | ||
95 | + return; | ||
96 | + } | ||
97 | + | ||
98 | + handle_fp_1src_half(s, opcode, rd, rn); | ||
99 | + break; | ||
100 | default: | ||
101 | unallocated_encoding(s); | ||
102 | } | ||
103 | -- | 61 | -- |
104 | 2.16.2 | 62 | 2.16.2 |
105 | 63 | ||
106 | 64 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Move the definition of the struct for the unimplemented-device |
---|---|---|---|
2 | from unimp.c to unimp.h, so that users can embed the struct | ||
3 | in their own device structs if they prefer. | ||
2 | 4 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20180227143852.11175-28-alex.bennee@linaro.org | 8 | Message-id: 20180220180325.29818-10-peter.maydell@linaro.org |
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | --- | 9 | --- |
8 | target/arm/translate-a64.c | 7 +++++++ | 10 | include/hw/misc/unimp.h | 10 ++++++++++ |
9 | 1 file changed, 7 insertions(+) | 11 | hw/misc/unimp.c | 10 ---------- |
12 | 2 files changed, 10 insertions(+), 10 deletions(-) | ||
10 | 13 | ||
11 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 14 | diff --git a/include/hw/misc/unimp.h b/include/hw/misc/unimp.h |
12 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/target/arm/translate-a64.c | 16 | --- a/include/hw/misc/unimp.h |
14 | +++ b/target/arm/translate-a64.c | 17 | +++ b/include/hw/misc/unimp.h |
15 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 18 | @@ -XXX,XX +XXX,XX @@ |
16 | case 0x6f: /* FNEG */ | 19 | |
17 | need_fpst = false; | 20 | #define TYPE_UNIMPLEMENTED_DEVICE "unimplemented-device" |
18 | break; | 21 | |
19 | + case 0x7d: /* FRSQRTE */ | 22 | +#define UNIMPLEMENTED_DEVICE(obj) \ |
20 | case 0x7f: /* FSQRT (vector) */ | 23 | + OBJECT_CHECK(UnimplementedDeviceState, (obj), TYPE_UNIMPLEMENTED_DEVICE) |
21 | break; | 24 | + |
22 | default: | 25 | +typedef struct { |
23 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 26 | + SysBusDevice parent_obj; |
24 | case 0x6f: /* FNEG */ | 27 | + MemoryRegion iomem; |
25 | tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | 28 | + char *name; |
26 | break; | 29 | + uint64_t size; |
27 | + case 0x7d: /* FRSQRTE */ | 30 | +} UnimplementedDeviceState; |
28 | + gen_helper_rsqrte_f16(tcg_res, tcg_op, tcg_fpstatus); | 31 | + |
29 | + break; | 32 | /** |
30 | default: | 33 | * create_unimplemented_device: create and map a dummy device |
31 | g_assert_not_reached(); | 34 | * @name: name of the device for debug logging |
32 | } | 35 | diff --git a/hw/misc/unimp.c b/hw/misc/unimp.c |
33 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 36 | index XXXXXXX..XXXXXXX 100644 |
34 | case 0x6f: /* FNEG */ | 37 | --- a/hw/misc/unimp.c |
35 | tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | 38 | +++ b/hw/misc/unimp.c |
36 | break; | 39 | @@ -XXX,XX +XXX,XX @@ |
37 | + case 0x7d: /* FRSQRTE */ | 40 | #include "qemu/log.h" |
38 | + gen_helper_rsqrte_f16(tcg_res, tcg_op, tcg_fpstatus); | 41 | #include "qapi/error.h" |
39 | + break; | 42 | |
40 | case 0x7f: /* FSQRT */ | 43 | -#define UNIMPLEMENTED_DEVICE(obj) \ |
41 | gen_helper_sqrt_f16(tcg_res, tcg_op, tcg_fpstatus); | 44 | - OBJECT_CHECK(UnimplementedDeviceState, (obj), TYPE_UNIMPLEMENTED_DEVICE) |
42 | break; | 45 | - |
46 | -typedef struct { | ||
47 | - SysBusDevice parent_obj; | ||
48 | - MemoryRegion iomem; | ||
49 | - char *name; | ||
50 | - uint64_t size; | ||
51 | -} UnimplementedDeviceState; | ||
52 | - | ||
53 | static uint64_t unimp_read(void *opaque, hwaddr offset, unsigned size) | ||
54 | { | ||
55 | UnimplementedDeviceState *s = UNIMPLEMENTED_DEVICE(opaque); | ||
43 | -- | 56 | -- |
44 | 2.16.2 | 57 | 2.16.2 |
45 | 58 | ||
46 | 59 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | The or-irq.h header file is missing the customary guard against |
---|---|---|---|
2 | multiple inclusion, which means compilation fails if it gets | ||
3 | included twice. Fix the omission. | ||
2 | 4 | ||
3 | Now we have added f16 during the re-factoring we can simply call the | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | helper. | 6 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180220180325.29818-11-peter.maydell@linaro.org | ||
9 | --- | ||
10 | include/hw/or-irq.h | 5 +++++ | ||
11 | 1 file changed, 5 insertions(+) | ||
5 | 12 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 13 | diff --git a/include/hw/or-irq.h b/include/hw/or-irq.h |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
8 | Message-id: 20180227143852.11175-24-alex.bennee@linaro.org | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | ||
11 | target/arm/translate-a64.c | 8 ++++++++ | ||
12 | 1 file changed, 8 insertions(+) | ||
13 | |||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 15 | --- a/include/hw/or-irq.h |
17 | +++ b/target/arm/translate-a64.c | 16 | +++ b/include/hw/or-irq.h |
18 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 17 | @@ -XXX,XX +XXX,XX @@ |
19 | case 0x6d: /* FCMLE (zero) */ | 18 | * THE SOFTWARE. |
20 | handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd); | 19 | */ |
21 | return; | 20 | |
22 | + case 0x3d: /* FRECPE */ | 21 | +#ifndef HW_OR_IRQ_H |
23 | + break; | 22 | +#define HW_OR_IRQ_H |
24 | case 0x18: /* FRINTN */ | 23 | + |
25 | need_rmode = true; | 24 | #include "hw/irq.h" |
26 | only_in_vector = true; | 25 | #include "hw/sysbus.h" |
27 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 26 | #include "qom/object.h" |
28 | case 0x3b: /* FCVTZS */ | 27 | @@ -XXX,XX +XXX,XX @@ struct OrIRQState { |
29 | gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus); | 28 | bool levels[MAX_OR_LINES]; |
30 | break; | 29 | uint16_t num_lines; |
31 | + case 0x3d: /* FRECPE */ | 30 | }; |
32 | + gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus); | 31 | + |
33 | + break; | 32 | +#endif |
34 | case 0x5a: /* FCVTNU */ | ||
35 | case 0x5b: /* FCVTMU */ | ||
36 | case 0x5c: /* FCVTAU */ | ||
37 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | ||
38 | case 0x3b: /* FCVTZS */ | ||
39 | gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus); | ||
40 | break; | ||
41 | + case 0x3d: /* FRECPE */ | ||
42 | + gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus); | ||
43 | + break; | ||
44 | case 0x5a: /* FCVTNU */ | ||
45 | case 0x5b: /* FCVTMU */ | ||
46 | case 0x5c: /* FCVTAU */ | ||
47 | -- | 33 | -- |
48 | 2.16.2 | 34 | 2.16.2 |
49 | 35 | ||
50 | 36 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | The function qdev_init_gpio_in_named() passes the DeviceState pointer |
---|---|---|---|
2 | as the opaque data pointor for the irq handler function. Usually | ||
3 | this is what you want, but in some cases it would be helpful to use | ||
4 | some other data pointer. | ||
2 | 5 | ||
3 | The fprintf is only there for debugging as the skeleton is added to, | 6 | Add a new function qdev_init_gpio_in_named_with_opaque() which allows |
4 | it will be removed once the skeleton is complete. | 7 | the caller to specify the data pointer they want. |
5 | 8 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20180227143852.11175-10-alex.bennee@linaro.org | 12 | Message-id: 20180220180325.29818-12-peter.maydell@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | 13 | --- |
11 | target/arm/helper-a64.h | 4 ++++ | 14 | include/hw/qdev-core.h | 30 ++++++++++++++++++++++++++++-- |
12 | target/arm/helper-a64.c | 4 ++++ | 15 | hw/core/qdev.c | 8 +++++--- |
13 | target/arm/translate-a64.c | 28 ++++++++++++++++++++++++++++ | 16 | 2 files changed, 33 insertions(+), 5 deletions(-) |
14 | 3 files changed, 36 insertions(+) | ||
15 | 17 | ||
16 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 18 | diff --git a/include/hw/qdev-core.h b/include/hw/qdev-core.h |
17 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-a64.h | 20 | --- a/include/hw/qdev-core.h |
19 | +++ b/target/arm/helper-a64.h | 21 | +++ b/include/hw/qdev-core.h |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(advsimd_maxh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 22 | @@ -XXX,XX +XXX,XX @@ BusState *qdev_get_child_bus(DeviceState *dev, const char *name); |
21 | DEF_HELPER_FLAGS_3(advsimd_minh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 23 | /* GPIO inputs also double as IRQ sinks. */ |
22 | DEF_HELPER_FLAGS_3(advsimd_maxnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 24 | void qdev_init_gpio_in(DeviceState *dev, qemu_irq_handler handler, int n); |
23 | DEF_HELPER_FLAGS_3(advsimd_minnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 25 | void qdev_init_gpio_out(DeviceState *dev, qemu_irq *pins, int n); |
24 | +DEF_HELPER_3(advsimd_addh, f16, f16, f16, ptr) | 26 | -void qdev_init_gpio_in_named(DeviceState *dev, qemu_irq_handler handler, |
25 | +DEF_HELPER_3(advsimd_subh, f16, f16, f16, ptr) | 27 | - const char *name, int n); |
26 | +DEF_HELPER_3(advsimd_mulh, f16, f16, f16, ptr) | 28 | void qdev_init_gpio_out_named(DeviceState *dev, qemu_irq *pins, |
27 | +DEF_HELPER_3(advsimd_divh, f16, f16, f16, ptr) | 29 | const char *name, int n); |
28 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 30 | +/** |
31 | + * qdev_init_gpio_in_named_with_opaque: create an array of input GPIO lines | ||
32 | + * for the specified device | ||
33 | + * | ||
34 | + * @dev: Device to create input GPIOs for | ||
35 | + * @handler: Function to call when GPIO line value is set | ||
36 | + * @opaque: Opaque data pointer to pass to @handler | ||
37 | + * @name: Name of the GPIO input (must be unique for this device) | ||
38 | + * @n: Number of GPIO lines in this input set | ||
39 | + */ | ||
40 | +void qdev_init_gpio_in_named_with_opaque(DeviceState *dev, | ||
41 | + qemu_irq_handler handler, | ||
42 | + void *opaque, | ||
43 | + const char *name, int n); | ||
44 | + | ||
45 | +/** | ||
46 | + * qdev_init_gpio_in_named: create an array of input GPIO lines | ||
47 | + * for the specified device | ||
48 | + * | ||
49 | + * Like qdev_init_gpio_in_named_with_opaque(), but the opaque pointer | ||
50 | + * passed to the handler is @dev (which is the most commonly desired behaviour). | ||
51 | + */ | ||
52 | +static inline void qdev_init_gpio_in_named(DeviceState *dev, | ||
53 | + qemu_irq_handler handler, | ||
54 | + const char *name, int n) | ||
55 | +{ | ||
56 | + qdev_init_gpio_in_named_with_opaque(dev, handler, dev, name, n); | ||
57 | +} | ||
58 | |||
59 | void qdev_pass_gpios(DeviceState *dev, DeviceState *container, | ||
60 | const char *name); | ||
61 | diff --git a/hw/core/qdev.c b/hw/core/qdev.c | ||
29 | index XXXXXXX..XXXXXXX 100644 | 62 | index XXXXXXX..XXXXXXX 100644 |
30 | --- a/target/arm/helper-a64.c | 63 | --- a/hw/core/qdev.c |
31 | +++ b/target/arm/helper-a64.c | 64 | +++ b/hw/core/qdev.c |
32 | @@ -XXX,XX +XXX,XX @@ float16 ADVSIMD_HELPER(name, h)(float16 a, float16 b, void *fpstp) \ | 65 | @@ -XXX,XX +XXX,XX @@ static NamedGPIOList *qdev_get_named_gpio_list(DeviceState *dev, |
33 | return float16_ ## name(a, b, fpst); \ | 66 | return ngl; |
34 | } | 67 | } |
35 | 68 | ||
36 | +ADVSIMD_HALFOP(add) | 69 | -void qdev_init_gpio_in_named(DeviceState *dev, qemu_irq_handler handler, |
37 | +ADVSIMD_HALFOP(sub) | 70 | - const char *name, int n) |
38 | +ADVSIMD_HALFOP(mul) | 71 | +void qdev_init_gpio_in_named_with_opaque(DeviceState *dev, |
39 | +ADVSIMD_HALFOP(div) | 72 | + qemu_irq_handler handler, |
40 | ADVSIMD_HALFOP(min) | 73 | + void *opaque, |
41 | ADVSIMD_HALFOP(max) | 74 | + const char *name, int n) |
42 | ADVSIMD_HALFOP(minnum) | 75 | { |
43 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 76 | int i; |
44 | index XXXXXXX..XXXXXXX 100644 | 77 | NamedGPIOList *gpio_list = qdev_get_named_gpio_list(dev, name); |
45 | --- a/target/arm/translate-a64.c | 78 | |
46 | +++ b/target/arm/translate-a64.c | 79 | assert(gpio_list->num_out == 0 || !name); |
47 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 80 | gpio_list->in = qemu_extend_irqs(gpio_list->in, gpio_list->num_in, handler, |
48 | read_vec_element_i32(s, tcg_op2, rm, pass, MO_16); | 81 | - dev, n); |
49 | 82 | + opaque, n); | |
50 | switch (fpopcode) { | 83 | |
51 | + case 0x0: /* FMAXNM */ | 84 | if (!name) { |
52 | + gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst); | 85 | name = "unnamed-gpio-in"; |
53 | + break; | ||
54 | + case 0x2: /* FADD */ | ||
55 | + gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
56 | + break; | ||
57 | + case 0x6: /* FMAX */ | ||
58 | + gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
59 | + break; | ||
60 | + case 0x8: /* FMINNM */ | ||
61 | + gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
62 | + break; | ||
63 | + case 0xa: /* FSUB */ | ||
64 | + gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
65 | + break; | ||
66 | + case 0xe: /* FMIN */ | ||
67 | + gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
68 | + break; | ||
69 | + case 0x13: /* FMUL */ | ||
70 | + gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
71 | + break; | ||
72 | + case 0x17: /* FDIV */ | ||
73 | + gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
74 | + break; | ||
75 | + case 0x1a: /* FABD */ | ||
76 | + gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
77 | + tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff); | ||
78 | + break; | ||
79 | default: | ||
80 | fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n", | ||
81 | __func__, insn, fpopcode, s->pc); | ||
82 | -- | 86 | -- |
83 | 2.16.2 | 87 | 2.16.2 |
84 | 88 | ||
85 | 89 | diff view generated by jsdifflib |
1 | From: Corey Minyard <cminyard@mvista.com> | 1 | In some board or SoC models it is necessary to split a qemu_irq line |
---|---|---|---|
2 | 2 | so that one input can feed multiple outputs. We currently have | |
3 | Some devices need access to it. | 3 | qemu_irq_split() for this, but that has several deficiencies: |
4 | 4 | * it can only handle splitting a line into two | |
5 | Signed-off-by: Corey Minyard <cminyard@mvista.com> | 5 | * it unavoidably leaks memory, so it can't be used |
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | 6 | in a device that can be deleted |
7 | Signed-off-by: Linus Walleij <linus.walleij@linaro.org> | 7 | |
8 | Message-id: 20180227104903.21353-3-linus.walleij@linaro.org | 8 | Implement a qdev device that encapsulates splitting of IRQs, with a |
9 | configurable number of outputs. (This is in some ways the inverse of | ||
10 | the TYPE_OR_IRQ device.) | ||
11 | |||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
13 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
14 | Message-id: 20180220180325.29818-13-peter.maydell@linaro.org | ||
10 | --- | 15 | --- |
11 | include/hw/i2c/i2c.h | 17 +++++++++++++++++ | 16 | hw/core/Makefile.objs | 1 + |
12 | hw/i2c/core.c | 17 ----------------- | 17 | include/hw/core/split-irq.h | 57 +++++++++++++++++++++++++++++ |
13 | 2 files changed, 17 insertions(+), 17 deletions(-) | 18 | include/hw/irq.h | 4 +- |
14 | 19 | hw/core/split-irq.c | 89 +++++++++++++++++++++++++++++++++++++++++++++ | |
15 | diff --git a/include/hw/i2c/i2c.h b/include/hw/i2c/i2c.h | 20 | 4 files changed, 150 insertions(+), 1 deletion(-) |
21 | create mode 100644 include/hw/core/split-irq.h | ||
22 | create mode 100644 hw/core/split-irq.c | ||
23 | |||
24 | diff --git a/hw/core/Makefile.objs b/hw/core/Makefile.objs | ||
16 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/include/hw/i2c/i2c.h | 26 | --- a/hw/core/Makefile.objs |
18 | +++ b/include/hw/i2c/i2c.h | 27 | +++ b/hw/core/Makefile.objs |
19 | @@ -XXX,XX +XXX,XX @@ struct I2CSlave { | 28 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_FITLOADER) += loader-fit.o |
20 | uint8_t address; | 29 | common-obj-$(CONFIG_SOFTMMU) += qdev-properties-system.o |
21 | }; | 30 | common-obj-$(CONFIG_SOFTMMU) += register.o |
22 | 31 | common-obj-$(CONFIG_SOFTMMU) += or-irq.o | |
23 | +#define TYPE_I2C_BUS "i2c-bus" | 32 | +common-obj-$(CONFIG_SOFTMMU) += split-irq.o |
24 | +#define I2C_BUS(obj) OBJECT_CHECK(I2CBus, (obj), TYPE_I2C_BUS) | 33 | common-obj-$(CONFIG_PLATFORM_BUS) += platform-bus.o |
25 | + | 34 | |
26 | +typedef struct I2CNode I2CNode; | 35 | obj-$(CONFIG_SOFTMMU) += generic-loader.o |
27 | + | 36 | diff --git a/include/hw/core/split-irq.h b/include/hw/core/split-irq.h |
28 | +struct I2CNode { | 37 | new file mode 100644 |
29 | + I2CSlave *elt; | 38 | index XXXXXXX..XXXXXXX |
30 | + QLIST_ENTRY(I2CNode) next; | 39 | --- /dev/null |
40 | +++ b/include/hw/core/split-irq.h | ||
41 | @@ -XXX,XX +XXX,XX @@ | ||
42 | +/* | ||
43 | + * IRQ splitter device. | ||
44 | + * | ||
45 | + * Copyright (c) 2018 Linaro Limited. | ||
46 | + * Written by Peter Maydell | ||
47 | + * | ||
48 | + * Permission is hereby granted, free of charge, to any person obtaining a copy | ||
49 | + * of this software and associated documentation files (the "Software"), to deal | ||
50 | + * in the Software without restriction, including without limitation the rights | ||
51 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
52 | + * copies of the Software, and to permit persons to whom the Software is | ||
53 | + * furnished to do so, subject to the following conditions: | ||
54 | + * | ||
55 | + * The above copyright notice and this permission notice shall be included in | ||
56 | + * all copies or substantial portions of the Software. | ||
57 | + * | ||
58 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
59 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
60 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | ||
61 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
62 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
63 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
64 | + * THE SOFTWARE. | ||
65 | + */ | ||
66 | + | ||
67 | +/* This is a simple device which has one GPIO input line and multiple | ||
68 | + * GPIO output lines. Any change on the input line is forwarded to all | ||
69 | + * of the outputs. | ||
70 | + * | ||
71 | + * QEMU interface: | ||
72 | + * + one unnamed GPIO input: the input line | ||
73 | + * + N unnamed GPIO outputs: the output lines | ||
74 | + * + QOM property "num-lines": sets the number of output lines | ||
75 | + */ | ||
76 | +#ifndef HW_SPLIT_IRQ_H | ||
77 | +#define HW_SPLIT_IRQ_H | ||
78 | + | ||
79 | +#include "hw/irq.h" | ||
80 | +#include "hw/sysbus.h" | ||
81 | +#include "qom/object.h" | ||
82 | + | ||
83 | +#define TYPE_SPLIT_IRQ "split-irq" | ||
84 | + | ||
85 | +#define MAX_SPLIT_LINES 16 | ||
86 | + | ||
87 | +typedef struct SplitIRQ SplitIRQ; | ||
88 | + | ||
89 | +#define SPLIT_IRQ(obj) OBJECT_CHECK(SplitIRQ, (obj), TYPE_SPLIT_IRQ) | ||
90 | + | ||
91 | +struct SplitIRQ { | ||
92 | + DeviceState parent_obj; | ||
93 | + | ||
94 | + qemu_irq out_irq[MAX_SPLIT_LINES]; | ||
95 | + uint16_t num_lines; | ||
31 | +}; | 96 | +}; |
32 | + | 97 | + |
33 | +struct I2CBus { | 98 | +#endif |
34 | + BusState qbus; | 99 | diff --git a/include/hw/irq.h b/include/hw/irq.h |
35 | + QLIST_HEAD(, I2CNode) current_devs; | 100 | index XXXXXXX..XXXXXXX 100644 |
36 | + uint8_t saved_address; | 101 | --- a/include/hw/irq.h |
37 | + bool broadcast; | 102 | +++ b/include/hw/irq.h |
103 | @@ -XXX,XX +XXX,XX @@ void qemu_free_irq(qemu_irq irq); | ||
104 | /* Returns a new IRQ with opposite polarity. */ | ||
105 | qemu_irq qemu_irq_invert(qemu_irq irq); | ||
106 | |||
107 | -/* Returns a new IRQ which feeds into both the passed IRQs */ | ||
108 | +/* Returns a new IRQ which feeds into both the passed IRQs. | ||
109 | + * It's probably better to use the TYPE_SPLIT_IRQ device instead. | ||
110 | + */ | ||
111 | qemu_irq qemu_irq_split(qemu_irq irq1, qemu_irq irq2); | ||
112 | |||
113 | /* Returns a new IRQ set which connects 1:1 to another IRQ set, which | ||
114 | diff --git a/hw/core/split-irq.c b/hw/core/split-irq.c | ||
115 | new file mode 100644 | ||
116 | index XXXXXXX..XXXXXXX | ||
117 | --- /dev/null | ||
118 | +++ b/hw/core/split-irq.c | ||
119 | @@ -XXX,XX +XXX,XX @@ | ||
120 | +/* | ||
121 | + * IRQ splitter device. | ||
122 | + * | ||
123 | + * Copyright (c) 2018 Linaro Limited. | ||
124 | + * Written by Peter Maydell | ||
125 | + * | ||
126 | + * Permission is hereby granted, free of charge, to any person obtaining a copy | ||
127 | + * of this software and associated documentation files (the "Software"), to deal | ||
128 | + * in the Software without restriction, including without limitation the rights | ||
129 | + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
130 | + * copies of the Software, and to permit persons to whom the Software is | ||
131 | + * furnished to do so, subject to the following conditions: | ||
132 | + * | ||
133 | + * The above copyright notice and this permission notice shall be included in | ||
134 | + * all copies or substantial portions of the Software. | ||
135 | + * | ||
136 | + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
137 | + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
138 | + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | ||
139 | + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
140 | + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
141 | + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
142 | + * THE SOFTWARE. | ||
143 | + */ | ||
144 | + | ||
145 | +#include "qemu/osdep.h" | ||
146 | +#include "hw/core/split-irq.h" | ||
147 | +#include "qapi/error.h" | ||
148 | + | ||
149 | +static void split_irq_handler(void *opaque, int n, int level) | ||
150 | +{ | ||
151 | + SplitIRQ *s = SPLIT_IRQ(opaque); | ||
152 | + int i; | ||
153 | + | ||
154 | + for (i = 0; i < s->num_lines; i++) { | ||
155 | + qemu_set_irq(s->out_irq[i], level); | ||
156 | + } | ||
157 | +} | ||
158 | + | ||
159 | +static void split_irq_init(Object *obj) | ||
160 | +{ | ||
161 | + qdev_init_gpio_in(DEVICE(obj), split_irq_handler, 1); | ||
162 | +} | ||
163 | + | ||
164 | +static void split_irq_realize(DeviceState *dev, Error **errp) | ||
165 | +{ | ||
166 | + SplitIRQ *s = SPLIT_IRQ(dev); | ||
167 | + | ||
168 | + if (s->num_lines < 1 || s->num_lines >= MAX_SPLIT_LINES) { | ||
169 | + error_setg(errp, | ||
170 | + "IRQ splitter number of lines %d is not between 1 and %d", | ||
171 | + s->num_lines, MAX_SPLIT_LINES); | ||
172 | + return; | ||
173 | + } | ||
174 | + | ||
175 | + qdev_init_gpio_out(dev, s->out_irq, s->num_lines); | ||
176 | +} | ||
177 | + | ||
178 | +static Property split_irq_properties[] = { | ||
179 | + DEFINE_PROP_UINT16("num-lines", SplitIRQ, num_lines, 1), | ||
180 | + DEFINE_PROP_END_OF_LIST(), | ||
38 | +}; | 181 | +}; |
39 | + | 182 | + |
40 | I2CBus *i2c_init_bus(DeviceState *parent, const char *name); | 183 | +static void split_irq_class_init(ObjectClass *klass, void *data) |
41 | void i2c_set_slave_address(I2CSlave *dev, uint8_t address); | 184 | +{ |
42 | int i2c_bus_busy(I2CBus *bus); | 185 | + DeviceClass *dc = DEVICE_CLASS(klass); |
43 | diff --git a/hw/i2c/core.c b/hw/i2c/core.c | 186 | + |
44 | index XXXXXXX..XXXXXXX 100644 | 187 | + /* No state to reset or migrate */ |
45 | --- a/hw/i2c/core.c | 188 | + dc->props = split_irq_properties; |
46 | +++ b/hw/i2c/core.c | 189 | + dc->realize = split_irq_realize; |
47 | @@ -XXX,XX +XXX,XX @@ | 190 | + |
48 | #include "qemu/osdep.h" | 191 | + /* Reason: Needs to be wired up to work */ |
49 | #include "hw/i2c/i2c.h" | 192 | + dc->user_creatable = false; |
50 | 193 | +} | |
51 | -typedef struct I2CNode I2CNode; | 194 | + |
52 | - | 195 | +static const TypeInfo split_irq_type_info = { |
53 | -struct I2CNode { | 196 | + .name = TYPE_SPLIT_IRQ, |
54 | - I2CSlave *elt; | 197 | + .parent = TYPE_DEVICE, |
55 | - QLIST_ENTRY(I2CNode) next; | 198 | + .instance_size = sizeof(SplitIRQ), |
56 | -}; | 199 | + .instance_init = split_irq_init, |
57 | - | 200 | + .class_init = split_irq_class_init, |
58 | #define I2C_BROADCAST 0x00 | 201 | +}; |
59 | 202 | + | |
60 | -struct I2CBus { | 203 | +static void split_irq_register_types(void) |
61 | - BusState qbus; | 204 | +{ |
62 | - QLIST_HEAD(, I2CNode) current_devs; | 205 | + type_register_static(&split_irq_type_info); |
63 | - uint8_t saved_address; | 206 | +} |
64 | - bool broadcast; | 207 | + |
65 | -}; | 208 | +type_init(split_irq_register_types) |
66 | - | ||
67 | static Property i2c_props[] = { | ||
68 | DEFINE_PROP_UINT8("address", struct I2CSlave, address, 0), | ||
69 | DEFINE_PROP_END_OF_LIST(), | ||
70 | }; | ||
71 | |||
72 | -#define TYPE_I2C_BUS "i2c-bus" | ||
73 | -#define I2C_BUS(obj) OBJECT_CHECK(I2CBus, (obj), TYPE_I2C_BUS) | ||
74 | - | ||
75 | static const TypeInfo i2c_bus_info = { | ||
76 | .name = TYPE_I2C_BUS, | ||
77 | .parent = TYPE_BUS, | ||
78 | -- | 209 | -- |
79 | 2.16.2 | 210 | 2.16.2 |
80 | 211 | ||
81 | 212 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | The MPS2 AN505 FPGA image includes a "FPGA control block" |
---|---|---|---|
2 | 2 | which is a small set of registers handling LEDs, buttons | |
3 | This includes FMAXNMP, FADDP, FMAXP, FMINNMP, FMINP. | 3 | and some counters. |
4 | 4 | ||
5 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
7 | Message-id: 20180227143852.11175-14-alex.bennee@linaro.org | 7 | Message-id: 20180220180325.29818-14-peter.maydell@linaro.org |
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | --- | 8 | --- |
10 | target/arm/translate-a64.c | 208 +++++++++++++++++++++++++++++---------------- | 9 | hw/misc/Makefile.objs | 1 + |
11 | 1 file changed, 133 insertions(+), 75 deletions(-) | 10 | include/hw/misc/mps2-fpgaio.h | 43 ++++++++++ |
12 | 11 | hw/misc/mps2-fpgaio.c | 176 ++++++++++++++++++++++++++++++++++++++++ | |
13 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 12 | default-configs/arm-softmmu.mak | 1 + |
13 | hw/misc/trace-events | 6 ++ | ||
14 | 5 files changed, 227 insertions(+) | ||
15 | create mode 100644 include/hw/misc/mps2-fpgaio.h | ||
16 | create mode 100644 hw/misc/mps2-fpgaio.c | ||
17 | |||
18 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs | ||
14 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/translate-a64.c | 20 | --- a/hw/misc/Makefile.objs |
16 | +++ b/target/arm/translate-a64.c | 21 | +++ b/hw/misc/Makefile.objs |
17 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 22 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_STM32F2XX_SYSCFG) += stm32f2xx_syscfg.o |
18 | int datasize, elements; | 23 | obj-$(CONFIG_MIPS_CPS) += mips_cmgcr.o |
19 | int pass; | 24 | obj-$(CONFIG_MIPS_CPS) += mips_cpc.o |
20 | TCGv_ptr fpst; | 25 | obj-$(CONFIG_MIPS_ITU) += mips_itu.o |
21 | + bool pairwise = false; | 26 | +obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o |
22 | 27 | obj-$(CONFIG_MPS2_SCC) += mps2-scc.o | |
23 | if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 28 | |
24 | unallocated_encoding(s); | 29 | obj-$(CONFIG_PVPANIC) += pvpanic.o |
25 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 30 | diff --git a/include/hw/misc/mps2-fpgaio.h b/include/hw/misc/mps2-fpgaio.h |
26 | datasize = is_q ? 128 : 64; | 31 | new file mode 100644 |
27 | elements = datasize / 16; | 32 | index XXXXXXX..XXXXXXX |
28 | 33 | --- /dev/null | |
29 | + switch (fpopcode) { | 34 | +++ b/include/hw/misc/mps2-fpgaio.h |
30 | + case 0x10: /* FMAXNMP */ | 35 | @@ -XXX,XX +XXX,XX @@ |
31 | + case 0x12: /* FADDP */ | 36 | +/* |
32 | + case 0x16: /* FMAXP */ | 37 | + * ARM MPS2 FPGAIO emulation |
33 | + case 0x18: /* FMINNMP */ | 38 | + * |
34 | + case 0x1e: /* FMINP */ | 39 | + * Copyright (c) 2018 Linaro Limited |
35 | + pairwise = true; | 40 | + * Written by Peter Maydell |
41 | + * | ||
42 | + * This program is free software; you can redistribute it and/or modify | ||
43 | + * it under the terms of the GNU General Public License version 2 or | ||
44 | + * (at your option) any later version. | ||
45 | + */ | ||
46 | + | ||
47 | +/* This is a model of the FPGAIO register block in the AN505 | ||
48 | + * FPGA image for the MPS2 dev board; it is documented in the | ||
49 | + * application note: | ||
50 | + * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html | ||
51 | + * | ||
52 | + * QEMU interface: | ||
53 | + * + sysbus MMIO region 0: the register bank | ||
54 | + */ | ||
55 | + | ||
56 | +#ifndef MPS2_FPGAIO_H | ||
57 | +#define MPS2_FPGAIO_H | ||
58 | + | ||
59 | +#include "hw/sysbus.h" | ||
60 | + | ||
61 | +#define TYPE_MPS2_FPGAIO "mps2-fpgaio" | ||
62 | +#define MPS2_FPGAIO(obj) OBJECT_CHECK(MPS2FPGAIO, (obj), TYPE_MPS2_FPGAIO) | ||
63 | + | ||
64 | +typedef struct { | ||
65 | + /*< private >*/ | ||
66 | + SysBusDevice parent_obj; | ||
67 | + | ||
68 | + /*< public >*/ | ||
69 | + MemoryRegion iomem; | ||
70 | + | ||
71 | + uint32_t led0; | ||
72 | + uint32_t prescale; | ||
73 | + uint32_t misc; | ||
74 | + | ||
75 | + uint32_t prescale_clk; | ||
76 | +} MPS2FPGAIO; | ||
77 | + | ||
78 | +#endif | ||
79 | diff --git a/hw/misc/mps2-fpgaio.c b/hw/misc/mps2-fpgaio.c | ||
80 | new file mode 100644 | ||
81 | index XXXXXXX..XXXXXXX | ||
82 | --- /dev/null | ||
83 | +++ b/hw/misc/mps2-fpgaio.c | ||
84 | @@ -XXX,XX +XXX,XX @@ | ||
85 | +/* | ||
86 | + * ARM MPS2 AN505 FPGAIO emulation | ||
87 | + * | ||
88 | + * Copyright (c) 2018 Linaro Limited | ||
89 | + * Written by Peter Maydell | ||
90 | + * | ||
91 | + * This program is free software; you can redistribute it and/or modify | ||
92 | + * it under the terms of the GNU General Public License version 2 or | ||
93 | + * (at your option) any later version. | ||
94 | + */ | ||
95 | + | ||
96 | +/* This is a model of the "FPGA system control and I/O" block found | ||
97 | + * in the AN505 FPGA image for the MPS2 devboard. | ||
98 | + * It is documented in AN505: | ||
99 | + * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html | ||
100 | + */ | ||
101 | + | ||
102 | +#include "qemu/osdep.h" | ||
103 | +#include "qemu/log.h" | ||
104 | +#include "qapi/error.h" | ||
105 | +#include "trace.h" | ||
106 | +#include "hw/sysbus.h" | ||
107 | +#include "hw/registerfields.h" | ||
108 | +#include "hw/misc/mps2-fpgaio.h" | ||
109 | + | ||
110 | +REG32(LED0, 0) | ||
111 | +REG32(BUTTON, 8) | ||
112 | +REG32(CLK1HZ, 0x10) | ||
113 | +REG32(CLK100HZ, 0x14) | ||
114 | +REG32(COUNTER, 0x18) | ||
115 | +REG32(PRESCALE, 0x1c) | ||
116 | +REG32(PSCNTR, 0x20) | ||
117 | +REG32(MISC, 0x4c) | ||
118 | + | ||
119 | +static uint64_t mps2_fpgaio_read(void *opaque, hwaddr offset, unsigned size) | ||
120 | +{ | ||
121 | + MPS2FPGAIO *s = MPS2_FPGAIO(opaque); | ||
122 | + uint64_t r; | ||
123 | + | ||
124 | + switch (offset) { | ||
125 | + case A_LED0: | ||
126 | + r = s->led0; | ||
127 | + break; | ||
128 | + case A_BUTTON: | ||
129 | + /* User-pressable board buttons. We don't model that, so just return | ||
130 | + * zeroes. | ||
131 | + */ | ||
132 | + r = 0; | ||
133 | + break; | ||
134 | + case A_PRESCALE: | ||
135 | + r = s->prescale; | ||
136 | + break; | ||
137 | + case A_MISC: | ||
138 | + r = s->misc; | ||
139 | + break; | ||
140 | + case A_CLK1HZ: | ||
141 | + case A_CLK100HZ: | ||
142 | + case A_COUNTER: | ||
143 | + case A_PSCNTR: | ||
144 | + /* These are all upcounters of various frequencies. */ | ||
145 | + qemu_log_mask(LOG_UNIMP, "MPS2 FPGAIO: counters unimplemented\n"); | ||
146 | + r = 0; | ||
147 | + break; | ||
148 | + default: | ||
149 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
150 | + "MPS2 FPGAIO read: bad offset %x\n", (int) offset); | ||
151 | + r = 0; | ||
36 | + break; | 152 | + break; |
37 | + } | 153 | + } |
38 | + | 154 | + |
39 | fpst = get_fpstatus_ptr(true); | 155 | + trace_mps2_fpgaio_read(offset, r, size); |
40 | 156 | + return r; | |
41 | - for (pass = 0; pass < elements; pass++) { | 157 | +} |
42 | + if (pairwise) { | 158 | + |
43 | + int maxpass = is_q ? 8 : 4; | 159 | +static void mps2_fpgaio_write(void *opaque, hwaddr offset, uint64_t value, |
44 | TCGv_i32 tcg_op1 = tcg_temp_new_i32(); | 160 | + unsigned size) |
45 | TCGv_i32 tcg_op2 = tcg_temp_new_i32(); | 161 | +{ |
46 | - TCGv_i32 tcg_res = tcg_temp_new_i32(); | 162 | + MPS2FPGAIO *s = MPS2_FPGAIO(opaque); |
47 | + TCGv_i32 tcg_res[8]; | 163 | + |
48 | 164 | + trace_mps2_fpgaio_write(offset, value, size); | |
49 | - read_vec_element_i32(s, tcg_op1, rn, pass, MO_16); | 165 | + |
50 | - read_vec_element_i32(s, tcg_op2, rm, pass, MO_16); | 166 | + switch (offset) { |
51 | + for (pass = 0; pass < maxpass; pass++) { | 167 | + case A_LED0: |
52 | + int passreg = pass < (maxpass / 2) ? rn : rm; | 168 | + /* LED bits [1:0] control board LEDs. We don't currently have |
53 | + int passelt = (pass << 1) & (maxpass - 1); | 169 | + * a mechanism for displaying this graphically, so use a trace event. |
54 | 170 | + */ | |
55 | - switch (fpopcode) { | 171 | + trace_mps2_fpgaio_leds(value & 0x02 ? '*' : '.', |
56 | - case 0x0: /* FMAXNM */ | 172 | + value & 0x01 ? '*' : '.'); |
57 | - gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst); | 173 | + s->led0 = value & 0x3; |
58 | - break; | 174 | + break; |
59 | - case 0x1: /* FMLA */ | 175 | + case A_PRESCALE: |
60 | - read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | 176 | + s->prescale = value; |
61 | - gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | 177 | + break; |
62 | - fpst); | 178 | + case A_MISC: |
63 | - break; | 179 | + /* These are control bits for some of the other devices on the |
64 | - case 0x2: /* FADD */ | 180 | + * board (SPI, CLCD, etc). We don't implement that yet, so just |
65 | - gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | 181 | + * make the bits read as written. |
66 | - break; | 182 | + */ |
67 | - case 0x3: /* FMULX */ | 183 | + qemu_log_mask(LOG_UNIMP, |
68 | - gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst); | 184 | + "MPS2 FPGAIO: MISC control bits unimplemented\n"); |
69 | - break; | 185 | + s->misc = value; |
70 | - case 0x4: /* FCMEQ */ | 186 | + break; |
71 | - gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 187 | + default: |
72 | - break; | 188 | + qemu_log_mask(LOG_GUEST_ERROR, |
73 | - case 0x6: /* FMAX */ | 189 | + "MPS2 FPGAIO write: bad offset 0x%x\n", (int) offset); |
74 | - gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | 190 | + break; |
75 | - break; | 191 | + } |
76 | - case 0x7: /* FRECPS */ | 192 | +} |
77 | - gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 193 | + |
78 | - break; | 194 | +static const MemoryRegionOps mps2_fpgaio_ops = { |
79 | - case 0x8: /* FMINNM */ | 195 | + .read = mps2_fpgaio_read, |
80 | - gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | 196 | + .write = mps2_fpgaio_write, |
81 | - break; | 197 | + .endianness = DEVICE_LITTLE_ENDIAN, |
82 | - case 0x9: /* FMLS */ | 198 | +}; |
83 | - /* As usual for ARM, separate negation for fused multiply-add */ | 199 | + |
84 | - tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000); | 200 | +static void mps2_fpgaio_reset(DeviceState *dev) |
85 | - read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | 201 | +{ |
86 | - gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | 202 | + MPS2FPGAIO *s = MPS2_FPGAIO(dev); |
87 | - fpst); | 203 | + |
88 | - break; | 204 | + trace_mps2_fpgaio_reset(); |
89 | - case 0xa: /* FSUB */ | 205 | + s->led0 = 0; |
90 | - gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | 206 | + s->prescale = 0; |
91 | - break; | 207 | + s->misc = 0; |
92 | - case 0xe: /* FMIN */ | 208 | +} |
93 | - gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst); | 209 | + |
94 | - break; | 210 | +static void mps2_fpgaio_init(Object *obj) |
95 | - case 0xf: /* FRSQRTS */ | 211 | +{ |
96 | - gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 212 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); |
97 | - break; | 213 | + MPS2FPGAIO *s = MPS2_FPGAIO(obj); |
98 | - case 0x13: /* FMUL */ | 214 | + |
99 | - gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst); | 215 | + memory_region_init_io(&s->iomem, obj, &mps2_fpgaio_ops, s, |
100 | - break; | 216 | + "mps2-fpgaio", 0x1000); |
101 | - case 0x14: /* FCMGE */ | 217 | + sysbus_init_mmio(sbd, &s->iomem); |
102 | - gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 218 | +} |
103 | - break; | 219 | + |
104 | - case 0x15: /* FACGE */ | 220 | +static const VMStateDescription mps2_fpgaio_vmstate = { |
105 | - gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 221 | + .name = "mps2-fpgaio", |
106 | - break; | 222 | + .version_id = 1, |
107 | - case 0x17: /* FDIV */ | 223 | + .minimum_version_id = 1, |
108 | - gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst); | 224 | + .fields = (VMStateField[]) { |
109 | - break; | 225 | + VMSTATE_UINT32(led0, MPS2FPGAIO), |
110 | - case 0x1a: /* FABD */ | 226 | + VMSTATE_UINT32(prescale, MPS2FPGAIO), |
111 | - gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | 227 | + VMSTATE_UINT32(misc, MPS2FPGAIO), |
112 | - tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff); | 228 | + VMSTATE_END_OF_LIST() |
113 | - break; | 229 | + } |
114 | - case 0x1c: /* FCMGT */ | 230 | +}; |
115 | - gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 231 | + |
116 | - break; | 232 | +static Property mps2_fpgaio_properties[] = { |
117 | - case 0x1d: /* FACGT */ | 233 | + /* Frequency of the prescale counter */ |
118 | - gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 234 | + DEFINE_PROP_UINT32("prescale-clk", MPS2FPGAIO, prescale_clk, 20000000), |
119 | - break; | 235 | + DEFINE_PROP_END_OF_LIST(), |
120 | - default: | 236 | +}; |
121 | - fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n", | 237 | + |
122 | - __func__, insn, fpopcode, s->pc); | 238 | +static void mps2_fpgaio_class_init(ObjectClass *klass, void *data) |
123 | - g_assert_not_reached(); | 239 | +{ |
124 | + read_vec_element_i32(s, tcg_op1, passreg, passelt, MO_16); | 240 | + DeviceClass *dc = DEVICE_CLASS(klass); |
125 | + read_vec_element_i32(s, tcg_op2, passreg, passelt + 1, MO_16); | 241 | + |
126 | + tcg_res[pass] = tcg_temp_new_i32(); | 242 | + dc->vmsd = &mps2_fpgaio_vmstate; |
127 | + | 243 | + dc->reset = mps2_fpgaio_reset; |
128 | + switch (fpopcode) { | 244 | + dc->props = mps2_fpgaio_properties; |
129 | + case 0x10: /* FMAXNMP */ | 245 | +} |
130 | + gen_helper_advsimd_maxnumh(tcg_res[pass], tcg_op1, tcg_op2, | 246 | + |
131 | + fpst); | 247 | +static const TypeInfo mps2_fpgaio_info = { |
132 | + break; | 248 | + .name = TYPE_MPS2_FPGAIO, |
133 | + case 0x12: /* FADDP */ | 249 | + .parent = TYPE_SYS_BUS_DEVICE, |
134 | + gen_helper_advsimd_addh(tcg_res[pass], tcg_op1, tcg_op2, fpst); | 250 | + .instance_size = sizeof(MPS2FPGAIO), |
135 | + break; | 251 | + .instance_init = mps2_fpgaio_init, |
136 | + case 0x16: /* FMAXP */ | 252 | + .class_init = mps2_fpgaio_class_init, |
137 | + gen_helper_advsimd_maxh(tcg_res[pass], tcg_op1, tcg_op2, fpst); | 253 | +}; |
138 | + break; | 254 | + |
139 | + case 0x18: /* FMINNMP */ | 255 | +static void mps2_fpgaio_register_types(void) |
140 | + gen_helper_advsimd_minnumh(tcg_res[pass], tcg_op1, tcg_op2, | 256 | +{ |
141 | + fpst); | 257 | + type_register_static(&mps2_fpgaio_info); |
142 | + break; | 258 | +} |
143 | + case 0x1e: /* FMINP */ | 259 | + |
144 | + gen_helper_advsimd_minh(tcg_res[pass], tcg_op1, tcg_op2, fpst); | 260 | +type_init(mps2_fpgaio_register_types); |
145 | + break; | 261 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak |
146 | + default: | 262 | index XXXXXXX..XXXXXXX 100644 |
147 | + g_assert_not_reached(); | 263 | --- a/default-configs/arm-softmmu.mak |
148 | + } | 264 | +++ b/default-configs/arm-softmmu.mak |
149 | + } | 265 | @@ -XXX,XX +XXX,XX @@ CONFIG_STM32F205_SOC=y |
150 | + | 266 | CONFIG_CMSDK_APB_TIMER=y |
151 | + for (pass = 0; pass < maxpass; pass++) { | 267 | CONFIG_CMSDK_APB_UART=y |
152 | + write_vec_element_i32(s, tcg_res[pass], rd, pass, MO_16); | 268 | |
153 | + tcg_temp_free_i32(tcg_res[pass]); | 269 | +CONFIG_MPS2_FPGAIO=y |
154 | } | 270 | CONFIG_MPS2_SCC=y |
155 | 271 | ||
156 | - write_vec_element_i32(s, tcg_res, rd, pass, MO_16); | 272 | CONFIG_VERSATILE_PCI=y |
157 | - tcg_temp_free_i32(tcg_res); | 273 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events |
158 | tcg_temp_free_i32(tcg_op1); | 274 | index XXXXXXX..XXXXXXX 100644 |
159 | tcg_temp_free_i32(tcg_op2); | 275 | --- a/hw/misc/trace-events |
160 | + | 276 | +++ b/hw/misc/trace-events |
161 | + } else { | 277 | @@ -XXX,XX +XXX,XX @@ mps2_scc_leds(char led7, char led6, char led5, char led4, char led3, char led2, |
162 | + for (pass = 0; pass < elements; pass++) { | 278 | mps2_scc_cfg_write(unsigned function, unsigned device, uint32_t value) "MPS2 SCC config write: function %d device %d data 0x%" PRIx32 |
163 | + TCGv_i32 tcg_op1 = tcg_temp_new_i32(); | 279 | mps2_scc_cfg_read(unsigned function, unsigned device, uint32_t value) "MPS2 SCC config read: function %d device %d data 0x%" PRIx32 |
164 | + TCGv_i32 tcg_op2 = tcg_temp_new_i32(); | 280 | |
165 | + TCGv_i32 tcg_res = tcg_temp_new_i32(); | 281 | +# hw/misc/mps2_fpgaio.c |
166 | + | 282 | +mps2_fpgaio_read(uint64_t offset, uint64_t data, unsigned size) "MPS2 FPGAIO read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" |
167 | + read_vec_element_i32(s, tcg_op1, rn, pass, MO_16); | 283 | +mps2_fpgaio_write(uint64_t offset, uint64_t data, unsigned size) "MPS2 FPGAIO write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u" |
168 | + read_vec_element_i32(s, tcg_op2, rm, pass, MO_16); | 284 | +mps2_fpgaio_reset(void) "MPS2 FPGAIO: reset" |
169 | + | 285 | +mps2_fpgaio_leds(char led1, char led0) "MPS2 FPGAIO LEDs: %c%c" |
170 | + switch (fpopcode) { | 286 | + |
171 | + case 0x0: /* FMAXNM */ | 287 | # hw/misc/msf2-sysreg.c |
172 | + gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst); | 288 | msf2_sysreg_write(uint64_t offset, uint32_t val, uint32_t prev) "msf2-sysreg write: addr 0x%08" HWADDR_PRIx " data 0x%" PRIx32 " prev 0x%" PRIx32 |
173 | + break; | 289 | msf2_sysreg_read(uint64_t offset, uint32_t val) "msf2-sysreg read: addr 0x%08" HWADDR_PRIx " data 0x%08" PRIx32 |
174 | + case 0x1: /* FMLA */ | ||
175 | + read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | ||
176 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | ||
177 | + fpst); | ||
178 | + break; | ||
179 | + case 0x2: /* FADD */ | ||
180 | + gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
181 | + break; | ||
182 | + case 0x3: /* FMULX */ | ||
183 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
184 | + break; | ||
185 | + case 0x4: /* FCMEQ */ | ||
186 | + gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
187 | + break; | ||
188 | + case 0x6: /* FMAX */ | ||
189 | + gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
190 | + break; | ||
191 | + case 0x7: /* FRECPS */ | ||
192 | + gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
193 | + break; | ||
194 | + case 0x8: /* FMINNM */ | ||
195 | + gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
196 | + break; | ||
197 | + case 0x9: /* FMLS */ | ||
198 | + /* As usual for ARM, separate negation for fused multiply-add */ | ||
199 | + tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000); | ||
200 | + read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | ||
201 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | ||
202 | + fpst); | ||
203 | + break; | ||
204 | + case 0xa: /* FSUB */ | ||
205 | + gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
206 | + break; | ||
207 | + case 0xe: /* FMIN */ | ||
208 | + gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
209 | + break; | ||
210 | + case 0xf: /* FRSQRTS */ | ||
211 | + gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
212 | + break; | ||
213 | + case 0x13: /* FMUL */ | ||
214 | + gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
215 | + break; | ||
216 | + case 0x14: /* FCMGE */ | ||
217 | + gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
218 | + break; | ||
219 | + case 0x15: /* FACGE */ | ||
220 | + gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
221 | + break; | ||
222 | + case 0x17: /* FDIV */ | ||
223 | + gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
224 | + break; | ||
225 | + case 0x1a: /* FABD */ | ||
226 | + gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
227 | + tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff); | ||
228 | + break; | ||
229 | + case 0x1c: /* FCMGT */ | ||
230 | + gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
231 | + break; | ||
232 | + case 0x1d: /* FACGT */ | ||
233 | + gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
234 | + break; | ||
235 | + default: | ||
236 | + fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n", | ||
237 | + __func__, insn, fpopcode, s->pc); | ||
238 | + g_assert_not_reached(); | ||
239 | + } | ||
240 | + | ||
241 | + write_vec_element_i32(s, tcg_res, rd, pass, MO_16); | ||
242 | + tcg_temp_free_i32(tcg_res); | ||
243 | + tcg_temp_free_i32(tcg_op1); | ||
244 | + tcg_temp_free_i32(tcg_op2); | ||
245 | + } | ||
246 | } | ||
247 | |||
248 | tcg_temp_free_ptr(fpst); | ||
249 | -- | 290 | -- |
250 | 2.16.2 | 291 | 2.16.2 |
251 | 292 | ||
252 | 293 | diff view generated by jsdifflib |
1 | From: Linus Walleij <linus.walleij@linaro.org> | 1 | Add a model of the TrustZone peripheral protection controller (PPC), |
---|---|---|---|
2 | which is used to gate transactions to non-TZ-aware peripherals so | ||
3 | that secure software can configure them to not be accessible to | ||
4 | non-secure software. | ||
2 | 5 | ||
3 | This adds the SiI9022 (and implicitly EDID I2C) device to the ARM | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | Versatile Express machine, and selects the two I2C devices necessary | 7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | in the arm-softmmu.mak configuration so everything will build | 8 | Message-id: 20180220180325.29818-15-peter.maydell@linaro.org |
6 | smoothly. | 9 | --- |
10 | hw/misc/Makefile.objs | 2 + | ||
11 | include/hw/misc/tz-ppc.h | 101 ++++++++++++++ | ||
12 | hw/misc/tz-ppc.c | 302 ++++++++++++++++++++++++++++++++++++++++ | ||
13 | default-configs/arm-softmmu.mak | 2 + | ||
14 | hw/misc/trace-events | 11 ++ | ||
15 | 5 files changed, 418 insertions(+) | ||
16 | create mode 100644 include/hw/misc/tz-ppc.h | ||
17 | create mode 100644 hw/misc/tz-ppc.c | ||
7 | 18 | ||
8 | I am implementing proper handling of the graphics in the Linux | 19 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs |
9 | kernel and adding proper emulation of SiI9022 and EDID makes the | ||
10 | driver probe as nicely as before, retrieving the resolutions | ||
11 | supported by the "QEMU monitor" and overall just working nice. | ||
12 | |||
13 | Cc: Peter Maydell <peter.maydell@linaro.org> | ||
14 | Signed-off-by: Linus Walleij <linus.walleij@linaro.org> | ||
15 | Message-id: 20180227104903.21353-6-linus.walleij@linaro.org | ||
16 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
17 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> | ||
18 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
19 | --- | ||
20 | hw/arm/vexpress.c | 6 +++++- | ||
21 | default-configs/arm-softmmu.mak | 2 ++ | ||
22 | 2 files changed, 7 insertions(+), 1 deletion(-) | ||
23 | |||
24 | diff --git a/hw/arm/vexpress.c b/hw/arm/vexpress.c | ||
25 | index XXXXXXX..XXXXXXX 100644 | 20 | index XXXXXXX..XXXXXXX 100644 |
26 | --- a/hw/arm/vexpress.c | 21 | --- a/hw/misc/Makefile.objs |
27 | +++ b/hw/arm/vexpress.c | 22 | +++ b/hw/misc/Makefile.objs |
23 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_MIPS_ITU) += mips_itu.o | ||
24 | obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o | ||
25 | obj-$(CONFIG_MPS2_SCC) += mps2-scc.o | ||
26 | |||
27 | +obj-$(CONFIG_TZ_PPC) += tz-ppc.o | ||
28 | + | ||
29 | obj-$(CONFIG_PVPANIC) += pvpanic.o | ||
30 | obj-$(CONFIG_HYPERV_TESTDEV) += hyperv_testdev.o | ||
31 | obj-$(CONFIG_AUX) += auxbus.o | ||
32 | diff --git a/include/hw/misc/tz-ppc.h b/include/hw/misc/tz-ppc.h | ||
33 | new file mode 100644 | ||
34 | index XXXXXXX..XXXXXXX | ||
35 | --- /dev/null | ||
36 | +++ b/include/hw/misc/tz-ppc.h | ||
28 | @@ -XXX,XX +XXX,XX @@ | 37 | @@ -XXX,XX +XXX,XX @@ |
29 | #include "hw/arm/arm.h" | 38 | +/* |
30 | #include "hw/arm/primecell.h" | 39 | + * ARM TrustZone peripheral protection controller emulation |
31 | #include "hw/devices.h" | 40 | + * |
32 | +#include "hw/i2c/i2c.h" | 41 | + * Copyright (c) 2018 Linaro Limited |
33 | #include "net/net.h" | 42 | + * Written by Peter Maydell |
34 | #include "sysemu/sysemu.h" | 43 | + * |
35 | #include "hw/boards.h" | 44 | + * This program is free software; you can redistribute it and/or modify |
36 | @@ -XXX,XX +XXX,XX @@ static void vexpress_common_init(MachineState *machine) | 45 | + * it under the terms of the GNU General Public License version 2 or |
37 | uint32_t sys_id; | 46 | + * (at your option) any later version. |
38 | DriveInfo *dinfo; | 47 | + */ |
39 | pflash_t *pflash0; | 48 | + |
40 | + I2CBus *i2c; | 49 | +/* This is a model of the TrustZone peripheral protection controller (PPC). |
41 | ram_addr_t vram_size, sram_size; | 50 | + * It is documented in the ARM CoreLink SIE-200 System IP for Embedded TRM |
42 | MemoryRegion *sysmem = get_system_memory(); | 51 | + * (DDI 0571G): |
43 | MemoryRegion *vram = g_new(MemoryRegion, 1); | 52 | + * https://developer.arm.com/products/architecture/m-profile/docs/ddi0571/g |
44 | @@ -XXX,XX +XXX,XX @@ static void vexpress_common_init(MachineState *machine) | 53 | + * |
45 | sysbus_create_simple("sp804", map[VE_TIMER01], pic[2]); | 54 | + * The PPC sits in front of peripherals and allows secure software to |
46 | sysbus_create_simple("sp804", map[VE_TIMER23], pic[3]); | 55 | + * configure it to either pass through or reject transactions. |
47 | 56 | + * Rejected transactions may be configured to either be aborted, or to | |
48 | - /* VE_SERIALDVI: not modelled */ | 57 | + * behave as RAZ/WI. An interrupt can be signalled for a rejected transaction. |
49 | + dev = sysbus_create_simple("versatile_i2c", map[VE_SERIALDVI], NULL); | 58 | + * |
50 | + i2c = (I2CBus *)qdev_get_child_bus(dev, "i2c"); | 59 | + * The PPC has no register interface -- it is configured purely by a |
51 | + i2c_create_slave(i2c, "sii9022", 0x39); | 60 | + * collection of input signals from other hardware in the system. Typically |
52 | 61 | + * they are either hardwired or exposed in an ad-hoc register interface by | |
53 | sysbus_create_simple("pl031", map[VE_RTC], pic[4]); /* RTC */ | 62 | + * the SoC that uses the PPC. |
54 | 63 | + * | |
64 | + * This QEMU model can be used to model either the AHB5 or APB4 TZ PPC, | ||
65 | + * since the only difference between them is that the AHB version has a | ||
66 | + * "default" port which has no security checks applied. In QEMU the default | ||
67 | + * port can be emulated simply by wiring its downstream devices directly | ||
68 | + * into the parent address space, since the PPC does not need to intercept | ||
69 | + * transactions there. | ||
70 | + * | ||
71 | + * In the hardware, selection of which downstream port to use is done by | ||
72 | + * the user's decode logic asserting one of the hsel[] signals. In QEMU, | ||
73 | + * we provide 16 MMIO regions, one per port, and the user maps these into | ||
74 | + * the desired addresses to implement the address decode. | ||
75 | + * | ||
76 | + * QEMU interface: | ||
77 | + * + sysbus MMIO regions 0..15: MemoryRegions defining the upstream end | ||
78 | + * of each of the 16 ports of the PPC | ||
79 | + * + Property "port[0..15]": MemoryRegion defining the downstream device(s) | ||
80 | + * for each of the 16 ports of the PPC | ||
81 | + * + Named GPIO inputs "cfg_nonsec[0..15]": set to 1 if the port should be | ||
82 | + * accessible to NonSecure transactions | ||
83 | + * + Named GPIO inputs "cfg_ap[0..15]": set to 1 if the port should be | ||
84 | + * accessible to non-privileged transactions | ||
85 | + * + Named GPIO input "cfg_sec_resp": set to 1 if a rejected transaction should | ||
86 | + * result in a transaction error, or 0 for the transaction to RAZ/WI | ||
87 | + * + Named GPIO input "irq_enable": set to 1 to enable interrupts | ||
88 | + * + Named GPIO input "irq_clear": set to 1 to clear a pending interrupt | ||
89 | + * + Named GPIO output "irq": set for a transaction-failed interrupt | ||
90 | + * + Property "NONSEC_MASK": if a bit is set in this mask then accesses to | ||
91 | + * the associated port do not have the TZ security check performed. (This | ||
92 | + * corresponds to the hardware allowing this to be set as a Verilog | ||
93 | + * parameter.) | ||
94 | + */ | ||
95 | + | ||
96 | +#ifndef TZ_PPC_H | ||
97 | +#define TZ_PPC_H | ||
98 | + | ||
99 | +#include "hw/sysbus.h" | ||
100 | + | ||
101 | +#define TYPE_TZ_PPC "tz-ppc" | ||
102 | +#define TZ_PPC(obj) OBJECT_CHECK(TZPPC, (obj), TYPE_TZ_PPC) | ||
103 | + | ||
104 | +#define TZ_NUM_PORTS 16 | ||
105 | + | ||
106 | +typedef struct TZPPC TZPPC; | ||
107 | + | ||
108 | +typedef struct TZPPCPort { | ||
109 | + TZPPC *ppc; | ||
110 | + MemoryRegion upstream; | ||
111 | + AddressSpace downstream_as; | ||
112 | + MemoryRegion *downstream; | ||
113 | +} TZPPCPort; | ||
114 | + | ||
115 | +struct TZPPC { | ||
116 | + /*< private >*/ | ||
117 | + SysBusDevice parent_obj; | ||
118 | + | ||
119 | + /*< public >*/ | ||
120 | + | ||
121 | + /* State: these just track the values of our input signals */ | ||
122 | + bool cfg_nonsec[TZ_NUM_PORTS]; | ||
123 | + bool cfg_ap[TZ_NUM_PORTS]; | ||
124 | + bool cfg_sec_resp; | ||
125 | + bool irq_enable; | ||
126 | + bool irq_clear; | ||
127 | + /* State: are we asserting irq ? */ | ||
128 | + bool irq_status; | ||
129 | + | ||
130 | + qemu_irq irq; | ||
131 | + | ||
132 | + /* Properties */ | ||
133 | + uint32_t nonsec_mask; | ||
134 | + | ||
135 | + TZPPCPort port[TZ_NUM_PORTS]; | ||
136 | +}; | ||
137 | + | ||
138 | +#endif | ||
139 | diff --git a/hw/misc/tz-ppc.c b/hw/misc/tz-ppc.c | ||
140 | new file mode 100644 | ||
141 | index XXXXXXX..XXXXXXX | ||
142 | --- /dev/null | ||
143 | +++ b/hw/misc/tz-ppc.c | ||
144 | @@ -XXX,XX +XXX,XX @@ | ||
145 | +/* | ||
146 | + * ARM TrustZone peripheral protection controller emulation | ||
147 | + * | ||
148 | + * Copyright (c) 2018 Linaro Limited | ||
149 | + * Written by Peter Maydell | ||
150 | + * | ||
151 | + * This program is free software; you can redistribute it and/or modify | ||
152 | + * it under the terms of the GNU General Public License version 2 or | ||
153 | + * (at your option) any later version. | ||
154 | + */ | ||
155 | + | ||
156 | +#include "qemu/osdep.h" | ||
157 | +#include "qemu/log.h" | ||
158 | +#include "qapi/error.h" | ||
159 | +#include "trace.h" | ||
160 | +#include "hw/sysbus.h" | ||
161 | +#include "hw/registerfields.h" | ||
162 | +#include "hw/misc/tz-ppc.h" | ||
163 | + | ||
164 | +static void tz_ppc_update_irq(TZPPC *s) | ||
165 | +{ | ||
166 | + bool level = s->irq_status && s->irq_enable; | ||
167 | + | ||
168 | + trace_tz_ppc_update_irq(level); | ||
169 | + qemu_set_irq(s->irq, level); | ||
170 | +} | ||
171 | + | ||
172 | +static void tz_ppc_cfg_nonsec(void *opaque, int n, int level) | ||
173 | +{ | ||
174 | + TZPPC *s = TZ_PPC(opaque); | ||
175 | + | ||
176 | + assert(n < TZ_NUM_PORTS); | ||
177 | + trace_tz_ppc_cfg_nonsec(n, level); | ||
178 | + s->cfg_nonsec[n] = level; | ||
179 | +} | ||
180 | + | ||
181 | +static void tz_ppc_cfg_ap(void *opaque, int n, int level) | ||
182 | +{ | ||
183 | + TZPPC *s = TZ_PPC(opaque); | ||
184 | + | ||
185 | + assert(n < TZ_NUM_PORTS); | ||
186 | + trace_tz_ppc_cfg_ap(n, level); | ||
187 | + s->cfg_ap[n] = level; | ||
188 | +} | ||
189 | + | ||
190 | +static void tz_ppc_cfg_sec_resp(void *opaque, int n, int level) | ||
191 | +{ | ||
192 | + TZPPC *s = TZ_PPC(opaque); | ||
193 | + | ||
194 | + trace_tz_ppc_cfg_sec_resp(level); | ||
195 | + s->cfg_sec_resp = level; | ||
196 | +} | ||
197 | + | ||
198 | +static void tz_ppc_irq_enable(void *opaque, int n, int level) | ||
199 | +{ | ||
200 | + TZPPC *s = TZ_PPC(opaque); | ||
201 | + | ||
202 | + trace_tz_ppc_irq_enable(level); | ||
203 | + s->irq_enable = level; | ||
204 | + tz_ppc_update_irq(s); | ||
205 | +} | ||
206 | + | ||
207 | +static void tz_ppc_irq_clear(void *opaque, int n, int level) | ||
208 | +{ | ||
209 | + TZPPC *s = TZ_PPC(opaque); | ||
210 | + | ||
211 | + trace_tz_ppc_irq_clear(level); | ||
212 | + | ||
213 | + s->irq_clear = level; | ||
214 | + if (level) { | ||
215 | + s->irq_status = false; | ||
216 | + tz_ppc_update_irq(s); | ||
217 | + } | ||
218 | +} | ||
219 | + | ||
220 | +static bool tz_ppc_check(TZPPC *s, int n, MemTxAttrs attrs) | ||
221 | +{ | ||
222 | + /* Check whether to allow an access to port n; return true if | ||
223 | + * the check passes, and false if the transaction must be blocked. | ||
224 | + * If the latter, the caller must check cfg_sec_resp to determine | ||
225 | + * whether to abort or RAZ/WI the transaction. | ||
226 | + * The checks are: | ||
227 | + * + nonsec_mask suppresses any check of the secure attribute | ||
228 | + * + otherwise, block if cfg_nonsec is 1 and transaction is secure, | ||
229 | + * or if cfg_nonsec is 0 and transaction is non-secure | ||
230 | + * + block if transaction is usermode and cfg_ap is 0 | ||
231 | + */ | ||
232 | + if ((attrs.secure == s->cfg_nonsec[n] && !(s->nonsec_mask & (1 << n))) || | ||
233 | + (attrs.user && !s->cfg_ap[n])) { | ||
234 | + /* Block the transaction. */ | ||
235 | + if (!s->irq_clear) { | ||
236 | + /* Note that holding irq_clear high suppresses interrupts */ | ||
237 | + s->irq_status = true; | ||
238 | + tz_ppc_update_irq(s); | ||
239 | + } | ||
240 | + return false; | ||
241 | + } | ||
242 | + return true; | ||
243 | +} | ||
244 | + | ||
245 | +static MemTxResult tz_ppc_read(void *opaque, hwaddr addr, uint64_t *pdata, | ||
246 | + unsigned size, MemTxAttrs attrs) | ||
247 | +{ | ||
248 | + TZPPCPort *p = opaque; | ||
249 | + TZPPC *s = p->ppc; | ||
250 | + int n = p - s->port; | ||
251 | + AddressSpace *as = &p->downstream_as; | ||
252 | + uint64_t data; | ||
253 | + MemTxResult res; | ||
254 | + | ||
255 | + if (!tz_ppc_check(s, n, attrs)) { | ||
256 | + trace_tz_ppc_read_blocked(n, addr, attrs.secure, attrs.user); | ||
257 | + if (s->cfg_sec_resp) { | ||
258 | + return MEMTX_ERROR; | ||
259 | + } else { | ||
260 | + *pdata = 0; | ||
261 | + return MEMTX_OK; | ||
262 | + } | ||
263 | + } | ||
264 | + | ||
265 | + switch (size) { | ||
266 | + case 1: | ||
267 | + data = address_space_ldub(as, addr, attrs, &res); | ||
268 | + break; | ||
269 | + case 2: | ||
270 | + data = address_space_lduw_le(as, addr, attrs, &res); | ||
271 | + break; | ||
272 | + case 4: | ||
273 | + data = address_space_ldl_le(as, addr, attrs, &res); | ||
274 | + break; | ||
275 | + case 8: | ||
276 | + data = address_space_ldq_le(as, addr, attrs, &res); | ||
277 | + break; | ||
278 | + default: | ||
279 | + g_assert_not_reached(); | ||
280 | + } | ||
281 | + *pdata = data; | ||
282 | + return res; | ||
283 | +} | ||
284 | + | ||
285 | +static MemTxResult tz_ppc_write(void *opaque, hwaddr addr, uint64_t val, | ||
286 | + unsigned size, MemTxAttrs attrs) | ||
287 | +{ | ||
288 | + TZPPCPort *p = opaque; | ||
289 | + TZPPC *s = p->ppc; | ||
290 | + AddressSpace *as = &p->downstream_as; | ||
291 | + int n = p - s->port; | ||
292 | + MemTxResult res; | ||
293 | + | ||
294 | + if (!tz_ppc_check(s, n, attrs)) { | ||
295 | + trace_tz_ppc_write_blocked(n, addr, attrs.secure, attrs.user); | ||
296 | + if (s->cfg_sec_resp) { | ||
297 | + return MEMTX_ERROR; | ||
298 | + } else { | ||
299 | + return MEMTX_OK; | ||
300 | + } | ||
301 | + } | ||
302 | + | ||
303 | + switch (size) { | ||
304 | + case 1: | ||
305 | + address_space_stb(as, addr, val, attrs, &res); | ||
306 | + break; | ||
307 | + case 2: | ||
308 | + address_space_stw_le(as, addr, val, attrs, &res); | ||
309 | + break; | ||
310 | + case 4: | ||
311 | + address_space_stl_le(as, addr, val, attrs, &res); | ||
312 | + break; | ||
313 | + case 8: | ||
314 | + address_space_stq_le(as, addr, val, attrs, &res); | ||
315 | + break; | ||
316 | + default: | ||
317 | + g_assert_not_reached(); | ||
318 | + } | ||
319 | + return res; | ||
320 | +} | ||
321 | + | ||
322 | +static const MemoryRegionOps tz_ppc_ops = { | ||
323 | + .read_with_attrs = tz_ppc_read, | ||
324 | + .write_with_attrs = tz_ppc_write, | ||
325 | + .endianness = DEVICE_LITTLE_ENDIAN, | ||
326 | +}; | ||
327 | + | ||
328 | +static void tz_ppc_reset(DeviceState *dev) | ||
329 | +{ | ||
330 | + TZPPC *s = TZ_PPC(dev); | ||
331 | + | ||
332 | + trace_tz_ppc_reset(); | ||
333 | + s->cfg_sec_resp = false; | ||
334 | + memset(s->cfg_nonsec, 0, sizeof(s->cfg_nonsec)); | ||
335 | + memset(s->cfg_ap, 0, sizeof(s->cfg_ap)); | ||
336 | +} | ||
337 | + | ||
338 | +static void tz_ppc_init(Object *obj) | ||
339 | +{ | ||
340 | + DeviceState *dev = DEVICE(obj); | ||
341 | + TZPPC *s = TZ_PPC(obj); | ||
342 | + | ||
343 | + qdev_init_gpio_in_named(dev, tz_ppc_cfg_nonsec, "cfg_nonsec", TZ_NUM_PORTS); | ||
344 | + qdev_init_gpio_in_named(dev, tz_ppc_cfg_ap, "cfg_ap", TZ_NUM_PORTS); | ||
345 | + qdev_init_gpio_in_named(dev, tz_ppc_cfg_sec_resp, "cfg_sec_resp", 1); | ||
346 | + qdev_init_gpio_in_named(dev, tz_ppc_irq_enable, "irq_enable", 1); | ||
347 | + qdev_init_gpio_in_named(dev, tz_ppc_irq_clear, "irq_clear", 1); | ||
348 | + qdev_init_gpio_out_named(dev, &s->irq, "irq", 1); | ||
349 | +} | ||
350 | + | ||
351 | +static void tz_ppc_realize(DeviceState *dev, Error **errp) | ||
352 | +{ | ||
353 | + Object *obj = OBJECT(dev); | ||
354 | + SysBusDevice *sbd = SYS_BUS_DEVICE(dev); | ||
355 | + TZPPC *s = TZ_PPC(dev); | ||
356 | + int i; | ||
357 | + | ||
358 | + /* We can't create the upstream end of the port until realize, | ||
359 | + * as we don't know the size of the MR used as the downstream until then. | ||
360 | + */ | ||
361 | + for (i = 0; i < TZ_NUM_PORTS; i++) { | ||
362 | + TZPPCPort *port = &s->port[i]; | ||
363 | + char *name; | ||
364 | + uint64_t size; | ||
365 | + | ||
366 | + if (!port->downstream) { | ||
367 | + continue; | ||
368 | + } | ||
369 | + | ||
370 | + name = g_strdup_printf("tz-ppc-port[%d]", i); | ||
371 | + | ||
372 | + port->ppc = s; | ||
373 | + address_space_init(&port->downstream_as, port->downstream, name); | ||
374 | + | ||
375 | + size = memory_region_size(port->downstream); | ||
376 | + memory_region_init_io(&port->upstream, obj, &tz_ppc_ops, | ||
377 | + port, name, size); | ||
378 | + sysbus_init_mmio(sbd, &port->upstream); | ||
379 | + g_free(name); | ||
380 | + } | ||
381 | +} | ||
382 | + | ||
383 | +static const VMStateDescription tz_ppc_vmstate = { | ||
384 | + .name = "tz-ppc", | ||
385 | + .version_id = 1, | ||
386 | + .minimum_version_id = 1, | ||
387 | + .fields = (VMStateField[]) { | ||
388 | + VMSTATE_BOOL_ARRAY(cfg_nonsec, TZPPC, 16), | ||
389 | + VMSTATE_BOOL_ARRAY(cfg_ap, TZPPC, 16), | ||
390 | + VMSTATE_BOOL(cfg_sec_resp, TZPPC), | ||
391 | + VMSTATE_BOOL(irq_enable, TZPPC), | ||
392 | + VMSTATE_BOOL(irq_clear, TZPPC), | ||
393 | + VMSTATE_BOOL(irq_status, TZPPC), | ||
394 | + VMSTATE_END_OF_LIST() | ||
395 | + } | ||
396 | +}; | ||
397 | + | ||
398 | +#define DEFINE_PORT(N) \ | ||
399 | + DEFINE_PROP_LINK("port[" #N "]", TZPPC, port[N].downstream, \ | ||
400 | + TYPE_MEMORY_REGION, MemoryRegion *) | ||
401 | + | ||
402 | +static Property tz_ppc_properties[] = { | ||
403 | + DEFINE_PROP_UINT32("NONSEC_MASK", TZPPC, nonsec_mask, 0), | ||
404 | + DEFINE_PORT(0), | ||
405 | + DEFINE_PORT(1), | ||
406 | + DEFINE_PORT(2), | ||
407 | + DEFINE_PORT(3), | ||
408 | + DEFINE_PORT(4), | ||
409 | + DEFINE_PORT(5), | ||
410 | + DEFINE_PORT(6), | ||
411 | + DEFINE_PORT(7), | ||
412 | + DEFINE_PORT(8), | ||
413 | + DEFINE_PORT(9), | ||
414 | + DEFINE_PORT(10), | ||
415 | + DEFINE_PORT(11), | ||
416 | + DEFINE_PORT(12), | ||
417 | + DEFINE_PORT(13), | ||
418 | + DEFINE_PORT(14), | ||
419 | + DEFINE_PORT(15), | ||
420 | + DEFINE_PROP_END_OF_LIST(), | ||
421 | +}; | ||
422 | + | ||
423 | +static void tz_ppc_class_init(ObjectClass *klass, void *data) | ||
424 | +{ | ||
425 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
426 | + | ||
427 | + dc->realize = tz_ppc_realize; | ||
428 | + dc->vmsd = &tz_ppc_vmstate; | ||
429 | + dc->reset = tz_ppc_reset; | ||
430 | + dc->props = tz_ppc_properties; | ||
431 | +} | ||
432 | + | ||
433 | +static const TypeInfo tz_ppc_info = { | ||
434 | + .name = TYPE_TZ_PPC, | ||
435 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
436 | + .instance_size = sizeof(TZPPC), | ||
437 | + .instance_init = tz_ppc_init, | ||
438 | + .class_init = tz_ppc_class_init, | ||
439 | +}; | ||
440 | + | ||
441 | +static void tz_ppc_register_types(void) | ||
442 | +{ | ||
443 | + type_register_static(&tz_ppc_info); | ||
444 | +} | ||
445 | + | ||
446 | +type_init(tz_ppc_register_types); | ||
55 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak | 447 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak |
56 | index XXXXXXX..XXXXXXX 100644 | 448 | index XXXXXXX..XXXXXXX 100644 |
57 | --- a/default-configs/arm-softmmu.mak | 449 | --- a/default-configs/arm-softmmu.mak |
58 | +++ b/default-configs/arm-softmmu.mak | 450 | +++ b/default-configs/arm-softmmu.mak |
59 | @@ -XXX,XX +XXX,XX @@ CONFIG_STELLARIS_INPUT=y | 451 | @@ -XXX,XX +XXX,XX @@ CONFIG_CMSDK_APB_UART=y |
60 | CONFIG_STELLARIS_ENET=y | 452 | CONFIG_MPS2_FPGAIO=y |
61 | CONFIG_SSD0303=y | 453 | CONFIG_MPS2_SCC=y |
62 | CONFIG_SSD0323=y | 454 | |
63 | +CONFIG_DDC=y | 455 | +CONFIG_TZ_PPC=y |
64 | +CONFIG_SII9022=y | 456 | + |
65 | CONFIG_ADS7846=y | 457 | CONFIG_VERSATILE_PCI=y |
66 | CONFIG_MAX111X=y | 458 | CONFIG_VERSATILE_I2C=y |
67 | CONFIG_SSI=y | 459 | |
460 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events | ||
461 | index XXXXXXX..XXXXXXX 100644 | ||
462 | --- a/hw/misc/trace-events | ||
463 | +++ b/hw/misc/trace-events | ||
464 | @@ -XXX,XX +XXX,XX @@ mos6522_get_next_irq_time(uint16_t latch, int64_t d, int64_t delta) "latch=%d co | ||
465 | mos6522_set_sr_int(void) "set sr_int" | ||
466 | mos6522_write(uint64_t addr, uint64_t val) "reg=0x%"PRIx64 " val=0x%"PRIx64 | ||
467 | mos6522_read(uint64_t addr, unsigned val) "reg=0x%"PRIx64 " val=0x%x" | ||
468 | + | ||
469 | +# hw/misc/tz-ppc.c | ||
470 | +tz_ppc_reset(void) "TZ PPC: reset" | ||
471 | +tz_ppc_cfg_nonsec(int n, int level) "TZ PPC: cfg_nonsec[%d] = %d" | ||
472 | +tz_ppc_cfg_ap(int n, int level) "TZ PPC: cfg_ap[%d] = %d" | ||
473 | +tz_ppc_cfg_sec_resp(int level) "TZ PPC: cfg_sec_resp = %d" | ||
474 | +tz_ppc_irq_enable(int level) "TZ PPC: int_enable = %d" | ||
475 | +tz_ppc_irq_clear(int level) "TZ PPC: int_clear = %d" | ||
476 | +tz_ppc_update_irq(int level) "TZ PPC: setting irq line to %d" | ||
477 | +tz_ppc_read_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " read (secure %d user %d) blocked" | ||
478 | +tz_ppc_write_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " write (secure %d user %d) blocked" | ||
68 | -- | 479 | -- |
69 | 2.16.2 | 480 | 2.16.2 |
70 | 481 | ||
71 | 482 | diff view generated by jsdifflib |
1 | From: Linus Walleij <linus.walleij@linaro.org> | 1 | The Arm IoT Kit includes a "security controller" which is largely a |
---|---|---|---|
2 | collection of registers for controlling the PPCs and other bits of | ||
3 | glue in the system. This commit provides the initial skeleton of the | ||
4 | device, implementing just the ID registers, and a couple of read-only | ||
5 | read-as-zero registers. | ||
2 | 6 | ||
3 | This adds support for emulating the Silicon Image SII9022 DVI/HDMI | 7 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | bridge. It's not very clever right now, it just acknowledges | 8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | the switch into DDC I2C mode and back. Combining this with the | 9 | Message-id: 20180220180325.29818-16-peter.maydell@linaro.org |
6 | existing DDC I2C emulation gives the right behavior on the Versatile | 10 | --- |
7 | Express emulation passing through the QEMU EDID to the emulated | 11 | hw/misc/Makefile.objs | 1 + |
8 | platform. | 12 | include/hw/misc/iotkit-secctl.h | 39 ++++ |
13 | hw/misc/iotkit-secctl.c | 448 ++++++++++++++++++++++++++++++++++++++++ | ||
14 | default-configs/arm-softmmu.mak | 1 + | ||
15 | hw/misc/trace-events | 7 + | ||
16 | 5 files changed, 496 insertions(+) | ||
17 | create mode 100644 include/hw/misc/iotkit-secctl.h | ||
18 | create mode 100644 hw/misc/iotkit-secctl.c | ||
9 | 19 | ||
10 | Cc: Peter Maydell <peter.maydell@linaro.org> | 20 | diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs |
11 | Signed-off-by: Linus Walleij <linus.walleij@linaro.org> | ||
12 | Message-id: 20180227104903.21353-5-linus.walleij@linaro.org | ||
13 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
14 | [PMM: explictly reset ddc_req/ddc_skip_finish/ddc] | ||
15 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
16 | --- | ||
17 | hw/display/Makefile.objs | 1 + | ||
18 | hw/display/sii9022.c | 191 +++++++++++++++++++++++++++++++++++++++++++++++ | ||
19 | hw/display/trace-events | 5 ++ | ||
20 | 3 files changed, 197 insertions(+) | ||
21 | create mode 100644 hw/display/sii9022.c | ||
22 | |||
23 | diff --git a/hw/display/Makefile.objs b/hw/display/Makefile.objs | ||
24 | index XXXXXXX..XXXXXXX 100644 | 21 | index XXXXXXX..XXXXXXX 100644 |
25 | --- a/hw/display/Makefile.objs | 22 | --- a/hw/misc/Makefile.objs |
26 | +++ b/hw/display/Makefile.objs | 23 | +++ b/hw/misc/Makefile.objs |
27 | @@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_VGA_CIRRUS) += cirrus_vga.o | 24 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o |
28 | common-obj-$(CONFIG_G364FB) += g364fb.o | 25 | obj-$(CONFIG_MPS2_SCC) += mps2-scc.o |
29 | common-obj-$(CONFIG_JAZZ_LED) += jazz_led.o | 26 | |
30 | common-obj-$(CONFIG_PL110) += pl110.o | 27 | obj-$(CONFIG_TZ_PPC) += tz-ppc.o |
31 | +common-obj-$(CONFIG_SII9022) += sii9022.o | 28 | +obj-$(CONFIG_IOTKIT_SECCTL) += iotkit-secctl.o |
32 | common-obj-$(CONFIG_SSD0303) += ssd0303.o | 29 | |
33 | common-obj-$(CONFIG_SSD0323) += ssd0323.o | 30 | obj-$(CONFIG_PVPANIC) += pvpanic.o |
34 | common-obj-$(CONFIG_XEN) += xenfb.o | 31 | obj-$(CONFIG_HYPERV_TESTDEV) += hyperv_testdev.o |
35 | diff --git a/hw/display/sii9022.c b/hw/display/sii9022.c | 32 | diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h |
36 | new file mode 100644 | 33 | new file mode 100644 |
37 | index XXXXXXX..XXXXXXX | 34 | index XXXXXXX..XXXXXXX |
38 | --- /dev/null | 35 | --- /dev/null |
39 | +++ b/hw/display/sii9022.c | 36 | +++ b/include/hw/misc/iotkit-secctl.h |
40 | @@ -XXX,XX +XXX,XX @@ | 37 | @@ -XXX,XX +XXX,XX @@ |
41 | +/* | 38 | +/* |
42 | + * Silicon Image SiI9022 | 39 | + * ARM IoT Kit security controller |
43 | + * | 40 | + * |
44 | + * This is a pretty hollow emulation: all we do is acknowledge that we | 41 | + * Copyright (c) 2018 Linaro Limited |
45 | + * exist (chip ID) and confirm that we get switched over into DDC mode | 42 | + * Written by Peter Maydell |
46 | + * so the emulated host can proceed to read out EDID data. All subsequent | ||
47 | + * set-up of connectors etc will be acknowledged and ignored. | ||
48 | + * | 43 | + * |
49 | + * Copyright (C) 2018 Linus Walleij | 44 | + * This program is free software; you can redistribute it and/or modify |
45 | + * it under the terms of the GNU General Public License version 2 or | ||
46 | + * (at your option) any later version. | ||
47 | + */ | ||
48 | + | ||
49 | +/* This is a model of the security controller which is part of the | ||
50 | + * Arm IoT Kit and documented in | ||
51 | + * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html | ||
50 | + * | 52 | + * |
51 | + * This work is licensed under the terms of the GNU GPL, version 2 or later. | 53 | + * QEMU interface: |
52 | + * See the COPYING file in the top-level directory. | 54 | + * + sysbus MMIO region 0 is the "secure privilege control block" registers |
53 | + * SPDX-License-Identifier: GPL-2.0-or-later | 55 | + * + sysbus MMIO region 1 is the "non-secure privilege control block" registers |
54 | + */ | 56 | + */ |
55 | + | 57 | + |
58 | +#ifndef IOTKIT_SECCTL_H | ||
59 | +#define IOTKIT_SECCTL_H | ||
60 | + | ||
61 | +#include "hw/sysbus.h" | ||
62 | + | ||
63 | +#define TYPE_IOTKIT_SECCTL "iotkit-secctl" | ||
64 | +#define IOTKIT_SECCTL(obj) OBJECT_CHECK(IoTKitSecCtl, (obj), TYPE_IOTKIT_SECCTL) | ||
65 | + | ||
66 | +typedef struct IoTKitSecCtl { | ||
67 | + /*< private >*/ | ||
68 | + SysBusDevice parent_obj; | ||
69 | + | ||
70 | + /*< public >*/ | ||
71 | + | ||
72 | + MemoryRegion s_regs; | ||
73 | + MemoryRegion ns_regs; | ||
74 | +} IoTKitSecCtl; | ||
75 | + | ||
76 | +#endif | ||
77 | diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c | ||
78 | new file mode 100644 | ||
79 | index XXXXXXX..XXXXXXX | ||
80 | --- /dev/null | ||
81 | +++ b/hw/misc/iotkit-secctl.c | ||
82 | @@ -XXX,XX +XXX,XX @@ | ||
83 | +/* | ||
84 | + * Arm IoT Kit security controller | ||
85 | + * | ||
86 | + * Copyright (c) 2018 Linaro Limited | ||
87 | + * Written by Peter Maydell | ||
88 | + * | ||
89 | + * This program is free software; you can redistribute it and/or modify | ||
90 | + * it under the terms of the GNU General Public License version 2 or | ||
91 | + * (at your option) any later version. | ||
92 | + */ | ||
93 | + | ||
56 | +#include "qemu/osdep.h" | 94 | +#include "qemu/osdep.h" |
57 | +#include "qemu-common.h" | 95 | +#include "qemu/log.h" |
58 | +#include "hw/i2c/i2c.h" | 96 | +#include "qapi/error.h" |
59 | +#include "hw/i2c/i2c-ddc.h" | ||
60 | +#include "trace.h" | 97 | +#include "trace.h" |
61 | + | 98 | +#include "hw/sysbus.h" |
62 | +#define SII9022_SYS_CTRL_DATA 0x1a | 99 | +#include "hw/registerfields.h" |
63 | +#define SII9022_SYS_CTRL_PWR_DWN 0x10 | 100 | +#include "hw/misc/iotkit-secctl.h" |
64 | +#define SII9022_SYS_CTRL_AV_MUTE 0x08 | 101 | + |
65 | +#define SII9022_SYS_CTRL_DDC_BUS_REQ 0x04 | 102 | +/* Registers in the secure privilege control block */ |
66 | +#define SII9022_SYS_CTRL_DDC_BUS_GRTD 0x02 | 103 | +REG32(SECRESPCFG, 0x10) |
67 | +#define SII9022_SYS_CTRL_OUTPUT_MODE 0x01 | 104 | +REG32(NSCCFG, 0x14) |
68 | +#define SII9022_SYS_CTRL_OUTPUT_HDMI 1 | 105 | +REG32(SECMPCINTSTATUS, 0x1c) |
69 | +#define SII9022_SYS_CTRL_OUTPUT_DVI 0 | 106 | +REG32(SECPPCINTSTAT, 0x20) |
70 | +#define SII9022_REG_CHIPID 0x1b | 107 | +REG32(SECPPCINTCLR, 0x24) |
71 | +#define SII9022_INT_ENABLE 0x3c | 108 | +REG32(SECPPCINTEN, 0x28) |
72 | +#define SII9022_INT_STATUS 0x3d | 109 | +REG32(SECMSCINTSTAT, 0x30) |
73 | +#define SII9022_INT_STATUS_HOTPLUG 0x01; | 110 | +REG32(SECMSCINTCLR, 0x34) |
74 | +#define SII9022_INT_STATUS_PLUGGED 0x04; | 111 | +REG32(SECMSCINTEN, 0x38) |
75 | + | 112 | +REG32(BRGINTSTAT, 0x40) |
76 | +#define TYPE_SII9022 "sii9022" | 113 | +REG32(BRGINTCLR, 0x44) |
77 | +#define SII9022(obj) OBJECT_CHECK(sii9022_state, (obj), TYPE_SII9022) | 114 | +REG32(BRGINTEN, 0x48) |
78 | + | 115 | +REG32(AHBNSPPC0, 0x50) |
79 | +typedef struct sii9022_state { | 116 | +REG32(AHBNSPPCEXP0, 0x60) |
80 | + I2CSlave parent_obj; | 117 | +REG32(AHBNSPPCEXP1, 0x64) |
81 | + uint8_t ptr; | 118 | +REG32(AHBNSPPCEXP2, 0x68) |
82 | + bool addr_byte; | 119 | +REG32(AHBNSPPCEXP3, 0x6c) |
83 | + bool ddc_req; | 120 | +REG32(APBNSPPC0, 0x70) |
84 | + bool ddc_skip_finish; | 121 | +REG32(APBNSPPC1, 0x74) |
85 | + bool ddc; | 122 | +REG32(APBNSPPCEXP0, 0x80) |
86 | +} sii9022_state; | 123 | +REG32(APBNSPPCEXP1, 0x84) |
87 | + | 124 | +REG32(APBNSPPCEXP2, 0x88) |
88 | +static const VMStateDescription vmstate_sii9022 = { | 125 | +REG32(APBNSPPCEXP3, 0x8c) |
89 | + .name = "sii9022", | 126 | +REG32(AHBSPPPC0, 0x90) |
127 | +REG32(AHBSPPPCEXP0, 0xa0) | ||
128 | +REG32(AHBSPPPCEXP1, 0xa4) | ||
129 | +REG32(AHBSPPPCEXP2, 0xa8) | ||
130 | +REG32(AHBSPPPCEXP3, 0xac) | ||
131 | +REG32(APBSPPPC0, 0xb0) | ||
132 | +REG32(APBSPPPC1, 0xb4) | ||
133 | +REG32(APBSPPPCEXP0, 0xc0) | ||
134 | +REG32(APBSPPPCEXP1, 0xc4) | ||
135 | +REG32(APBSPPPCEXP2, 0xc8) | ||
136 | +REG32(APBSPPPCEXP3, 0xcc) | ||
137 | +REG32(NSMSCEXP, 0xd0) | ||
138 | +REG32(PID4, 0xfd0) | ||
139 | +REG32(PID5, 0xfd4) | ||
140 | +REG32(PID6, 0xfd8) | ||
141 | +REG32(PID7, 0xfdc) | ||
142 | +REG32(PID0, 0xfe0) | ||
143 | +REG32(PID1, 0xfe4) | ||
144 | +REG32(PID2, 0xfe8) | ||
145 | +REG32(PID3, 0xfec) | ||
146 | +REG32(CID0, 0xff0) | ||
147 | +REG32(CID1, 0xff4) | ||
148 | +REG32(CID2, 0xff8) | ||
149 | +REG32(CID3, 0xffc) | ||
150 | + | ||
151 | +/* Registers in the non-secure privilege control block */ | ||
152 | +REG32(AHBNSPPPC0, 0x90) | ||
153 | +REG32(AHBNSPPPCEXP0, 0xa0) | ||
154 | +REG32(AHBNSPPPCEXP1, 0xa4) | ||
155 | +REG32(AHBNSPPPCEXP2, 0xa8) | ||
156 | +REG32(AHBNSPPPCEXP3, 0xac) | ||
157 | +REG32(APBNSPPPC0, 0xb0) | ||
158 | +REG32(APBNSPPPC1, 0xb4) | ||
159 | +REG32(APBNSPPPCEXP0, 0xc0) | ||
160 | +REG32(APBNSPPPCEXP1, 0xc4) | ||
161 | +REG32(APBNSPPPCEXP2, 0xc8) | ||
162 | +REG32(APBNSPPPCEXP3, 0xcc) | ||
163 | +/* PID and CID registers are also present in the NS block */ | ||
164 | + | ||
165 | +static const uint8_t iotkit_secctl_s_idregs[] = { | ||
166 | + 0x04, 0x00, 0x00, 0x00, | ||
167 | + 0x52, 0xb8, 0x0b, 0x00, | ||
168 | + 0x0d, 0xf0, 0x05, 0xb1, | ||
169 | +}; | ||
170 | + | ||
171 | +static const uint8_t iotkit_secctl_ns_idregs[] = { | ||
172 | + 0x04, 0x00, 0x00, 0x00, | ||
173 | + 0x53, 0xb8, 0x0b, 0x00, | ||
174 | + 0x0d, 0xf0, 0x05, 0xb1, | ||
175 | +}; | ||
176 | + | ||
177 | +static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
178 | + uint64_t *pdata, | ||
179 | + unsigned size, MemTxAttrs attrs) | ||
180 | +{ | ||
181 | + uint64_t r; | ||
182 | + uint32_t offset = addr & ~0x3; | ||
183 | + | ||
184 | + switch (offset) { | ||
185 | + case A_AHBNSPPC0: | ||
186 | + case A_AHBSPPPC0: | ||
187 | + r = 0; | ||
188 | + break; | ||
189 | + case A_SECRESPCFG: | ||
190 | + case A_NSCCFG: | ||
191 | + case A_SECMPCINTSTATUS: | ||
192 | + case A_SECPPCINTSTAT: | ||
193 | + case A_SECPPCINTEN: | ||
194 | + case A_SECMSCINTSTAT: | ||
195 | + case A_SECMSCINTEN: | ||
196 | + case A_BRGINTSTAT: | ||
197 | + case A_BRGINTEN: | ||
198 | + case A_AHBNSPPCEXP0: | ||
199 | + case A_AHBNSPPCEXP1: | ||
200 | + case A_AHBNSPPCEXP2: | ||
201 | + case A_AHBNSPPCEXP3: | ||
202 | + case A_APBNSPPC0: | ||
203 | + case A_APBNSPPC1: | ||
204 | + case A_APBNSPPCEXP0: | ||
205 | + case A_APBNSPPCEXP1: | ||
206 | + case A_APBNSPPCEXP2: | ||
207 | + case A_APBNSPPCEXP3: | ||
208 | + case A_AHBSPPPCEXP0: | ||
209 | + case A_AHBSPPPCEXP1: | ||
210 | + case A_AHBSPPPCEXP2: | ||
211 | + case A_AHBSPPPCEXP3: | ||
212 | + case A_APBSPPPC0: | ||
213 | + case A_APBSPPPC1: | ||
214 | + case A_APBSPPPCEXP0: | ||
215 | + case A_APBSPPPCEXP1: | ||
216 | + case A_APBSPPPCEXP2: | ||
217 | + case A_APBSPPPCEXP3: | ||
218 | + case A_NSMSCEXP: | ||
219 | + qemu_log_mask(LOG_UNIMP, | ||
220 | + "IoTKit SecCtl S block read: " | ||
221 | + "unimplemented offset 0x%x\n", offset); | ||
222 | + r = 0; | ||
223 | + break; | ||
224 | + case A_PID4: | ||
225 | + case A_PID5: | ||
226 | + case A_PID6: | ||
227 | + case A_PID7: | ||
228 | + case A_PID0: | ||
229 | + case A_PID1: | ||
230 | + case A_PID2: | ||
231 | + case A_PID3: | ||
232 | + case A_CID0: | ||
233 | + case A_CID1: | ||
234 | + case A_CID2: | ||
235 | + case A_CID3: | ||
236 | + r = iotkit_secctl_s_idregs[(offset - A_PID4) / 4]; | ||
237 | + break; | ||
238 | + case A_SECPPCINTCLR: | ||
239 | + case A_SECMSCINTCLR: | ||
240 | + case A_BRGINTCLR: | ||
241 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
242 | + "IotKit SecCtl S block read: write-only offset 0x%x\n", | ||
243 | + offset); | ||
244 | + r = 0; | ||
245 | + break; | ||
246 | + default: | ||
247 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
248 | + "IotKit SecCtl S block read: bad offset 0x%x\n", offset); | ||
249 | + r = 0; | ||
250 | + break; | ||
251 | + } | ||
252 | + | ||
253 | + if (size != 4) { | ||
254 | + /* None of our registers are access-sensitive, so just pull the right | ||
255 | + * byte out of the word read result. | ||
256 | + */ | ||
257 | + r = extract32(r, (addr & 3) * 8, size * 8); | ||
258 | + } | ||
259 | + | ||
260 | + trace_iotkit_secctl_s_read(offset, r, size); | ||
261 | + *pdata = r; | ||
262 | + return MEMTX_OK; | ||
263 | +} | ||
264 | + | ||
265 | +static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
266 | + uint64_t value, | ||
267 | + unsigned size, MemTxAttrs attrs) | ||
268 | +{ | ||
269 | + uint32_t offset = addr; | ||
270 | + | ||
271 | + trace_iotkit_secctl_s_write(offset, value, size); | ||
272 | + | ||
273 | + if (size != 4) { | ||
274 | + /* Byte and halfword writes are ignored */ | ||
275 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
276 | + "IotKit SecCtl S block write: bad size, ignored\n"); | ||
277 | + return MEMTX_OK; | ||
278 | + } | ||
279 | + | ||
280 | + switch (offset) { | ||
281 | + case A_SECRESPCFG: | ||
282 | + case A_NSCCFG: | ||
283 | + case A_SECPPCINTCLR: | ||
284 | + case A_SECPPCINTEN: | ||
285 | + case A_SECMSCINTCLR: | ||
286 | + case A_SECMSCINTEN: | ||
287 | + case A_BRGINTCLR: | ||
288 | + case A_BRGINTEN: | ||
289 | + case A_AHBNSPPCEXP0: | ||
290 | + case A_AHBNSPPCEXP1: | ||
291 | + case A_AHBNSPPCEXP2: | ||
292 | + case A_AHBNSPPCEXP3: | ||
293 | + case A_APBNSPPC0: | ||
294 | + case A_APBNSPPC1: | ||
295 | + case A_APBNSPPCEXP0: | ||
296 | + case A_APBNSPPCEXP1: | ||
297 | + case A_APBNSPPCEXP2: | ||
298 | + case A_APBNSPPCEXP3: | ||
299 | + case A_AHBSPPPCEXP0: | ||
300 | + case A_AHBSPPPCEXP1: | ||
301 | + case A_AHBSPPPCEXP2: | ||
302 | + case A_AHBSPPPCEXP3: | ||
303 | + case A_APBSPPPC0: | ||
304 | + case A_APBSPPPC1: | ||
305 | + case A_APBSPPPCEXP0: | ||
306 | + case A_APBSPPPCEXP1: | ||
307 | + case A_APBSPPPCEXP2: | ||
308 | + case A_APBSPPPCEXP3: | ||
309 | + qemu_log_mask(LOG_UNIMP, | ||
310 | + "IoTKit SecCtl S block write: " | ||
311 | + "unimplemented offset 0x%x\n", offset); | ||
312 | + break; | ||
313 | + case A_SECMPCINTSTATUS: | ||
314 | + case A_SECPPCINTSTAT: | ||
315 | + case A_SECMSCINTSTAT: | ||
316 | + case A_BRGINTSTAT: | ||
317 | + case A_AHBNSPPC0: | ||
318 | + case A_AHBSPPPC0: | ||
319 | + case A_NSMSCEXP: | ||
320 | + case A_PID4: | ||
321 | + case A_PID5: | ||
322 | + case A_PID6: | ||
323 | + case A_PID7: | ||
324 | + case A_PID0: | ||
325 | + case A_PID1: | ||
326 | + case A_PID2: | ||
327 | + case A_PID3: | ||
328 | + case A_CID0: | ||
329 | + case A_CID1: | ||
330 | + case A_CID2: | ||
331 | + case A_CID3: | ||
332 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
333 | + "IoTKit SecCtl S block write: " | ||
334 | + "read-only offset 0x%x\n", offset); | ||
335 | + break; | ||
336 | + default: | ||
337 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
338 | + "IotKit SecCtl S block write: bad offset 0x%x\n", | ||
339 | + offset); | ||
340 | + break; | ||
341 | + } | ||
342 | + | ||
343 | + return MEMTX_OK; | ||
344 | +} | ||
345 | + | ||
346 | +static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr, | ||
347 | + uint64_t *pdata, | ||
348 | + unsigned size, MemTxAttrs attrs) | ||
349 | +{ | ||
350 | + uint64_t r; | ||
351 | + uint32_t offset = addr & ~0x3; | ||
352 | + | ||
353 | + switch (offset) { | ||
354 | + case A_AHBNSPPPC0: | ||
355 | + r = 0; | ||
356 | + break; | ||
357 | + case A_AHBNSPPPCEXP0: | ||
358 | + case A_AHBNSPPPCEXP1: | ||
359 | + case A_AHBNSPPPCEXP2: | ||
360 | + case A_AHBNSPPPCEXP3: | ||
361 | + case A_APBNSPPPC0: | ||
362 | + case A_APBNSPPPC1: | ||
363 | + case A_APBNSPPPCEXP0: | ||
364 | + case A_APBNSPPPCEXP1: | ||
365 | + case A_APBNSPPPCEXP2: | ||
366 | + case A_APBNSPPPCEXP3: | ||
367 | + qemu_log_mask(LOG_UNIMP, | ||
368 | + "IoTKit SecCtl NS block read: " | ||
369 | + "unimplemented offset 0x%x\n", offset); | ||
370 | + break; | ||
371 | + case A_PID4: | ||
372 | + case A_PID5: | ||
373 | + case A_PID6: | ||
374 | + case A_PID7: | ||
375 | + case A_PID0: | ||
376 | + case A_PID1: | ||
377 | + case A_PID2: | ||
378 | + case A_PID3: | ||
379 | + case A_CID0: | ||
380 | + case A_CID1: | ||
381 | + case A_CID2: | ||
382 | + case A_CID3: | ||
383 | + r = iotkit_secctl_ns_idregs[(offset - A_PID4) / 4]; | ||
384 | + break; | ||
385 | + default: | ||
386 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
387 | + "IotKit SecCtl NS block write: bad offset 0x%x\n", | ||
388 | + offset); | ||
389 | + r = 0; | ||
390 | + break; | ||
391 | + } | ||
392 | + | ||
393 | + if (size != 4) { | ||
394 | + /* None of our registers are access-sensitive, so just pull the right | ||
395 | + * byte out of the word read result. | ||
396 | + */ | ||
397 | + r = extract32(r, (addr & 3) * 8, size * 8); | ||
398 | + } | ||
399 | + | ||
400 | + trace_iotkit_secctl_ns_read(offset, r, size); | ||
401 | + *pdata = r; | ||
402 | + return MEMTX_OK; | ||
403 | +} | ||
404 | + | ||
405 | +static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr, | ||
406 | + uint64_t value, | ||
407 | + unsigned size, MemTxAttrs attrs) | ||
408 | +{ | ||
409 | + uint32_t offset = addr; | ||
410 | + | ||
411 | + trace_iotkit_secctl_ns_write(offset, value, size); | ||
412 | + | ||
413 | + if (size != 4) { | ||
414 | + /* Byte and halfword writes are ignored */ | ||
415 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
416 | + "IotKit SecCtl NS block write: bad size, ignored\n"); | ||
417 | + return MEMTX_OK; | ||
418 | + } | ||
419 | + | ||
420 | + switch (offset) { | ||
421 | + case A_AHBNSPPPCEXP0: | ||
422 | + case A_AHBNSPPPCEXP1: | ||
423 | + case A_AHBNSPPPCEXP2: | ||
424 | + case A_AHBNSPPPCEXP3: | ||
425 | + case A_APBNSPPPC0: | ||
426 | + case A_APBNSPPPC1: | ||
427 | + case A_APBNSPPPCEXP0: | ||
428 | + case A_APBNSPPPCEXP1: | ||
429 | + case A_APBNSPPPCEXP2: | ||
430 | + case A_APBNSPPPCEXP3: | ||
431 | + qemu_log_mask(LOG_UNIMP, | ||
432 | + "IoTKit SecCtl NS block write: " | ||
433 | + "unimplemented offset 0x%x\n", offset); | ||
434 | + break; | ||
435 | + case A_AHBNSPPPC0: | ||
436 | + case A_PID4: | ||
437 | + case A_PID5: | ||
438 | + case A_PID6: | ||
439 | + case A_PID7: | ||
440 | + case A_PID0: | ||
441 | + case A_PID1: | ||
442 | + case A_PID2: | ||
443 | + case A_PID3: | ||
444 | + case A_CID0: | ||
445 | + case A_CID1: | ||
446 | + case A_CID2: | ||
447 | + case A_CID3: | ||
448 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
449 | + "IoTKit SecCtl NS block write: " | ||
450 | + "read-only offset 0x%x\n", offset); | ||
451 | + break; | ||
452 | + default: | ||
453 | + qemu_log_mask(LOG_GUEST_ERROR, | ||
454 | + "IotKit SecCtl NS block write: bad offset 0x%x\n", | ||
455 | + offset); | ||
456 | + break; | ||
457 | + } | ||
458 | + | ||
459 | + return MEMTX_OK; | ||
460 | +} | ||
461 | + | ||
462 | +static const MemoryRegionOps iotkit_secctl_s_ops = { | ||
463 | + .read_with_attrs = iotkit_secctl_s_read, | ||
464 | + .write_with_attrs = iotkit_secctl_s_write, | ||
465 | + .endianness = DEVICE_LITTLE_ENDIAN, | ||
466 | + .valid.min_access_size = 1, | ||
467 | + .valid.max_access_size = 4, | ||
468 | + .impl.min_access_size = 1, | ||
469 | + .impl.max_access_size = 4, | ||
470 | +}; | ||
471 | + | ||
472 | +static const MemoryRegionOps iotkit_secctl_ns_ops = { | ||
473 | + .read_with_attrs = iotkit_secctl_ns_read, | ||
474 | + .write_with_attrs = iotkit_secctl_ns_write, | ||
475 | + .endianness = DEVICE_LITTLE_ENDIAN, | ||
476 | + .valid.min_access_size = 1, | ||
477 | + .valid.max_access_size = 4, | ||
478 | + .impl.min_access_size = 1, | ||
479 | + .impl.max_access_size = 4, | ||
480 | +}; | ||
481 | + | ||
482 | +static void iotkit_secctl_reset(DeviceState *dev) | ||
483 | +{ | ||
484 | + | ||
485 | +} | ||
486 | + | ||
487 | +static void iotkit_secctl_init(Object *obj) | ||
488 | +{ | ||
489 | + IoTKitSecCtl *s = IOTKIT_SECCTL(obj); | ||
490 | + SysBusDevice *sbd = SYS_BUS_DEVICE(obj); | ||
491 | + | ||
492 | + memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops, | ||
493 | + s, "iotkit-secctl-s-regs", 0x1000); | ||
494 | + memory_region_init_io(&s->ns_regs, obj, &iotkit_secctl_ns_ops, | ||
495 | + s, "iotkit-secctl-ns-regs", 0x1000); | ||
496 | + sysbus_init_mmio(sbd, &s->s_regs); | ||
497 | + sysbus_init_mmio(sbd, &s->ns_regs); | ||
498 | +} | ||
499 | + | ||
500 | +static const VMStateDescription iotkit_secctl_vmstate = { | ||
501 | + .name = "iotkit-secctl", | ||
90 | + .version_id = 1, | 502 | + .version_id = 1, |
91 | + .minimum_version_id = 1, | 503 | + .minimum_version_id = 1, |
92 | + .fields = (VMStateField[]) { | 504 | + .fields = (VMStateField[]) { |
93 | + VMSTATE_I2C_SLAVE(parent_obj, sii9022_state), | ||
94 | + VMSTATE_UINT8(ptr, sii9022_state), | ||
95 | + VMSTATE_BOOL(addr_byte, sii9022_state), | ||
96 | + VMSTATE_BOOL(ddc_req, sii9022_state), | ||
97 | + VMSTATE_BOOL(ddc_skip_finish, sii9022_state), | ||
98 | + VMSTATE_BOOL(ddc, sii9022_state), | ||
99 | + VMSTATE_END_OF_LIST() | 505 | + VMSTATE_END_OF_LIST() |
100 | + } | 506 | + } |
101 | +}; | 507 | +}; |
102 | + | 508 | + |
103 | +static int sii9022_event(I2CSlave *i2c, enum i2c_event event) | 509 | +static void iotkit_secctl_class_init(ObjectClass *klass, void *data) |
104 | +{ | ||
105 | + sii9022_state *s = SII9022(i2c); | ||
106 | + | ||
107 | + switch (event) { | ||
108 | + case I2C_START_SEND: | ||
109 | + s->addr_byte = true; | ||
110 | + break; | ||
111 | + case I2C_START_RECV: | ||
112 | + break; | ||
113 | + case I2C_FINISH: | ||
114 | + break; | ||
115 | + case I2C_NACK: | ||
116 | + break; | ||
117 | + } | ||
118 | + | ||
119 | + return 0; | ||
120 | +} | ||
121 | + | ||
122 | +static int sii9022_rx(I2CSlave *i2c) | ||
123 | +{ | ||
124 | + sii9022_state *s = SII9022(i2c); | ||
125 | + uint8_t res = 0x00; | ||
126 | + | ||
127 | + switch (s->ptr) { | ||
128 | + case SII9022_SYS_CTRL_DATA: | ||
129 | + if (s->ddc_req) { | ||
130 | + /* Acknowledge DDC bus request */ | ||
131 | + res = SII9022_SYS_CTRL_DDC_BUS_GRTD | SII9022_SYS_CTRL_DDC_BUS_REQ; | ||
132 | + } | ||
133 | + break; | ||
134 | + case SII9022_REG_CHIPID: | ||
135 | + res = 0xb0; | ||
136 | + break; | ||
137 | + case SII9022_INT_STATUS: | ||
138 | + /* Something is cold-plugged in, no interrupts */ | ||
139 | + res = SII9022_INT_STATUS_PLUGGED; | ||
140 | + break; | ||
141 | + default: | ||
142 | + break; | ||
143 | + } | ||
144 | + | ||
145 | + trace_sii9022_read_reg(s->ptr, res); | ||
146 | + s->ptr++; | ||
147 | + | ||
148 | + return res; | ||
149 | +} | ||
150 | + | ||
151 | +static int sii9022_tx(I2CSlave *i2c, uint8_t data) | ||
152 | +{ | ||
153 | + sii9022_state *s = SII9022(i2c); | ||
154 | + | ||
155 | + if (s->addr_byte) { | ||
156 | + s->ptr = data; | ||
157 | + s->addr_byte = false; | ||
158 | + return 0; | ||
159 | + } | ||
160 | + | ||
161 | + switch (s->ptr) { | ||
162 | + case SII9022_SYS_CTRL_DATA: | ||
163 | + if (data & SII9022_SYS_CTRL_DDC_BUS_REQ) { | ||
164 | + s->ddc_req = true; | ||
165 | + if (data & SII9022_SYS_CTRL_DDC_BUS_GRTD) { | ||
166 | + s->ddc = true; | ||
167 | + /* Skip this finish since we just switched to DDC */ | ||
168 | + s->ddc_skip_finish = true; | ||
169 | + trace_sii9022_switch_mode("DDC"); | ||
170 | + } | ||
171 | + } else { | ||
172 | + s->ddc_req = false; | ||
173 | + s->ddc = false; | ||
174 | + trace_sii9022_switch_mode("normal"); | ||
175 | + } | ||
176 | + break; | ||
177 | + default: | ||
178 | + break; | ||
179 | + } | ||
180 | + | ||
181 | + trace_sii9022_write_reg(s->ptr, data); | ||
182 | + s->ptr++; | ||
183 | + | ||
184 | + return 0; | ||
185 | +} | ||
186 | + | ||
187 | +static void sii9022_reset(DeviceState *dev) | ||
188 | +{ | ||
189 | + sii9022_state *s = SII9022(dev); | ||
190 | + | ||
191 | + s->ptr = 0; | ||
192 | + s->addr_byte = false; | ||
193 | + s->ddc_req = false; | ||
194 | + s->ddc_skip_finish = false; | ||
195 | + s->ddc = false; | ||
196 | +} | ||
197 | + | ||
198 | +static void sii9022_realize(DeviceState *dev, Error **errp) | ||
199 | +{ | ||
200 | + I2CBus *bus; | ||
201 | + | ||
202 | + bus = I2C_BUS(qdev_get_parent_bus(dev)); | ||
203 | + i2c_create_slave(bus, TYPE_I2CDDC, 0x50); | ||
204 | +} | ||
205 | + | ||
206 | +static void sii9022_class_init(ObjectClass *klass, void *data) | ||
207 | +{ | 510 | +{ |
208 | + DeviceClass *dc = DEVICE_CLASS(klass); | 511 | + DeviceClass *dc = DEVICE_CLASS(klass); |
209 | + I2CSlaveClass *k = I2C_SLAVE_CLASS(klass); | 512 | + |
210 | + | 513 | + dc->vmsd = &iotkit_secctl_vmstate; |
211 | + k->event = sii9022_event; | 514 | + dc->reset = iotkit_secctl_reset; |
212 | + k->recv = sii9022_rx; | 515 | +} |
213 | + k->send = sii9022_tx; | 516 | + |
214 | + dc->reset = sii9022_reset; | 517 | +static const TypeInfo iotkit_secctl_info = { |
215 | + dc->realize = sii9022_realize; | 518 | + .name = TYPE_IOTKIT_SECCTL, |
216 | + dc->vmsd = &vmstate_sii9022; | 519 | + .parent = TYPE_SYS_BUS_DEVICE, |
217 | +} | 520 | + .instance_size = sizeof(IoTKitSecCtl), |
218 | + | 521 | + .instance_init = iotkit_secctl_init, |
219 | +static const TypeInfo sii9022_info = { | 522 | + .class_init = iotkit_secctl_class_init, |
220 | + .name = TYPE_SII9022, | ||
221 | + .parent = TYPE_I2C_SLAVE, | ||
222 | + .instance_size = sizeof(sii9022_state), | ||
223 | + .class_init = sii9022_class_init, | ||
224 | +}; | 523 | +}; |
225 | + | 524 | + |
226 | +static void sii9022_register_types(void) | 525 | +static void iotkit_secctl_register_types(void) |
227 | +{ | 526 | +{ |
228 | + type_register_static(&sii9022_info); | 527 | + type_register_static(&iotkit_secctl_info); |
229 | +} | 528 | +} |
230 | + | 529 | + |
231 | +type_init(sii9022_register_types) | 530 | +type_init(iotkit_secctl_register_types); |
232 | diff --git a/hw/display/trace-events b/hw/display/trace-events | 531 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak |
233 | index XXXXXXX..XXXXXXX 100644 | 532 | index XXXXXXX..XXXXXXX 100644 |
234 | --- a/hw/display/trace-events | 533 | --- a/default-configs/arm-softmmu.mak |
235 | +++ b/hw/display/trace-events | 534 | +++ b/default-configs/arm-softmmu.mak |
236 | @@ -XXX,XX +XXX,XX @@ vga_cirrus_read_io(uint32_t addr, uint32_t val) "addr 0x%x, val 0x%x" | 535 | @@ -XXX,XX +XXX,XX @@ CONFIG_MPS2_FPGAIO=y |
237 | vga_cirrus_write_io(uint32_t addr, uint32_t val) "addr 0x%x, val 0x%x" | 536 | CONFIG_MPS2_SCC=y |
238 | vga_cirrus_read_blt(uint32_t offset, uint32_t val) "offset 0x%x, val 0x%x" | 537 | |
239 | vga_cirrus_write_blt(uint32_t offset, uint32_t val) "offset 0x%x, val 0x%x" | 538 | CONFIG_TZ_PPC=y |
240 | + | 539 | +CONFIG_IOTKIT_SECCTL=y |
241 | +# hw/display/sii9022.c | 540 | |
242 | +sii9022_read_reg(uint8_t addr, uint8_t val) "addr 0x%02x, val 0x%02x" | 541 | CONFIG_VERSATILE_PCI=y |
243 | +sii9022_write_reg(uint8_t addr, uint8_t val) "addr 0x%02x, val 0x%02x" | 542 | CONFIG_VERSATILE_I2C=y |
244 | +sii9022_switch_mode(const char *mode) "mode: %s" | 543 | diff --git a/hw/misc/trace-events b/hw/misc/trace-events |
544 | index XXXXXXX..XXXXXXX 100644 | ||
545 | --- a/hw/misc/trace-events | ||
546 | +++ b/hw/misc/trace-events | ||
547 | @@ -XXX,XX +XXX,XX @@ tz_ppc_irq_clear(int level) "TZ PPC: int_clear = %d" | ||
548 | tz_ppc_update_irq(int level) "TZ PPC: setting irq line to %d" | ||
549 | tz_ppc_read_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " read (secure %d user %d) blocked" | ||
550 | tz_ppc_write_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " write (secure %d user %d) blocked" | ||
551 | + | ||
552 | +# hw/misc/iotkit-secctl.c | ||
553 | +iotkit_secctl_s_read(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl S regs read: offset 0x%x data 0x%" PRIx64 " size %u" | ||
554 | +iotkit_secctl_s_write(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl S regs write: offset 0x%x data 0x%" PRIx64 " size %u" | ||
555 | +iotkit_secctl_ns_read(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl NS regs read: offset 0x%x data 0x%" PRIx64 " size %u" | ||
556 | +iotkit_secctl_ns_write(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl NS regs write: offset 0x%x data 0x%" PRIx64 " size %u" | ||
557 | +iotkit_secctl_reset(void) "IoTKit SecCtl: reset" | ||
245 | -- | 558 | -- |
246 | 2.16.2 | 559 | 2.16.2 |
247 | 560 | ||
248 | 561 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | The IoTKit Security Controller includes various registers |
---|---|---|---|
2 | that expose to software the controls for the Peripheral | ||
3 | Protection Controllers in the system. Implement these. | ||
2 | 4 | ||
3 | As some of the constants here will also be needed | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | elsewhere (specifically for the upcoming SVE support) we move them out | 6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | to softfloat.h. | 7 | Message-id: 20180220180325.29818-17-peter.maydell@linaro.org |
8 | --- | ||
9 | include/hw/misc/iotkit-secctl.h | 64 +++++++++- | ||
10 | hw/misc/iotkit-secctl.c | 270 +++++++++++++++++++++++++++++++++++++--- | ||
11 | 2 files changed, 315 insertions(+), 19 deletions(-) | ||
6 | 12 | ||
7 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 13 | diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20180227143852.11175-13-alex.bennee@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | --- | ||
12 | include/fpu/softfloat.h | 18 +++++++++++++----- | ||
13 | target/arm/helper-a64.h | 2 ++ | ||
14 | target/arm/helper-a64.c | 34 ++++++++++++++++++++++++++++++++++ | ||
15 | target/arm/translate-a64.c | 6 ++++++ | ||
16 | 4 files changed, 55 insertions(+), 5 deletions(-) | ||
17 | |||
18 | diff --git a/include/fpu/softfloat.h b/include/fpu/softfloat.h | ||
19 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/include/fpu/softfloat.h | 15 | --- a/include/hw/misc/iotkit-secctl.h |
21 | +++ b/include/fpu/softfloat.h | 16 | +++ b/include/hw/misc/iotkit-secctl.h |
22 | @@ -XXX,XX +XXX,XX @@ static inline float16 float16_set_sign(float16 a, int sign) | 17 | @@ -XXX,XX +XXX,XX @@ |
18 | * QEMU interface: | ||
19 | * + sysbus MMIO region 0 is the "secure privilege control block" registers | ||
20 | * + sysbus MMIO region 1 is the "non-secure privilege control block" registers | ||
21 | + * + named GPIO output "sec_resp_cfg" indicating whether blocked accesses | ||
22 | + * should RAZ/WI or bus error | ||
23 | + * Controlling the 2 APB PPCs in the IoTKit: | ||
24 | + * + named GPIO outputs apb_ppc0_nonsec[0..2] and apb_ppc1_nonsec | ||
25 | + * + named GPIO outputs apb_ppc0_ap[0..2] and apb_ppc1_ap | ||
26 | + * + named GPIO outputs apb_ppc{0,1}_irq_enable | ||
27 | + * + named GPIO outputs apb_ppc{0,1}_irq_clear | ||
28 | + * + named GPIO inputs apb_ppc{0,1}_irq_status | ||
29 | + * Controlling each of the 4 expansion APB PPCs which a system using the IoTKit | ||
30 | + * might provide: | ||
31 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_nonsec[0..15] | ||
32 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_ap[0..15] | ||
33 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_enable | ||
34 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_clear | ||
35 | + * + named GPIO inputs apb_ppcexp{0,1,2,3}_irq_status | ||
36 | + * Controlling each of the 4 expansion AHB PPCs which a system using the IoTKit | ||
37 | + * might provide: | ||
38 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_nonsec[0..15] | ||
39 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_ap[0..15] | ||
40 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_enable | ||
41 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_clear | ||
42 | + * + named GPIO inputs ahb_ppcexp{0,1,2,3}_irq_status | ||
43 | */ | ||
44 | |||
45 | #ifndef IOTKIT_SECCTL_H | ||
46 | @@ -XXX,XX +XXX,XX @@ | ||
47 | #define TYPE_IOTKIT_SECCTL "iotkit-secctl" | ||
48 | #define IOTKIT_SECCTL(obj) OBJECT_CHECK(IoTKitSecCtl, (obj), TYPE_IOTKIT_SECCTL) | ||
49 | |||
50 | -typedef struct IoTKitSecCtl { | ||
51 | +#define IOTS_APB_PPC0_NUM_PORTS 3 | ||
52 | +#define IOTS_APB_PPC1_NUM_PORTS 1 | ||
53 | +#define IOTS_PPC_NUM_PORTS 16 | ||
54 | +#define IOTS_NUM_APB_PPC 2 | ||
55 | +#define IOTS_NUM_APB_EXP_PPC 4 | ||
56 | +#define IOTS_NUM_AHB_EXP_PPC 4 | ||
57 | + | ||
58 | +typedef struct IoTKitSecCtl IoTKitSecCtl; | ||
59 | + | ||
60 | +/* State and IRQ lines relating to a PPC. For the | ||
61 | + * PPCs in the IoTKit not all the IRQ lines are used. | ||
62 | + */ | ||
63 | +typedef struct IoTKitSecCtlPPC { | ||
64 | + qemu_irq nonsec[IOTS_PPC_NUM_PORTS]; | ||
65 | + qemu_irq ap[IOTS_PPC_NUM_PORTS]; | ||
66 | + qemu_irq irq_enable; | ||
67 | + qemu_irq irq_clear; | ||
68 | + | ||
69 | + uint32_t ns; | ||
70 | + uint32_t sp; | ||
71 | + uint32_t nsp; | ||
72 | + | ||
73 | + /* Number of ports actually present */ | ||
74 | + int numports; | ||
75 | + /* Offset of this PPC's interrupt bits in SECPPCINTSTAT */ | ||
76 | + int irq_bit_offset; | ||
77 | + IoTKitSecCtl *parent; | ||
78 | +} IoTKitSecCtlPPC; | ||
79 | + | ||
80 | +struct IoTKitSecCtl { | ||
81 | /*< private >*/ | ||
82 | SysBusDevice parent_obj; | ||
83 | |||
84 | /*< public >*/ | ||
85 | + qemu_irq sec_resp_cfg; | ||
86 | |||
87 | MemoryRegion s_regs; | ||
88 | MemoryRegion ns_regs; | ||
89 | -} IoTKitSecCtl; | ||
90 | + | ||
91 | + uint32_t secppcintstat; | ||
92 | + uint32_t secppcinten; | ||
93 | + uint32_t secrespcfg; | ||
94 | + | ||
95 | + IoTKitSecCtlPPC apb[IOTS_NUM_APB_PPC]; | ||
96 | + IoTKitSecCtlPPC apbexp[IOTS_NUM_APB_EXP_PPC]; | ||
97 | + IoTKitSecCtlPPC ahbexp[IOTS_NUM_APB_EXP_PPC]; | ||
98 | +}; | ||
99 | |||
100 | #endif | ||
101 | diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c | ||
102 | index XXXXXXX..XXXXXXX 100644 | ||
103 | --- a/hw/misc/iotkit-secctl.c | ||
104 | +++ b/hw/misc/iotkit-secctl.c | ||
105 | @@ -XXX,XX +XXX,XX @@ static const uint8_t iotkit_secctl_ns_idregs[] = { | ||
106 | 0x0d, 0xf0, 0x05, 0xb1, | ||
107 | }; | ||
108 | |||
109 | +/* The register sets for the various PPCs (AHB internal, APB internal, | ||
110 | + * AHB expansion, APB expansion) are all set up so that they are | ||
111 | + * in 16-aligned blocks so offsets 0xN0, 0xN4, 0xN8, 0xNC are PPCs | ||
112 | + * 0, 1, 2, 3 of that type, so we can convert a register address offset | ||
113 | + * into an an index into a PPC array easily. | ||
114 | + */ | ||
115 | +static inline int offset_to_ppc_idx(uint32_t offset) | ||
116 | +{ | ||
117 | + return extract32(offset, 2, 2); | ||
118 | +} | ||
119 | + | ||
120 | +typedef void PerPPCFunction(IoTKitSecCtlPPC *ppc); | ||
121 | + | ||
122 | +static void foreach_ppc(IoTKitSecCtl *s, PerPPCFunction *fn) | ||
123 | +{ | ||
124 | + int i; | ||
125 | + | ||
126 | + for (i = 0; i < IOTS_NUM_APB_PPC; i++) { | ||
127 | + fn(&s->apb[i]); | ||
128 | + } | ||
129 | + for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) { | ||
130 | + fn(&s->apbexp[i]); | ||
131 | + } | ||
132 | + for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) { | ||
133 | + fn(&s->ahbexp[i]); | ||
134 | + } | ||
135 | +} | ||
136 | + | ||
137 | static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
138 | uint64_t *pdata, | ||
139 | unsigned size, MemTxAttrs attrs) | ||
140 | { | ||
141 | uint64_t r; | ||
142 | uint32_t offset = addr & ~0x3; | ||
143 | + IoTKitSecCtl *s = IOTKIT_SECCTL(opaque); | ||
144 | |||
145 | switch (offset) { | ||
146 | case A_AHBNSPPC0: | ||
147 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
148 | r = 0; | ||
149 | break; | ||
150 | case A_SECRESPCFG: | ||
151 | - case A_NSCCFG: | ||
152 | - case A_SECMPCINTSTATUS: | ||
153 | + r = s->secrespcfg; | ||
154 | + break; | ||
155 | case A_SECPPCINTSTAT: | ||
156 | + r = s->secppcintstat; | ||
157 | + break; | ||
158 | case A_SECPPCINTEN: | ||
159 | - case A_SECMSCINTSTAT: | ||
160 | - case A_SECMSCINTEN: | ||
161 | - case A_BRGINTSTAT: | ||
162 | - case A_BRGINTEN: | ||
163 | + r = s->secppcinten; | ||
164 | + break; | ||
165 | case A_AHBNSPPCEXP0: | ||
166 | case A_AHBNSPPCEXP1: | ||
167 | case A_AHBNSPPCEXP2: | ||
168 | case A_AHBNSPPCEXP3: | ||
169 | + r = s->ahbexp[offset_to_ppc_idx(offset)].ns; | ||
170 | + break; | ||
171 | case A_APBNSPPC0: | ||
172 | case A_APBNSPPC1: | ||
173 | + r = s->apb[offset_to_ppc_idx(offset)].ns; | ||
174 | + break; | ||
175 | case A_APBNSPPCEXP0: | ||
176 | case A_APBNSPPCEXP1: | ||
177 | case A_APBNSPPCEXP2: | ||
178 | case A_APBNSPPCEXP3: | ||
179 | + r = s->apbexp[offset_to_ppc_idx(offset)].ns; | ||
180 | + break; | ||
181 | case A_AHBSPPPCEXP0: | ||
182 | case A_AHBSPPPCEXP1: | ||
183 | case A_AHBSPPPCEXP2: | ||
184 | case A_AHBSPPPCEXP3: | ||
185 | + r = s->apbexp[offset_to_ppc_idx(offset)].sp; | ||
186 | + break; | ||
187 | case A_APBSPPPC0: | ||
188 | case A_APBSPPPC1: | ||
189 | + r = s->apb[offset_to_ppc_idx(offset)].sp; | ||
190 | + break; | ||
191 | case A_APBSPPPCEXP0: | ||
192 | case A_APBSPPPCEXP1: | ||
193 | case A_APBSPPPCEXP2: | ||
194 | case A_APBSPPPCEXP3: | ||
195 | + r = s->apbexp[offset_to_ppc_idx(offset)].sp; | ||
196 | + break; | ||
197 | + case A_NSCCFG: | ||
198 | + case A_SECMPCINTSTATUS: | ||
199 | + case A_SECMSCINTSTAT: | ||
200 | + case A_SECMSCINTEN: | ||
201 | + case A_BRGINTSTAT: | ||
202 | + case A_BRGINTEN: | ||
203 | case A_NSMSCEXP: | ||
204 | qemu_log_mask(LOG_UNIMP, | ||
205 | "IoTKit SecCtl S block read: " | ||
206 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
207 | return MEMTX_OK; | ||
23 | } | 208 | } |
24 | 209 | ||
25 | #define float16_zero make_float16(0) | 210 | +static void iotkit_secctl_update_ppc_ap(IoTKitSecCtlPPC *ppc) |
26 | -#define float16_one make_float16(0x3c00) | 211 | +{ |
27 | #define float16_half make_float16(0x3800) | 212 | + int i; |
28 | +#define float16_one make_float16(0x3c00) | 213 | + |
29 | +#define float16_one_point_five make_float16(0x3e00) | 214 | + for (i = 0; i < ppc->numports; i++) { |
30 | +#define float16_two make_float16(0x4000) | 215 | + bool v; |
31 | +#define float16_three make_float16(0x4200) | 216 | + |
32 | #define float16_infinity make_float16(0x7c00) | 217 | + if (extract32(ppc->ns, i, 1)) { |
33 | 218 | + v = extract32(ppc->nsp, i, 1); | |
34 | /*---------------------------------------------------------------------------- | 219 | + } else { |
35 | @@ -XXX,XX +XXX,XX @@ static inline float32 float32_set_sign(float32 a, int sign) | 220 | + v = extract32(ppc->sp, i, 1); |
221 | + } | ||
222 | + qemu_set_irq(ppc->ap[i], v); | ||
223 | + } | ||
224 | +} | ||
225 | + | ||
226 | +static void iotkit_secctl_ppc_ns_write(IoTKitSecCtlPPC *ppc, uint32_t value) | ||
227 | +{ | ||
228 | + int i; | ||
229 | + | ||
230 | + ppc->ns = value & MAKE_64BIT_MASK(0, ppc->numports); | ||
231 | + for (i = 0; i < ppc->numports; i++) { | ||
232 | + qemu_set_irq(ppc->nonsec[i], extract32(ppc->ns, i, 1)); | ||
233 | + } | ||
234 | + iotkit_secctl_update_ppc_ap(ppc); | ||
235 | +} | ||
236 | + | ||
237 | +static void iotkit_secctl_ppc_sp_write(IoTKitSecCtlPPC *ppc, uint32_t value) | ||
238 | +{ | ||
239 | + ppc->sp = value & MAKE_64BIT_MASK(0, ppc->numports); | ||
240 | + iotkit_secctl_update_ppc_ap(ppc); | ||
241 | +} | ||
242 | + | ||
243 | +static void iotkit_secctl_ppc_nsp_write(IoTKitSecCtlPPC *ppc, uint32_t value) | ||
244 | +{ | ||
245 | + ppc->nsp = value & MAKE_64BIT_MASK(0, ppc->numports); | ||
246 | + iotkit_secctl_update_ppc_ap(ppc); | ||
247 | +} | ||
248 | + | ||
249 | +static void iotkit_secctl_ppc_update_irq_clear(IoTKitSecCtlPPC *ppc) | ||
250 | +{ | ||
251 | + uint32_t value = ppc->parent->secppcintstat; | ||
252 | + | ||
253 | + qemu_set_irq(ppc->irq_clear, extract32(value, ppc->irq_bit_offset, 1)); | ||
254 | +} | ||
255 | + | ||
256 | +static void iotkit_secctl_ppc_update_irq_enable(IoTKitSecCtlPPC *ppc) | ||
257 | +{ | ||
258 | + uint32_t value = ppc->parent->secppcinten; | ||
259 | + | ||
260 | + qemu_set_irq(ppc->irq_enable, extract32(value, ppc->irq_bit_offset, 1)); | ||
261 | +} | ||
262 | + | ||
263 | static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
264 | uint64_t value, | ||
265 | unsigned size, MemTxAttrs attrs) | ||
266 | { | ||
267 | + IoTKitSecCtl *s = IOTKIT_SECCTL(opaque); | ||
268 | uint32_t offset = addr; | ||
269 | + IoTKitSecCtlPPC *ppc; | ||
270 | |||
271 | trace_iotkit_secctl_s_write(offset, value, size); | ||
272 | |||
273 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
274 | |||
275 | switch (offset) { | ||
276 | case A_SECRESPCFG: | ||
277 | - case A_NSCCFG: | ||
278 | + value &= 1; | ||
279 | + s->secrespcfg = value; | ||
280 | + qemu_set_irq(s->sec_resp_cfg, s->secrespcfg); | ||
281 | + break; | ||
282 | case A_SECPPCINTCLR: | ||
283 | + value &= 0x00f000f3; | ||
284 | + foreach_ppc(s, iotkit_secctl_ppc_update_irq_clear); | ||
285 | + break; | ||
286 | case A_SECPPCINTEN: | ||
287 | - case A_SECMSCINTCLR: | ||
288 | - case A_SECMSCINTEN: | ||
289 | - case A_BRGINTCLR: | ||
290 | - case A_BRGINTEN: | ||
291 | + s->secppcinten = value & 0x00f000f3; | ||
292 | + foreach_ppc(s, iotkit_secctl_ppc_update_irq_enable); | ||
293 | + break; | ||
294 | case A_AHBNSPPCEXP0: | ||
295 | case A_AHBNSPPCEXP1: | ||
296 | case A_AHBNSPPCEXP2: | ||
297 | case A_AHBNSPPCEXP3: | ||
298 | + ppc = &s->ahbexp[offset_to_ppc_idx(offset)]; | ||
299 | + iotkit_secctl_ppc_ns_write(ppc, value); | ||
300 | + break; | ||
301 | case A_APBNSPPC0: | ||
302 | case A_APBNSPPC1: | ||
303 | + ppc = &s->apb[offset_to_ppc_idx(offset)]; | ||
304 | + iotkit_secctl_ppc_ns_write(ppc, value); | ||
305 | + break; | ||
306 | case A_APBNSPPCEXP0: | ||
307 | case A_APBNSPPCEXP1: | ||
308 | case A_APBNSPPCEXP2: | ||
309 | case A_APBNSPPCEXP3: | ||
310 | + ppc = &s->apbexp[offset_to_ppc_idx(offset)]; | ||
311 | + iotkit_secctl_ppc_ns_write(ppc, value); | ||
312 | + break; | ||
313 | case A_AHBSPPPCEXP0: | ||
314 | case A_AHBSPPPCEXP1: | ||
315 | case A_AHBSPPPCEXP2: | ||
316 | case A_AHBSPPPCEXP3: | ||
317 | + ppc = &s->ahbexp[offset_to_ppc_idx(offset)]; | ||
318 | + iotkit_secctl_ppc_sp_write(ppc, value); | ||
319 | + break; | ||
320 | case A_APBSPPPC0: | ||
321 | case A_APBSPPPC1: | ||
322 | + ppc = &s->apb[offset_to_ppc_idx(offset)]; | ||
323 | + iotkit_secctl_ppc_sp_write(ppc, value); | ||
324 | + break; | ||
325 | case A_APBSPPPCEXP0: | ||
326 | case A_APBSPPPCEXP1: | ||
327 | case A_APBSPPPCEXP2: | ||
328 | case A_APBSPPPCEXP3: | ||
329 | + ppc = &s->apbexp[offset_to_ppc_idx(offset)]; | ||
330 | + iotkit_secctl_ppc_sp_write(ppc, value); | ||
331 | + break; | ||
332 | + case A_NSCCFG: | ||
333 | + case A_SECMSCINTCLR: | ||
334 | + case A_SECMSCINTEN: | ||
335 | + case A_BRGINTCLR: | ||
336 | + case A_BRGINTEN: | ||
337 | qemu_log_mask(LOG_UNIMP, | ||
338 | "IoTKit SecCtl S block write: " | ||
339 | "unimplemented offset 0x%x\n", offset); | ||
340 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr, | ||
341 | uint64_t *pdata, | ||
342 | unsigned size, MemTxAttrs attrs) | ||
343 | { | ||
344 | + IoTKitSecCtl *s = IOTKIT_SECCTL(opaque); | ||
345 | uint64_t r; | ||
346 | uint32_t offset = addr & ~0x3; | ||
347 | |||
348 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr, | ||
349 | case A_AHBNSPPPCEXP1: | ||
350 | case A_AHBNSPPPCEXP2: | ||
351 | case A_AHBNSPPPCEXP3: | ||
352 | + r = s->ahbexp[offset_to_ppc_idx(offset)].nsp; | ||
353 | + break; | ||
354 | case A_APBNSPPPC0: | ||
355 | case A_APBNSPPPC1: | ||
356 | + r = s->apb[offset_to_ppc_idx(offset)].nsp; | ||
357 | + break; | ||
358 | case A_APBNSPPPCEXP0: | ||
359 | case A_APBNSPPPCEXP1: | ||
360 | case A_APBNSPPPCEXP2: | ||
361 | case A_APBNSPPPCEXP3: | ||
362 | - qemu_log_mask(LOG_UNIMP, | ||
363 | - "IoTKit SecCtl NS block read: " | ||
364 | - "unimplemented offset 0x%x\n", offset); | ||
365 | + r = s->apbexp[offset_to_ppc_idx(offset)].nsp; | ||
366 | break; | ||
367 | case A_PID4: | ||
368 | case A_PID5: | ||
369 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr, | ||
370 | uint64_t value, | ||
371 | unsigned size, MemTxAttrs attrs) | ||
372 | { | ||
373 | + IoTKitSecCtl *s = IOTKIT_SECCTL(opaque); | ||
374 | uint32_t offset = addr; | ||
375 | + IoTKitSecCtlPPC *ppc; | ||
376 | |||
377 | trace_iotkit_secctl_ns_write(offset, value, size); | ||
378 | |||
379 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr, | ||
380 | case A_AHBNSPPPCEXP1: | ||
381 | case A_AHBNSPPPCEXP2: | ||
382 | case A_AHBNSPPPCEXP3: | ||
383 | + ppc = &s->ahbexp[offset_to_ppc_idx(offset)]; | ||
384 | + iotkit_secctl_ppc_nsp_write(ppc, value); | ||
385 | + break; | ||
386 | case A_APBNSPPPC0: | ||
387 | case A_APBNSPPPC1: | ||
388 | + ppc = &s->apb[offset_to_ppc_idx(offset)]; | ||
389 | + iotkit_secctl_ppc_nsp_write(ppc, value); | ||
390 | + break; | ||
391 | case A_APBNSPPPCEXP0: | ||
392 | case A_APBNSPPPCEXP1: | ||
393 | case A_APBNSPPPCEXP2: | ||
394 | case A_APBNSPPPCEXP3: | ||
395 | - qemu_log_mask(LOG_UNIMP, | ||
396 | - "IoTKit SecCtl NS block write: " | ||
397 | - "unimplemented offset 0x%x\n", offset); | ||
398 | + ppc = &s->apbexp[offset_to_ppc_idx(offset)]; | ||
399 | + iotkit_secctl_ppc_nsp_write(ppc, value); | ||
400 | break; | ||
401 | case A_AHBNSPPPC0: | ||
402 | case A_PID4: | ||
403 | @@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps iotkit_secctl_ns_ops = { | ||
404 | .impl.max_access_size = 4, | ||
405 | }; | ||
406 | |||
407 | +static void iotkit_secctl_reset_ppc(IoTKitSecCtlPPC *ppc) | ||
408 | +{ | ||
409 | + ppc->ns = 0; | ||
410 | + ppc->sp = 0; | ||
411 | + ppc->nsp = 0; | ||
412 | +} | ||
413 | + | ||
414 | static void iotkit_secctl_reset(DeviceState *dev) | ||
415 | { | ||
416 | + IoTKitSecCtl *s = IOTKIT_SECCTL(dev); | ||
417 | |||
418 | + s->secppcintstat = 0; | ||
419 | + s->secppcinten = 0; | ||
420 | + s->secrespcfg = 0; | ||
421 | + | ||
422 | + foreach_ppc(s, iotkit_secctl_reset_ppc); | ||
423 | +} | ||
424 | + | ||
425 | +static void iotkit_secctl_ppc_irqstatus(void *opaque, int n, int level) | ||
426 | +{ | ||
427 | + IoTKitSecCtlPPC *ppc = opaque; | ||
428 | + IoTKitSecCtl *s = IOTKIT_SECCTL(ppc->parent); | ||
429 | + int irqbit = ppc->irq_bit_offset + n; | ||
430 | + | ||
431 | + s->secppcintstat = deposit32(s->secppcintstat, irqbit, 1, level); | ||
432 | +} | ||
433 | + | ||
434 | +static void iotkit_secctl_init_ppc(IoTKitSecCtl *s, | ||
435 | + IoTKitSecCtlPPC *ppc, | ||
436 | + const char *name, | ||
437 | + int numports, | ||
438 | + int irq_bit_offset) | ||
439 | +{ | ||
440 | + char *gpioname; | ||
441 | + DeviceState *dev = DEVICE(s); | ||
442 | + | ||
443 | + ppc->numports = numports; | ||
444 | + ppc->irq_bit_offset = irq_bit_offset; | ||
445 | + ppc->parent = s; | ||
446 | + | ||
447 | + gpioname = g_strdup_printf("%s_nonsec", name); | ||
448 | + qdev_init_gpio_out_named(dev, ppc->nonsec, gpioname, numports); | ||
449 | + g_free(gpioname); | ||
450 | + gpioname = g_strdup_printf("%s_ap", name); | ||
451 | + qdev_init_gpio_out_named(dev, ppc->ap, gpioname, numports); | ||
452 | + g_free(gpioname); | ||
453 | + gpioname = g_strdup_printf("%s_irq_enable", name); | ||
454 | + qdev_init_gpio_out_named(dev, &ppc->irq_enable, gpioname, 1); | ||
455 | + g_free(gpioname); | ||
456 | + gpioname = g_strdup_printf("%s_irq_clear", name); | ||
457 | + qdev_init_gpio_out_named(dev, &ppc->irq_clear, gpioname, 1); | ||
458 | + g_free(gpioname); | ||
459 | + gpioname = g_strdup_printf("%s_irq_status", name); | ||
460 | + qdev_init_gpio_in_named_with_opaque(dev, iotkit_secctl_ppc_irqstatus, | ||
461 | + ppc, gpioname, 1); | ||
462 | + g_free(gpioname); | ||
36 | } | 463 | } |
37 | 464 | ||
38 | #define float32_zero make_float32(0) | 465 | static void iotkit_secctl_init(Object *obj) |
39 | -#define float32_one make_float32(0x3f800000) | 466 | { |
40 | #define float32_half make_float32(0x3f000000) | 467 | IoTKitSecCtl *s = IOTKIT_SECCTL(obj); |
41 | +#define float32_one make_float32(0x3f800000) | 468 | SysBusDevice *sbd = SYS_BUS_DEVICE(obj); |
42 | +#define float32_one_point_five make_float32(0x3fc00000) | 469 | + DeviceState *dev = DEVICE(obj); |
43 | +#define float32_two make_float32(0x40000000) | 470 | + int i; |
44 | +#define float32_three make_float32(0x40400000) | 471 | + |
45 | #define float32_infinity make_float32(0x7f800000) | 472 | + iotkit_secctl_init_ppc(s, &s->apb[0], "apb_ppc0", |
46 | 473 | + IOTS_APB_PPC0_NUM_PORTS, 0); | |
47 | - | 474 | + iotkit_secctl_init_ppc(s, &s->apb[1], "apb_ppc1", |
48 | /*---------------------------------------------------------------------------- | 475 | + IOTS_APB_PPC1_NUM_PORTS, 1); |
49 | | The pattern for a default generated single-precision NaN. | 476 | + |
50 | *----------------------------------------------------------------------------*/ | 477 | + for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) { |
51 | @@ -XXX,XX +XXX,XX @@ static inline float64 float64_set_sign(float64 a, int sign) | 478 | + IoTKitSecCtlPPC *ppc = &s->apbexp[i]; |
479 | + char *ppcname = g_strdup_printf("apb_ppcexp%d", i); | ||
480 | + iotkit_secctl_init_ppc(s, ppc, ppcname, IOTS_PPC_NUM_PORTS, 4 + i); | ||
481 | + g_free(ppcname); | ||
482 | + } | ||
483 | + for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) { | ||
484 | + IoTKitSecCtlPPC *ppc = &s->ahbexp[i]; | ||
485 | + char *ppcname = g_strdup_printf("ahb_ppcexp%d", i); | ||
486 | + iotkit_secctl_init_ppc(s, ppc, ppcname, IOTS_PPC_NUM_PORTS, 20 + i); | ||
487 | + g_free(ppcname); | ||
488 | + } | ||
489 | + | ||
490 | + qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1); | ||
491 | |||
492 | memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops, | ||
493 | s, "iotkit-secctl-s-regs", 0x1000); | ||
494 | @@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_init(Object *obj) | ||
495 | sysbus_init_mmio(sbd, &s->ns_regs); | ||
52 | } | 496 | } |
53 | 497 | ||
54 | #define float64_zero make_float64(0) | 498 | +static const VMStateDescription iotkit_secctl_ppc_vmstate = { |
55 | -#define float64_one make_float64(0x3ff0000000000000LL) | 499 | + .name = "iotkit-secctl-ppc", |
56 | -#define float64_ln2 make_float64(0x3fe62e42fefa39efLL) | 500 | + .version_id = 1, |
57 | #define float64_half make_float64(0x3fe0000000000000LL) | 501 | + .minimum_version_id = 1, |
58 | +#define float64_one make_float64(0x3ff0000000000000LL) | 502 | + .fields = (VMStateField[]) { |
59 | +#define float64_one_point_five make_float64(0x3FF8000000000000ULL) | 503 | + VMSTATE_UINT32(ns, IoTKitSecCtlPPC), |
60 | +#define float64_two make_float64(0x4000000000000000ULL) | 504 | + VMSTATE_UINT32(sp, IoTKitSecCtlPPC), |
61 | +#define float64_three make_float64(0x4008000000000000ULL) | 505 | + VMSTATE_UINT32(nsp, IoTKitSecCtlPPC), |
62 | +#define float64_ln2 make_float64(0x3fe62e42fefa39efLL) | 506 | + VMSTATE_END_OF_LIST() |
63 | #define float64_infinity make_float64(0x7ff0000000000000LL) | 507 | + } |
64 | 508 | +}; | |
65 | /*---------------------------------------------------------------------------- | 509 | + |
66 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 510 | static const VMStateDescription iotkit_secctl_vmstate = { |
67 | index XXXXXXX..XXXXXXX 100644 | 511 | .name = "iotkit-secctl", |
68 | --- a/target/arm/helper-a64.h | 512 | .version_id = 1, |
69 | +++ b/target/arm/helper-a64.h | 513 | .minimum_version_id = 1, |
70 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(vfp_mulxd, TCG_CALL_NO_RWG, f64, f64, f64, ptr) | 514 | .fields = (VMStateField[]) { |
71 | DEF_HELPER_FLAGS_3(neon_ceq_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr) | 515 | + VMSTATE_UINT32(secppcintstat, IoTKitSecCtl), |
72 | DEF_HELPER_FLAGS_3(neon_cge_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr) | 516 | + VMSTATE_UINT32(secppcinten, IoTKitSecCtl), |
73 | DEF_HELPER_FLAGS_3(neon_cgt_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr) | 517 | + VMSTATE_UINT32(secrespcfg, IoTKitSecCtl), |
74 | +DEF_HELPER_FLAGS_3(recpsf_f16, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 518 | + VMSTATE_STRUCT_ARRAY(apb, IoTKitSecCtl, IOTS_NUM_APB_PPC, 1, |
75 | DEF_HELPER_FLAGS_3(recpsf_f32, TCG_CALL_NO_RWG, f32, f32, f32, ptr) | 519 | + iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC), |
76 | DEF_HELPER_FLAGS_3(recpsf_f64, TCG_CALL_NO_RWG, f64, f64, f64, ptr) | 520 | + VMSTATE_STRUCT_ARRAY(apbexp, IoTKitSecCtl, IOTS_NUM_APB_EXP_PPC, 1, |
77 | +DEF_HELPER_FLAGS_3(rsqrtsf_f16, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 521 | + iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC), |
78 | DEF_HELPER_FLAGS_3(rsqrtsf_f32, TCG_CALL_NO_RWG, f32, f32, f32, ptr) | 522 | + VMSTATE_STRUCT_ARRAY(ahbexp, IoTKitSecCtl, IOTS_NUM_AHB_EXP_PPC, 1, |
79 | DEF_HELPER_FLAGS_3(rsqrtsf_f64, TCG_CALL_NO_RWG, f64, f64, f64, ptr) | 523 | + iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC), |
80 | DEF_HELPER_FLAGS_1(neon_addlp_s8, TCG_CALL_NO_RWG_SE, i64, i64) | 524 | VMSTATE_END_OF_LIST() |
81 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 525 | } |
82 | index XXXXXXX..XXXXXXX 100644 | 526 | }; |
83 | --- a/target/arm/helper-a64.c | ||
84 | +++ b/target/arm/helper-a64.c | ||
85 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_cgt_f64)(float64 a, float64 b, void *fpstp) | ||
86 | * versions, these do a fully fused multiply-add or | ||
87 | * multiply-add-and-halve. | ||
88 | */ | ||
89 | +#define float16_two make_float16(0x4000) | ||
90 | +#define float16_three make_float16(0x4200) | ||
91 | +#define float16_one_point_five make_float16(0x3e00) | ||
92 | + | ||
93 | #define float32_two make_float32(0x40000000) | ||
94 | #define float32_three make_float32(0x40400000) | ||
95 | #define float32_one_point_five make_float32(0x3fc00000) | ||
96 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_cgt_f64)(float64 a, float64 b, void *fpstp) | ||
97 | #define float64_three make_float64(0x4008000000000000ULL) | ||
98 | #define float64_one_point_five make_float64(0x3FF8000000000000ULL) | ||
99 | |||
100 | +float16 HELPER(recpsf_f16)(float16 a, float16 b, void *fpstp) | ||
101 | +{ | ||
102 | + float_status *fpst = fpstp; | ||
103 | + | ||
104 | + a = float16_squash_input_denormal(a, fpst); | ||
105 | + b = float16_squash_input_denormal(b, fpst); | ||
106 | + | ||
107 | + a = float16_chs(a); | ||
108 | + if ((float16_is_infinity(a) && float16_is_zero(b)) || | ||
109 | + (float16_is_infinity(b) && float16_is_zero(a))) { | ||
110 | + return float16_two; | ||
111 | + } | ||
112 | + return float16_muladd(a, b, float16_two, 0, fpst); | ||
113 | +} | ||
114 | + | ||
115 | float32 HELPER(recpsf_f32)(float32 a, float32 b, void *fpstp) | ||
116 | { | ||
117 | float_status *fpst = fpstp; | ||
118 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(recpsf_f64)(float64 a, float64 b, void *fpstp) | ||
119 | return float64_muladd(a, b, float64_two, 0, fpst); | ||
120 | } | ||
121 | |||
122 | +float16 HELPER(rsqrtsf_f16)(float16 a, float16 b, void *fpstp) | ||
123 | +{ | ||
124 | + float_status *fpst = fpstp; | ||
125 | + | ||
126 | + a = float16_squash_input_denormal(a, fpst); | ||
127 | + b = float16_squash_input_denormal(b, fpst); | ||
128 | + | ||
129 | + a = float16_chs(a); | ||
130 | + if ((float16_is_infinity(a) && float16_is_zero(b)) || | ||
131 | + (float16_is_infinity(b) && float16_is_zero(a))) { | ||
132 | + return float16_one_point_five; | ||
133 | + } | ||
134 | + return float16_muladd(a, b, float16_three, float_muladd_halve_result, fpst); | ||
135 | +} | ||
136 | + | ||
137 | float32 HELPER(rsqrtsf_f32)(float32 a, float32 b, void *fpstp) | ||
138 | { | ||
139 | float_status *fpst = fpstp; | ||
140 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
141 | index XXXXXXX..XXXXXXX 100644 | ||
142 | --- a/target/arm/translate-a64.c | ||
143 | +++ b/target/arm/translate-a64.c | ||
144 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
145 | case 0x6: /* FMAX */ | ||
146 | gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
147 | break; | ||
148 | + case 0x7: /* FRECPS */ | ||
149 | + gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
150 | + break; | ||
151 | case 0x8: /* FMINNM */ | ||
152 | gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
153 | break; | ||
154 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
155 | case 0xe: /* FMIN */ | ||
156 | gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
157 | break; | ||
158 | + case 0xf: /* FRSQRTS */ | ||
159 | + gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
160 | + break; | ||
161 | case 0x13: /* FMUL */ | ||
162 | gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
163 | break; | ||
164 | -- | 527 | -- |
165 | 2.16.2 | 528 | 2.16.2 |
166 | 529 | ||
167 | 530 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Add remaining easy registers to iotkit-secctl: |
---|---|---|---|
2 | * NSCCFG just routes its two bits out to external GPIO lines | ||
3 | * BRGINSTAT/BRGINTCLR/BRGINTEN can be dummies, because QEMU's | ||
4 | bus fabric can never report errors | ||
2 | 5 | ||
3 | Neither of these operations alter the floating point status registers | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | so we can do a pure bitwise operation, either squashing any sign | 7 | Message-id: 20180220180325.29818-18-peter.maydell@linaro.org |
5 | bit (ABS) or inverting it (NEG). | 8 | --- |
9 | include/hw/misc/iotkit-secctl.h | 4 ++++ | ||
10 | hw/misc/iotkit-secctl.c | 32 ++++++++++++++++++++++++++------ | ||
11 | 2 files changed, 30 insertions(+), 6 deletions(-) | ||
6 | 12 | ||
7 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 13 | diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20180227143852.11175-22-alex.bennee@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
11 | --- | ||
12 | target/arm/translate-a64.c | 16 +++++++++++++++- | ||
13 | 1 file changed, 15 insertions(+), 1 deletion(-) | ||
14 | |||
15 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
16 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/translate-a64.c | 15 | --- a/include/hw/misc/iotkit-secctl.h |
18 | +++ b/target/arm/translate-a64.c | 16 | +++ b/include/hw/misc/iotkit-secctl.h |
19 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 17 | @@ -XXX,XX +XXX,XX @@ |
20 | TCGv_i32 tcg_rmode = NULL; | 18 | * + sysbus MMIO region 1 is the "non-secure privilege control block" registers |
21 | TCGv_ptr tcg_fpstatus = NULL; | 19 | * + named GPIO output "sec_resp_cfg" indicating whether blocked accesses |
22 | bool need_rmode = false; | 20 | * should RAZ/WI or bus error |
23 | + bool need_fpst = true; | 21 | + * + named GPIO output "nsc_cfg" whose value tracks the NSCCFG register value |
24 | int rmode; | 22 | * Controlling the 2 APB PPCs in the IoTKit: |
25 | 23 | * + named GPIO outputs apb_ppc0_nonsec[0..2] and apb_ppc1_nonsec | |
26 | if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 24 | * + named GPIO outputs apb_ppc0_ap[0..2] and apb_ppc1_ap |
27 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 25 | @@ -XXX,XX +XXX,XX @@ struct IoTKitSecCtl { |
28 | need_rmode = true; | 26 | |
29 | rmode = FPROUNDING_ZERO; | 27 | /*< public >*/ |
28 | qemu_irq sec_resp_cfg; | ||
29 | + qemu_irq nsc_cfg_irq; | ||
30 | |||
31 | MemoryRegion s_regs; | ||
32 | MemoryRegion ns_regs; | ||
33 | @@ -XXX,XX +XXX,XX @@ struct IoTKitSecCtl { | ||
34 | uint32_t secppcintstat; | ||
35 | uint32_t secppcinten; | ||
36 | uint32_t secrespcfg; | ||
37 | + uint32_t nsccfg; | ||
38 | + uint32_t brginten; | ||
39 | |||
40 | IoTKitSecCtlPPC apb[IOTS_NUM_APB_PPC]; | ||
41 | IoTKitSecCtlPPC apbexp[IOTS_NUM_APB_EXP_PPC]; | ||
42 | diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c | ||
43 | index XXXXXXX..XXXXXXX 100644 | ||
44 | --- a/hw/misc/iotkit-secctl.c | ||
45 | +++ b/hw/misc/iotkit-secctl.c | ||
46 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
47 | case A_SECRESPCFG: | ||
48 | r = s->secrespcfg; | ||
30 | break; | 49 | break; |
31 | + case 0x2f: /* FABS */ | 50 | + case A_NSCCFG: |
32 | + case 0x6f: /* FNEG */ | 51 | + r = s->nsccfg; |
33 | + need_fpst = false; | ||
34 | + break; | 52 | + break; |
35 | default: | 53 | case A_SECPPCINTSTAT: |
36 | fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop); | 54 | r = s->secppcintstat; |
37 | g_assert_not_reached(); | 55 | break; |
38 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 56 | case A_SECPPCINTEN: |
39 | return; | 57 | r = s->secppcinten; |
58 | break; | ||
59 | + case A_BRGINTSTAT: | ||
60 | + /* QEMU's bus fabric can never report errors as it doesn't buffer | ||
61 | + * writes, so we never report bridge interrupts. | ||
62 | + */ | ||
63 | + r = 0; | ||
64 | + break; | ||
65 | + case A_BRGINTEN: | ||
66 | + r = s->brginten; | ||
67 | + break; | ||
68 | case A_AHBNSPPCEXP0: | ||
69 | case A_AHBNSPPCEXP1: | ||
70 | case A_AHBNSPPCEXP2: | ||
71 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr, | ||
72 | case A_APBSPPPCEXP3: | ||
73 | r = s->apbexp[offset_to_ppc_idx(offset)].sp; | ||
74 | break; | ||
75 | - case A_NSCCFG: | ||
76 | case A_SECMPCINTSTATUS: | ||
77 | case A_SECMSCINTSTAT: | ||
78 | case A_SECMSCINTEN: | ||
79 | - case A_BRGINTSTAT: | ||
80 | - case A_BRGINTEN: | ||
81 | case A_NSMSCEXP: | ||
82 | qemu_log_mask(LOG_UNIMP, | ||
83 | "IoTKit SecCtl S block read: " | ||
84 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
40 | } | 85 | } |
41 | 86 | ||
42 | - if (need_rmode) { | 87 | switch (offset) { |
43 | + if (need_rmode || need_fpst) { | 88 | + case A_NSCCFG: |
44 | tcg_fpstatus = get_fpstatus_ptr(true); | 89 | + s->nsccfg = value & 3; |
90 | + qemu_set_irq(s->nsc_cfg_irq, s->nsccfg); | ||
91 | + break; | ||
92 | case A_SECRESPCFG: | ||
93 | value &= 1; | ||
94 | s->secrespcfg = value; | ||
95 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
96 | s->secppcinten = value & 0x00f000f3; | ||
97 | foreach_ppc(s, iotkit_secctl_ppc_update_irq_enable); | ||
98 | break; | ||
99 | + case A_BRGINTCLR: | ||
100 | + break; | ||
101 | + case A_BRGINTEN: | ||
102 | + s->brginten = value & 0xffff0000; | ||
103 | + break; | ||
104 | case A_AHBNSPPCEXP0: | ||
105 | case A_AHBNSPPCEXP1: | ||
106 | case A_AHBNSPPCEXP2: | ||
107 | @@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr, | ||
108 | ppc = &s->apbexp[offset_to_ppc_idx(offset)]; | ||
109 | iotkit_secctl_ppc_sp_write(ppc, value); | ||
110 | break; | ||
111 | - case A_NSCCFG: | ||
112 | case A_SECMSCINTCLR: | ||
113 | case A_SECMSCINTEN: | ||
114 | - case A_BRGINTCLR: | ||
115 | - case A_BRGINTEN: | ||
116 | qemu_log_mask(LOG_UNIMP, | ||
117 | "IoTKit SecCtl S block write: " | ||
118 | "unimplemented offset 0x%x\n", offset); | ||
119 | @@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_reset(DeviceState *dev) | ||
120 | s->secppcintstat = 0; | ||
121 | s->secppcinten = 0; | ||
122 | s->secrespcfg = 0; | ||
123 | + s->nsccfg = 0; | ||
124 | + s->brginten = 0; | ||
125 | |||
126 | foreach_ppc(s, iotkit_secctl_reset_ppc); | ||
127 | } | ||
128 | @@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_init(Object *obj) | ||
45 | } | 129 | } |
46 | 130 | ||
47 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 131 | qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1); |
48 | case 0x7b: /* FCVTZU */ | 132 | + qdev_init_gpio_out_named(dev, &s->nsc_cfg_irq, "nsc_cfg", 1); |
49 | gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus); | 133 | |
50 | break; | 134 | memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops, |
51 | + case 0x6f: /* FNEG */ | 135 | s, "iotkit-secctl-s-regs", 0x1000); |
52 | + tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | 136 | @@ -XXX,XX +XXX,XX @@ static const VMStateDescription iotkit_secctl_vmstate = { |
53 | + break; | 137 | VMSTATE_UINT32(secppcintstat, IoTKitSecCtl), |
54 | default: | 138 | VMSTATE_UINT32(secppcinten, IoTKitSecCtl), |
55 | g_assert_not_reached(); | 139 | VMSTATE_UINT32(secrespcfg, IoTKitSecCtl), |
56 | } | 140 | + VMSTATE_UINT32(nsccfg, IoTKitSecCtl), |
57 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 141 | + VMSTATE_UINT32(brginten, IoTKitSecCtl), |
58 | case 0x59: /* FRINTX */ | 142 | VMSTATE_STRUCT_ARRAY(apb, IoTKitSecCtl, IOTS_NUM_APB_PPC, 1, |
59 | gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, tcg_fpstatus); | 143 | iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC), |
60 | break; | 144 | VMSTATE_STRUCT_ARRAY(apbexp, IoTKitSecCtl, IOTS_NUM_APB_EXP_PPC, 1, |
61 | + case 0x2f: /* FABS */ | ||
62 | + tcg_gen_andi_i32(tcg_res, tcg_op, 0x7fff); | ||
63 | + break; | ||
64 | + case 0x6f: /* FNEG */ | ||
65 | + tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | ||
66 | + break; | ||
67 | default: | ||
68 | g_assert_not_reached(); | ||
69 | } | ||
70 | -- | 145 | -- |
71 | 2.16.2 | 146 | 2.16.2 |
72 | 147 | ||
73 | 148 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Model the Arm IoT Kit documented in |
---|---|---|---|
2 | http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html | ||
2 | 3 | ||
3 | This adds the full range of half-precision floating point to integral | 4 | The Arm IoT Kit is a subsystem which includes a CPU and some devices, |
4 | instructions. | 5 | and is intended be extended by adding extra devices to form a |
6 | complete system. It is used in the MPS2 board's AN505 image for the | ||
7 | Cortex-M33. | ||
5 | 8 | ||
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 10 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20180227143852.11175-18-alex.bennee@linaro.org | 11 | Message-id: 20180220180325.29818-19-peter.maydell@linaro.org |
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
10 | --- | 12 | --- |
11 | target/arm/helper-a64.h | 2 + | 13 | hw/arm/Makefile.objs | 1 + |
12 | target/arm/helper-a64.c | 22 ++++++++ | 14 | include/hw/arm/iotkit.h | 109 ++++++++ |
13 | target/arm/translate-a64.c | 123 +++++++++++++++++++++++++++++++++++++++++++-- | 15 | hw/arm/iotkit.c | 598 ++++++++++++++++++++++++++++++++++++++++ |
14 | 3 files changed, 142 insertions(+), 5 deletions(-) | 16 | default-configs/arm-softmmu.mak | 1 + |
17 | 4 files changed, 709 insertions(+) | ||
18 | create mode 100644 include/hw/arm/iotkit.h | ||
19 | create mode 100644 hw/arm/iotkit.c | ||
15 | 20 | ||
16 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 21 | diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs |
17 | index XXXXXXX..XXXXXXX 100644 | 22 | index XXXXXXX..XXXXXXX 100644 |
18 | --- a/target/arm/helper-a64.h | 23 | --- a/hw/arm/Makefile.objs |
19 | +++ b/target/arm/helper-a64.h | 24 | +++ b/hw/arm/Makefile.objs |
20 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_maxnum2h, i32, i32, i32, ptr) | 25 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_FSL_IMX6) += fsl-imx6.o sabrelite.o |
21 | DEF_HELPER_3(advsimd_minnum2h, i32, i32, i32, ptr) | 26 | obj-$(CONFIG_ASPEED_SOC) += aspeed_soc.o aspeed.o |
22 | DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr) | 27 | obj-$(CONFIG_MPS2) += mps2.o |
23 | DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr) | 28 | obj-$(CONFIG_MSF2) += msf2-soc.o msf2-som.o |
24 | +DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr) | 29 | +obj-$(CONFIG_IOTKIT) += iotkit.o |
25 | +DEF_HELPER_2(advsimd_rinth, f16, f16, ptr) | 30 | diff --git a/include/hw/arm/iotkit.h b/include/hw/arm/iotkit.h |
26 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 31 | new file mode 100644 |
27 | index XXXXXXX..XXXXXXX 100644 | 32 | index XXXXXXX..XXXXXXX |
28 | --- a/target/arm/helper-a64.c | 33 | --- /dev/null |
29 | +++ b/target/arm/helper-a64.c | 34 | +++ b/include/hw/arm/iotkit.h |
30 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(advsimd_acgt_f16)(float16 a, float16 b, void *fpstp) | 35 | @@ -XXX,XX +XXX,XX @@ |
31 | int compare = float16_compare(f0, f1, fpst); | 36 | +/* |
32 | return ADVSIMD_CMPRES(compare == float_relation_greater); | 37 | + * ARM IoT Kit |
33 | } | 38 | + * |
34 | + | 39 | + * Copyright (c) 2018 Linaro Limited |
35 | +/* round to integral */ | 40 | + * Written by Peter Maydell |
36 | +float16 HELPER(advsimd_rinth_exact)(float16 x, void *fp_status) | 41 | + * |
37 | +{ | 42 | + * This program is free software; you can redistribute it and/or modify |
38 | + return float16_round_to_int(x, fp_status); | 43 | + * it under the terms of the GNU General Public License version 2 or |
39 | +} | 44 | + * (at your option) any later version. |
40 | + | 45 | + */ |
41 | +float16 HELPER(advsimd_rinth)(float16 x, void *fp_status) | 46 | + |
42 | +{ | 47 | +/* This is a model of the Arm IoT Kit which is documented in |
43 | + int old_flags = get_float_exception_flags(fp_status), new_flags; | 48 | + * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html |
44 | + float16 ret; | 49 | + * It contains: |
45 | + | 50 | + * a Cortex-M33 |
46 | + ret = float16_round_to_int(x, fp_status); | 51 | + * the IDAU |
47 | + | 52 | + * some timers and watchdogs |
48 | + /* Suppress any inexact exceptions the conversion produced */ | 53 | + * two peripheral protection controllers |
49 | + if (!(old_flags & float_flag_inexact)) { | 54 | + * a memory protection controller |
50 | + new_flags = get_float_exception_flags(fp_status); | 55 | + * a security controller |
51 | + set_float_exception_flags(new_flags & ~float_flag_inexact, fp_status); | 56 | + * a bus fabric which arranges that some parts of the address |
52 | + } | 57 | + * space are secure and non-secure aliases of each other |
53 | + | 58 | + * |
54 | + return ret; | 59 | + * QEMU interface: |
55 | +} | 60 | + * + QOM property "memory" is a MemoryRegion containing the devices provided |
56 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 61 | + * by the board model. |
57 | index XXXXXXX..XXXXXXX 100644 | 62 | + * + QOM property "MAINCLK" is the frequency of the main system clock |
58 | --- a/target/arm/translate-a64.c | 63 | + * + QOM property "EXP_NUMIRQ" sets the number of expansion interrupts |
59 | +++ b/target/arm/translate-a64.c | 64 | + * + Named GPIO inputs "EXP_IRQ" 0..n are the expansion interrupts, which |
60 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn) | 65 | + * are wired to the NVIC lines 32 .. n+32 |
61 | */ | 66 | + * Controlling up to 4 AHB expansion PPBs which a system using the IoTKit |
62 | static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 67 | + * might provide: |
63 | { | 68 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_nonsec[0..15] |
64 | - int fpop, opcode, a; | 69 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_ap[0..15] |
65 | + int fpop, opcode, a, u; | 70 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_enable |
66 | + int rn, rd; | 71 | + * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_clear |
67 | + bool is_q; | 72 | + * + named GPIO inputs apb_ppcexp{0,1,2,3}_irq_status |
68 | + bool is_scalar; | 73 | + * Controlling each of the 4 expansion AHB PPCs which a system using the IoTKit |
69 | + bool only_in_vector = false; | 74 | + * might provide: |
70 | + | 75 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_nonsec[0..15] |
71 | + int pass; | 76 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_ap[0..15] |
72 | + TCGv_i32 tcg_rmode = NULL; | 77 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_enable |
73 | + TCGv_ptr tcg_fpstatus = NULL; | 78 | + * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_clear |
74 | + bool need_rmode = false; | 79 | + * + named GPIO inputs ahb_ppcexp{0,1,2,3}_irq_status |
75 | + int rmode; | 80 | + */ |
76 | 81 | + | |
77 | if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 82 | +#ifndef IOTKIT_H |
78 | unallocated_encoding(s); | 83 | +#define IOTKIT_H |
79 | return; | 84 | + |
80 | } | 85 | +#include "hw/sysbus.h" |
81 | 86 | +#include "hw/arm/armv7m.h" | |
82 | - if (!fp_access_check(s)) { | 87 | +#include "hw/misc/iotkit-secctl.h" |
83 | - return; | 88 | +#include "hw/misc/tz-ppc.h" |
84 | - } | 89 | +#include "hw/timer/cmsdk-apb-timer.h" |
85 | + rd = extract32(insn, 0, 5); | 90 | +#include "hw/misc/unimp.h" |
86 | + rn = extract32(insn, 5, 5); | 91 | +#include "hw/or-irq.h" |
87 | 92 | +#include "hw/core/split-irq.h" | |
88 | - opcode = extract32(insn, 12, 4); | 93 | + |
89 | a = extract32(insn, 23, 1); | 94 | +#define TYPE_IOTKIT "iotkit" |
90 | + u = extract32(insn, 29, 1); | 95 | +#define IOTKIT(obj) OBJECT_CHECK(IoTKit, (obj), TYPE_IOTKIT) |
91 | + is_scalar = extract32(insn, 28, 1); | 96 | + |
92 | + is_q = extract32(insn, 30, 1); | 97 | +/* We have an IRQ splitter and an OR gate input for each external PPC |
93 | + | 98 | + * and the 2 internal PPCs |
94 | + opcode = extract32(insn, 12, 5); | 99 | + */ |
95 | fpop = deposit32(opcode, 5, 1, a); | 100 | +#define NUM_EXTERNAL_PPCS (IOTS_NUM_AHB_EXP_PPC + IOTS_NUM_APB_EXP_PPC) |
96 | + fpop = deposit32(fpop, 6, 1, u); | 101 | +#define NUM_PPCS (NUM_EXTERNAL_PPCS + 2) |
97 | 102 | + | |
98 | switch (fpop) { | 103 | +typedef struct IoTKit { |
99 | + case 0x18: /* FRINTN */ | 104 | + /*< private >*/ |
100 | + need_rmode = true; | 105 | + SysBusDevice parent_obj; |
101 | + only_in_vector = true; | 106 | + |
102 | + rmode = FPROUNDING_TIEEVEN; | 107 | + /*< public >*/ |
103 | + break; | 108 | + ARMv7MState armv7m; |
104 | + case 0x19: /* FRINTM */ | 109 | + IoTKitSecCtl secctl; |
105 | + need_rmode = true; | 110 | + TZPPC apb_ppc0; |
106 | + only_in_vector = true; | 111 | + TZPPC apb_ppc1; |
107 | + rmode = FPROUNDING_NEGINF; | 112 | + CMSDKAPBTIMER timer0; |
108 | + break; | 113 | + CMSDKAPBTIMER timer1; |
109 | + case 0x38: /* FRINTP */ | 114 | + qemu_or_irq ppc_irq_orgate; |
110 | + need_rmode = true; | 115 | + SplitIRQ sec_resp_splitter; |
111 | + only_in_vector = true; | 116 | + SplitIRQ ppc_irq_splitter[NUM_PPCS]; |
112 | + rmode = FPROUNDING_POSINF; | 117 | + |
113 | + break; | 118 | + UnimplementedDeviceState dualtimer; |
114 | + case 0x39: /* FRINTZ */ | 119 | + UnimplementedDeviceState s32ktimer; |
115 | + need_rmode = true; | 120 | + |
116 | + only_in_vector = true; | 121 | + MemoryRegion container; |
117 | + rmode = FPROUNDING_ZERO; | 122 | + MemoryRegion alias1; |
118 | + break; | 123 | + MemoryRegion alias2; |
119 | + case 0x58: /* FRINTA */ | 124 | + MemoryRegion alias3; |
120 | + need_rmode = true; | 125 | + MemoryRegion sram0; |
121 | + only_in_vector = true; | 126 | + |
122 | + rmode = FPROUNDING_TIEAWAY; | 127 | + qemu_irq *exp_irqs; |
123 | + break; | 128 | + qemu_irq ppc0_irq; |
124 | + case 0x59: /* FRINTX */ | 129 | + qemu_irq ppc1_irq; |
125 | + case 0x79: /* FRINTI */ | 130 | + qemu_irq sec_resp_cfg; |
126 | + only_in_vector = true; | 131 | + qemu_irq sec_resp_cfg_in; |
127 | + /* current rounding mode */ | 132 | + qemu_irq nsc_cfg_in; |
128 | + break; | 133 | + |
129 | default: | 134 | + qemu_irq irq_status_in[NUM_EXTERNAL_PPCS]; |
130 | fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop); | 135 | + |
131 | g_assert_not_reached(); | 136 | + uint32_t nsccfg; |
132 | } | 137 | + |
133 | 138 | + /* Properties */ | |
134 | + | 139 | + MemoryRegion *board_memory; |
135 | + /* Check additional constraints for the scalar encoding */ | 140 | + uint32_t exp_numirq; |
136 | + if (is_scalar) { | 141 | + uint32_t mainclk_frq; |
137 | + if (!is_q) { | 142 | +} IoTKit; |
138 | + unallocated_encoding(s); | 143 | + |
144 | +#endif | ||
145 | diff --git a/hw/arm/iotkit.c b/hw/arm/iotkit.c | ||
146 | new file mode 100644 | ||
147 | index XXXXXXX..XXXXXXX | ||
148 | --- /dev/null | ||
149 | +++ b/hw/arm/iotkit.c | ||
150 | @@ -XXX,XX +XXX,XX @@ | ||
151 | +/* | ||
152 | + * Arm IoT Kit | ||
153 | + * | ||
154 | + * Copyright (c) 2018 Linaro Limited | ||
155 | + * Written by Peter Maydell | ||
156 | + * | ||
157 | + * This program is free software; you can redistribute it and/or modify | ||
158 | + * it under the terms of the GNU General Public License version 2 or | ||
159 | + * (at your option) any later version. | ||
160 | + */ | ||
161 | + | ||
162 | +#include "qemu/osdep.h" | ||
163 | +#include "qemu/log.h" | ||
164 | +#include "qapi/error.h" | ||
165 | +#include "trace.h" | ||
166 | +#include "hw/sysbus.h" | ||
167 | +#include "hw/registerfields.h" | ||
168 | +#include "hw/arm/iotkit.h" | ||
169 | +#include "hw/misc/unimp.h" | ||
170 | +#include "hw/arm/arm.h" | ||
171 | + | ||
172 | +/* Create an alias region of @size bytes starting at @base | ||
173 | + * which mirrors the memory starting at @orig. | ||
174 | + */ | ||
175 | +static void make_alias(IoTKit *s, MemoryRegion *mr, const char *name, | ||
176 | + hwaddr base, hwaddr size, hwaddr orig) | ||
177 | +{ | ||
178 | + memory_region_init_alias(mr, NULL, name, &s->container, orig, size); | ||
179 | + /* The alias is even lower priority than unimplemented_device regions */ | ||
180 | + memory_region_add_subregion_overlap(&s->container, base, mr, -1500); | ||
181 | +} | ||
182 | + | ||
183 | +static void init_sysbus_child(Object *parent, const char *childname, | ||
184 | + void *child, size_t childsize, | ||
185 | + const char *childtype) | ||
186 | +{ | ||
187 | + object_initialize(child, childsize, childtype); | ||
188 | + object_property_add_child(parent, childname, OBJECT(child), &error_abort); | ||
189 | + qdev_set_parent_bus(DEVICE(child), sysbus_get_default()); | ||
190 | +} | ||
191 | + | ||
192 | +static void irq_status_forwarder(void *opaque, int n, int level) | ||
193 | +{ | ||
194 | + qemu_irq destirq = opaque; | ||
195 | + | ||
196 | + qemu_set_irq(destirq, level); | ||
197 | +} | ||
198 | + | ||
199 | +static void nsccfg_handler(void *opaque, int n, int level) | ||
200 | +{ | ||
201 | + IoTKit *s = IOTKIT(opaque); | ||
202 | + | ||
203 | + s->nsccfg = level; | ||
204 | +} | ||
205 | + | ||
206 | +static void iotkit_forward_ppc(IoTKit *s, const char *ppcname, int ppcnum) | ||
207 | +{ | ||
208 | + /* Each of the 4 AHB and 4 APB PPCs that might be present in a | ||
209 | + * system using the IoTKit has a collection of control lines which | ||
210 | + * are provided by the security controller and which we want to | ||
211 | + * expose as control lines on the IoTKit device itself, so the | ||
212 | + * code using the IoTKit can wire them up to the PPCs. | ||
213 | + */ | ||
214 | + SplitIRQ *splitter = &s->ppc_irq_splitter[ppcnum]; | ||
215 | + DeviceState *iotkitdev = DEVICE(s); | ||
216 | + DeviceState *dev_secctl = DEVICE(&s->secctl); | ||
217 | + DeviceState *dev_splitter = DEVICE(splitter); | ||
218 | + char *name; | ||
219 | + | ||
220 | + name = g_strdup_printf("%s_nonsec", ppcname); | ||
221 | + qdev_pass_gpios(dev_secctl, iotkitdev, name); | ||
222 | + g_free(name); | ||
223 | + name = g_strdup_printf("%s_ap", ppcname); | ||
224 | + qdev_pass_gpios(dev_secctl, iotkitdev, name); | ||
225 | + g_free(name); | ||
226 | + name = g_strdup_printf("%s_irq_enable", ppcname); | ||
227 | + qdev_pass_gpios(dev_secctl, iotkitdev, name); | ||
228 | + g_free(name); | ||
229 | + name = g_strdup_printf("%s_irq_clear", ppcname); | ||
230 | + qdev_pass_gpios(dev_secctl, iotkitdev, name); | ||
231 | + g_free(name); | ||
232 | + | ||
233 | + /* irq_status is a little more tricky, because we need to | ||
234 | + * split it so we can send it both to the security controller | ||
235 | + * and to our OR gate for the NVIC interrupt line. | ||
236 | + * Connect up the splitter's outputs, and create a GPIO input | ||
237 | + * which will pass the line state to the input splitter. | ||
238 | + */ | ||
239 | + name = g_strdup_printf("%s_irq_status", ppcname); | ||
240 | + qdev_connect_gpio_out(dev_splitter, 0, | ||
241 | + qdev_get_gpio_in_named(dev_secctl, | ||
242 | + name, 0)); | ||
243 | + qdev_connect_gpio_out(dev_splitter, 1, | ||
244 | + qdev_get_gpio_in(DEVICE(&s->ppc_irq_orgate), ppcnum)); | ||
245 | + s->irq_status_in[ppcnum] = qdev_get_gpio_in(dev_splitter, 0); | ||
246 | + qdev_init_gpio_in_named_with_opaque(iotkitdev, irq_status_forwarder, | ||
247 | + s->irq_status_in[ppcnum], name, 1); | ||
248 | + g_free(name); | ||
249 | +} | ||
250 | + | ||
251 | +static void iotkit_forward_sec_resp_cfg(IoTKit *s) | ||
252 | +{ | ||
253 | + /* Forward the 3rd output from the splitter device as a | ||
254 | + * named GPIO output of the iotkit object. | ||
255 | + */ | ||
256 | + DeviceState *dev = DEVICE(s); | ||
257 | + DeviceState *dev_splitter = DEVICE(&s->sec_resp_splitter); | ||
258 | + | ||
259 | + qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1); | ||
260 | + s->sec_resp_cfg_in = qemu_allocate_irq(irq_status_forwarder, | ||
261 | + s->sec_resp_cfg, 1); | ||
262 | + qdev_connect_gpio_out(dev_splitter, 2, s->sec_resp_cfg_in); | ||
263 | +} | ||
264 | + | ||
265 | +static void iotkit_init(Object *obj) | ||
266 | +{ | ||
267 | + IoTKit *s = IOTKIT(obj); | ||
268 | + int i; | ||
269 | + | ||
270 | + memory_region_init(&s->container, obj, "iotkit-container", UINT64_MAX); | ||
271 | + | ||
272 | + init_sysbus_child(obj, "armv7m", &s->armv7m, sizeof(s->armv7m), | ||
273 | + TYPE_ARMV7M); | ||
274 | + qdev_prop_set_string(DEVICE(&s->armv7m), "cpu-type", | ||
275 | + ARM_CPU_TYPE_NAME("cortex-m33")); | ||
276 | + | ||
277 | + init_sysbus_child(obj, "secctl", &s->secctl, sizeof(s->secctl), | ||
278 | + TYPE_IOTKIT_SECCTL); | ||
279 | + init_sysbus_child(obj, "apb-ppc0", &s->apb_ppc0, sizeof(s->apb_ppc0), | ||
280 | + TYPE_TZ_PPC); | ||
281 | + init_sysbus_child(obj, "apb-ppc1", &s->apb_ppc1, sizeof(s->apb_ppc1), | ||
282 | + TYPE_TZ_PPC); | ||
283 | + init_sysbus_child(obj, "timer0", &s->timer0, sizeof(s->timer0), | ||
284 | + TYPE_CMSDK_APB_TIMER); | ||
285 | + init_sysbus_child(obj, "timer1", &s->timer1, sizeof(s->timer1), | ||
286 | + TYPE_CMSDK_APB_TIMER); | ||
287 | + init_sysbus_child(obj, "dualtimer", &s->dualtimer, sizeof(s->dualtimer), | ||
288 | + TYPE_UNIMPLEMENTED_DEVICE); | ||
289 | + object_initialize(&s->ppc_irq_orgate, sizeof(s->ppc_irq_orgate), | ||
290 | + TYPE_OR_IRQ); | ||
291 | + object_property_add_child(obj, "ppc-irq-orgate", | ||
292 | + OBJECT(&s->ppc_irq_orgate), &error_abort); | ||
293 | + object_initialize(&s->sec_resp_splitter, sizeof(s->sec_resp_splitter), | ||
294 | + TYPE_SPLIT_IRQ); | ||
295 | + object_property_add_child(obj, "sec-resp-splitter", | ||
296 | + OBJECT(&s->sec_resp_splitter), &error_abort); | ||
297 | + for (i = 0; i < ARRAY_SIZE(s->ppc_irq_splitter); i++) { | ||
298 | + char *name = g_strdup_printf("ppc-irq-splitter-%d", i); | ||
299 | + SplitIRQ *splitter = &s->ppc_irq_splitter[i]; | ||
300 | + | ||
301 | + object_initialize(splitter, sizeof(*splitter), TYPE_SPLIT_IRQ); | ||
302 | + object_property_add_child(obj, name, OBJECT(splitter), &error_abort); | ||
303 | + } | ||
304 | + init_sysbus_child(obj, "s32ktimer", &s->s32ktimer, sizeof(s->s32ktimer), | ||
305 | + TYPE_UNIMPLEMENTED_DEVICE); | ||
306 | +} | ||
307 | + | ||
308 | +static void iotkit_exp_irq(void *opaque, int n, int level) | ||
309 | +{ | ||
310 | + IoTKit *s = IOTKIT(opaque); | ||
311 | + | ||
312 | + qemu_set_irq(s->exp_irqs[n], level); | ||
313 | +} | ||
314 | + | ||
315 | +static void iotkit_realize(DeviceState *dev, Error **errp) | ||
316 | +{ | ||
317 | + IoTKit *s = IOTKIT(dev); | ||
318 | + int i; | ||
319 | + MemoryRegion *mr; | ||
320 | + Error *err = NULL; | ||
321 | + SysBusDevice *sbd_apb_ppc0; | ||
322 | + SysBusDevice *sbd_secctl; | ||
323 | + DeviceState *dev_apb_ppc0; | ||
324 | + DeviceState *dev_apb_ppc1; | ||
325 | + DeviceState *dev_secctl; | ||
326 | + DeviceState *dev_splitter; | ||
327 | + | ||
328 | + if (!s->board_memory) { | ||
329 | + error_setg(errp, "memory property was not set"); | ||
330 | + return; | ||
331 | + } | ||
332 | + | ||
333 | + if (!s->mainclk_frq) { | ||
334 | + error_setg(errp, "MAINCLK property was not set"); | ||
335 | + return; | ||
336 | + } | ||
337 | + | ||
338 | + /* Handling of which devices should be available only to secure | ||
339 | + * code is usually done differently for M profile than for A profile. | ||
340 | + * Instead of putting some devices only into the secure address space, | ||
341 | + * devices exist in both address spaces but with hard-wired security | ||
342 | + * permissions that will cause the CPU to fault for non-secure accesses. | ||
343 | + * | ||
344 | + * The IoTKit has an IDAU (Implementation Defined Access Unit), | ||
345 | + * which specifies hard-wired security permissions for different | ||
346 | + * areas of the physical address space. For the IoTKit IDAU, the | ||
347 | + * top 4 bits of the physical address are the IDAU region ID, and | ||
348 | + * if bit 28 (ie the lowest bit of the ID) is 0 then this is an NS | ||
349 | + * region, otherwise it is an S region. | ||
350 | + * | ||
351 | + * The various devices and RAMs are generally all mapped twice, | ||
352 | + * once into a region that the IDAU defines as secure and once | ||
353 | + * into a non-secure region. They sit behind either a Memory | ||
354 | + * Protection Controller (for RAM) or a Peripheral Protection | ||
355 | + * Controller (for devices), which allow a more fine grained | ||
356 | + * configuration of whether non-secure accesses are permitted. | ||
357 | + * | ||
358 | + * (The other place that guest software can configure security | ||
359 | + * permissions is in the architected SAU (Security Attribution | ||
360 | + * Unit), which is entirely inside the CPU. The IDAU can upgrade | ||
361 | + * the security attributes for a region to more restrictive than | ||
362 | + * the SAU specifies, but cannot downgrade them.) | ||
363 | + * | ||
364 | + * 0x10000000..0x1fffffff alias of 0x00000000..0x0fffffff | ||
365 | + * 0x20000000..0x2007ffff 32KB FPGA block RAM | ||
366 | + * 0x30000000..0x3fffffff alias of 0x20000000..0x2fffffff | ||
367 | + * 0x40000000..0x4000ffff base peripheral region 1 | ||
368 | + * 0x40010000..0x4001ffff CPU peripherals (none for IoTKit) | ||
369 | + * 0x40020000..0x4002ffff system control element peripherals | ||
370 | + * 0x40080000..0x400fffff base peripheral region 2 | ||
371 | + * 0x50000000..0x5fffffff alias of 0x40000000..0x4fffffff | ||
372 | + */ | ||
373 | + | ||
374 | + memory_region_add_subregion_overlap(&s->container, 0, s->board_memory, -1); | ||
375 | + | ||
376 | + qdev_prop_set_uint32(DEVICE(&s->armv7m), "num-irq", s->exp_numirq + 32); | ||
377 | + /* In real hardware the initial Secure VTOR is set from the INITSVTOR0 | ||
378 | + * register in the IoT Kit System Control Register block, and the | ||
379 | + * initial value of that is in turn specifiable by the FPGA that | ||
380 | + * instantiates the IoT Kit. In QEMU we don't implement this wrinkle, | ||
381 | + * and simply set the CPU's init-svtor to the IoT Kit default value. | ||
382 | + */ | ||
383 | + qdev_prop_set_uint32(DEVICE(&s->armv7m), "init-svtor", 0x10000000); | ||
384 | + object_property_set_link(OBJECT(&s->armv7m), OBJECT(&s->container), | ||
385 | + "memory", &err); | ||
386 | + if (err) { | ||
387 | + error_propagate(errp, err); | ||
388 | + return; | ||
389 | + } | ||
390 | + object_property_set_link(OBJECT(&s->armv7m), OBJECT(s), "idau", &err); | ||
391 | + if (err) { | ||
392 | + error_propagate(errp, err); | ||
393 | + return; | ||
394 | + } | ||
395 | + object_property_set_bool(OBJECT(&s->armv7m), true, "realized", &err); | ||
396 | + if (err) { | ||
397 | + error_propagate(errp, err); | ||
398 | + return; | ||
399 | + } | ||
400 | + | ||
401 | + /* Connect our EXP_IRQ GPIOs to the NVIC's lines 32 and up. */ | ||
402 | + s->exp_irqs = g_new(qemu_irq, s->exp_numirq); | ||
403 | + for (i = 0; i < s->exp_numirq; i++) { | ||
404 | + s->exp_irqs[i] = qdev_get_gpio_in(DEVICE(&s->armv7m), i + 32); | ||
405 | + } | ||
406 | + qdev_init_gpio_in_named(dev, iotkit_exp_irq, "EXP_IRQ", s->exp_numirq); | ||
407 | + | ||
408 | + /* Set up the big aliases first */ | ||
409 | + make_alias(s, &s->alias1, "alias 1", 0x10000000, 0x10000000, 0x00000000); | ||
410 | + make_alias(s, &s->alias2, "alias 2", 0x30000000, 0x10000000, 0x20000000); | ||
411 | + /* The 0x50000000..0x5fffffff region is not a pure alias: it has | ||
412 | + * a few extra devices that only appear there (generally the | ||
413 | + * control interfaces for the protection controllers). | ||
414 | + * We implement this by mapping those devices over the top of this | ||
415 | + * alias MR at a higher priority. | ||
416 | + */ | ||
417 | + make_alias(s, &s->alias3, "alias 3", 0x50000000, 0x10000000, 0x40000000); | ||
418 | + | ||
419 | + /* This RAM should be behind a Memory Protection Controller, but we | ||
420 | + * don't implement that yet. | ||
421 | + */ | ||
422 | + memory_region_init_ram(&s->sram0, NULL, "iotkit.sram0", 0x00008000, &err); | ||
423 | + if (err) { | ||
424 | + error_propagate(errp, err); | ||
425 | + return; | ||
426 | + } | ||
427 | + memory_region_add_subregion(&s->container, 0x20000000, &s->sram0); | ||
428 | + | ||
429 | + /* Security controller */ | ||
430 | + object_property_set_bool(OBJECT(&s->secctl), true, "realized", &err); | ||
431 | + if (err) { | ||
432 | + error_propagate(errp, err); | ||
433 | + return; | ||
434 | + } | ||
435 | + sbd_secctl = SYS_BUS_DEVICE(&s->secctl); | ||
436 | + dev_secctl = DEVICE(&s->secctl); | ||
437 | + sysbus_mmio_map(sbd_secctl, 0, 0x50080000); | ||
438 | + sysbus_mmio_map(sbd_secctl, 1, 0x40080000); | ||
439 | + | ||
440 | + s->nsc_cfg_in = qemu_allocate_irq(nsccfg_handler, s, 1); | ||
441 | + qdev_connect_gpio_out_named(dev_secctl, "nsc_cfg", 0, s->nsc_cfg_in); | ||
442 | + | ||
443 | + /* The sec_resp_cfg output from the security controller must be split into | ||
444 | + * multiple lines, one for each of the PPCs within the IoTKit and one | ||
445 | + * that will be an output from the IoTKit to the system. | ||
446 | + */ | ||
447 | + object_property_set_int(OBJECT(&s->sec_resp_splitter), 3, | ||
448 | + "num-lines", &err); | ||
449 | + if (err) { | ||
450 | + error_propagate(errp, err); | ||
451 | + return; | ||
452 | + } | ||
453 | + object_property_set_bool(OBJECT(&s->sec_resp_splitter), true, | ||
454 | + "realized", &err); | ||
455 | + if (err) { | ||
456 | + error_propagate(errp, err); | ||
457 | + return; | ||
458 | + } | ||
459 | + dev_splitter = DEVICE(&s->sec_resp_splitter); | ||
460 | + qdev_connect_gpio_out_named(dev_secctl, "sec_resp_cfg", 0, | ||
461 | + qdev_get_gpio_in(dev_splitter, 0)); | ||
462 | + | ||
463 | + /* Devices behind APB PPC0: | ||
464 | + * 0x40000000: timer0 | ||
465 | + * 0x40001000: timer1 | ||
466 | + * 0x40002000: dual timer | ||
467 | + * We must configure and realize each downstream device and connect | ||
468 | + * it to the appropriate PPC port; then we can realize the PPC and | ||
469 | + * map its upstream ends to the right place in the container. | ||
470 | + */ | ||
471 | + qdev_prop_set_uint32(DEVICE(&s->timer0), "pclk-frq", s->mainclk_frq); | ||
472 | + object_property_set_bool(OBJECT(&s->timer0), true, "realized", &err); | ||
473 | + if (err) { | ||
474 | + error_propagate(errp, err); | ||
475 | + return; | ||
476 | + } | ||
477 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer0), 0, | ||
478 | + qdev_get_gpio_in(DEVICE(&s->armv7m), 3)); | ||
479 | + mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->timer0), 0); | ||
480 | + object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[0]", &err); | ||
481 | + if (err) { | ||
482 | + error_propagate(errp, err); | ||
483 | + return; | ||
484 | + } | ||
485 | + | ||
486 | + qdev_prop_set_uint32(DEVICE(&s->timer1), "pclk-frq", s->mainclk_frq); | ||
487 | + object_property_set_bool(OBJECT(&s->timer1), true, "realized", &err); | ||
488 | + if (err) { | ||
489 | + error_propagate(errp, err); | ||
490 | + return; | ||
491 | + } | ||
492 | + sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer1), 0, | ||
493 | + qdev_get_gpio_in(DEVICE(&s->armv7m), 3)); | ||
494 | + mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->timer1), 0); | ||
495 | + object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[1]", &err); | ||
496 | + if (err) { | ||
497 | + error_propagate(errp, err); | ||
498 | + return; | ||
499 | + } | ||
500 | + | ||
501 | + qdev_prop_set_string(DEVICE(&s->dualtimer), "name", "Dual timer"); | ||
502 | + qdev_prop_set_uint64(DEVICE(&s->dualtimer), "size", 0x1000); | ||
503 | + object_property_set_bool(OBJECT(&s->dualtimer), true, "realized", &err); | ||
504 | + if (err) { | ||
505 | + error_propagate(errp, err); | ||
506 | + return; | ||
507 | + } | ||
508 | + mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->dualtimer), 0); | ||
509 | + object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[2]", &err); | ||
510 | + if (err) { | ||
511 | + error_propagate(errp, err); | ||
512 | + return; | ||
513 | + } | ||
514 | + | ||
515 | + object_property_set_bool(OBJECT(&s->apb_ppc0), true, "realized", &err); | ||
516 | + if (err) { | ||
517 | + error_propagate(errp, err); | ||
518 | + return; | ||
519 | + } | ||
520 | + | ||
521 | + sbd_apb_ppc0 = SYS_BUS_DEVICE(&s->apb_ppc0); | ||
522 | + dev_apb_ppc0 = DEVICE(&s->apb_ppc0); | ||
523 | + | ||
524 | + mr = sysbus_mmio_get_region(sbd_apb_ppc0, 0); | ||
525 | + memory_region_add_subregion(&s->container, 0x40000000, mr); | ||
526 | + mr = sysbus_mmio_get_region(sbd_apb_ppc0, 1); | ||
527 | + memory_region_add_subregion(&s->container, 0x40001000, mr); | ||
528 | + mr = sysbus_mmio_get_region(sbd_apb_ppc0, 2); | ||
529 | + memory_region_add_subregion(&s->container, 0x40002000, mr); | ||
530 | + for (i = 0; i < IOTS_APB_PPC0_NUM_PORTS; i++) { | ||
531 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_nonsec", i, | ||
532 | + qdev_get_gpio_in_named(dev_apb_ppc0, | ||
533 | + "cfg_nonsec", i)); | ||
534 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_ap", i, | ||
535 | + qdev_get_gpio_in_named(dev_apb_ppc0, | ||
536 | + "cfg_ap", i)); | ||
537 | + } | ||
538 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_irq_enable", 0, | ||
539 | + qdev_get_gpio_in_named(dev_apb_ppc0, | ||
540 | + "irq_enable", 0)); | ||
541 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_irq_clear", 0, | ||
542 | + qdev_get_gpio_in_named(dev_apb_ppc0, | ||
543 | + "irq_clear", 0)); | ||
544 | + qdev_connect_gpio_out(dev_splitter, 0, | ||
545 | + qdev_get_gpio_in_named(dev_apb_ppc0, | ||
546 | + "cfg_sec_resp", 0)); | ||
547 | + | ||
548 | + /* All the PPC irq lines (from the 2 internal PPCs and the 8 external | ||
549 | + * ones) are sent individually to the security controller, and also | ||
550 | + * ORed together to give a single combined PPC interrupt to the NVIC. | ||
551 | + */ | ||
552 | + object_property_set_int(OBJECT(&s->ppc_irq_orgate), | ||
553 | + NUM_PPCS, "num-lines", &err); | ||
554 | + if (err) { | ||
555 | + error_propagate(errp, err); | ||
556 | + return; | ||
557 | + } | ||
558 | + object_property_set_bool(OBJECT(&s->ppc_irq_orgate), true, | ||
559 | + "realized", &err); | ||
560 | + if (err) { | ||
561 | + error_propagate(errp, err); | ||
562 | + return; | ||
563 | + } | ||
564 | + qdev_connect_gpio_out(DEVICE(&s->ppc_irq_orgate), 0, | ||
565 | + qdev_get_gpio_in(DEVICE(&s->armv7m), 10)); | ||
566 | + | ||
567 | + /* 0x40010000 .. 0x4001ffff: private CPU region: unused in IoTKit */ | ||
568 | + | ||
569 | + /* 0x40020000 .. 0x4002ffff : IoTKit system control peripheral region */ | ||
570 | + /* Devices behind APB PPC1: | ||
571 | + * 0x4002f000: S32K timer | ||
572 | + */ | ||
573 | + qdev_prop_set_string(DEVICE(&s->s32ktimer), "name", "S32KTIMER"); | ||
574 | + qdev_prop_set_uint64(DEVICE(&s->s32ktimer), "size", 0x1000); | ||
575 | + object_property_set_bool(OBJECT(&s->s32ktimer), true, "realized", &err); | ||
576 | + if (err) { | ||
577 | + error_propagate(errp, err); | ||
578 | + return; | ||
579 | + } | ||
580 | + mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->s32ktimer), 0); | ||
581 | + object_property_set_link(OBJECT(&s->apb_ppc1), OBJECT(mr), "port[0]", &err); | ||
582 | + if (err) { | ||
583 | + error_propagate(errp, err); | ||
584 | + return; | ||
585 | + } | ||
586 | + | ||
587 | + object_property_set_bool(OBJECT(&s->apb_ppc1), true, "realized", &err); | ||
588 | + if (err) { | ||
589 | + error_propagate(errp, err); | ||
590 | + return; | ||
591 | + } | ||
592 | + mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->apb_ppc1), 0); | ||
593 | + memory_region_add_subregion(&s->container, 0x4002f000, mr); | ||
594 | + | ||
595 | + dev_apb_ppc1 = DEVICE(&s->apb_ppc1); | ||
596 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_nonsec", 0, | ||
597 | + qdev_get_gpio_in_named(dev_apb_ppc1, | ||
598 | + "cfg_nonsec", 0)); | ||
599 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_ap", 0, | ||
600 | + qdev_get_gpio_in_named(dev_apb_ppc1, | ||
601 | + "cfg_ap", 0)); | ||
602 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_irq_enable", 0, | ||
603 | + qdev_get_gpio_in_named(dev_apb_ppc1, | ||
604 | + "irq_enable", 0)); | ||
605 | + qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_irq_clear", 0, | ||
606 | + qdev_get_gpio_in_named(dev_apb_ppc1, | ||
607 | + "irq_clear", 0)); | ||
608 | + qdev_connect_gpio_out(dev_splitter, 1, | ||
609 | + qdev_get_gpio_in_named(dev_apb_ppc1, | ||
610 | + "cfg_sec_resp", 0)); | ||
611 | + | ||
612 | + /* Using create_unimplemented_device() maps the stub into the | ||
613 | + * system address space rather than into our container, but the | ||
614 | + * overall effect to the guest is the same. | ||
615 | + */ | ||
616 | + create_unimplemented_device("SYSINFO", 0x40020000, 0x1000); | ||
617 | + | ||
618 | + create_unimplemented_device("SYSCONTROL", 0x50021000, 0x1000); | ||
619 | + create_unimplemented_device("S32KWATCHDOG", 0x5002e000, 0x1000); | ||
620 | + | ||
621 | + /* 0x40080000 .. 0x4008ffff : IoTKit second Base peripheral region */ | ||
622 | + | ||
623 | + create_unimplemented_device("NS watchdog", 0x40081000, 0x1000); | ||
624 | + create_unimplemented_device("S watchdog", 0x50081000, 0x1000); | ||
625 | + | ||
626 | + create_unimplemented_device("SRAM0 MPC", 0x50083000, 0x1000); | ||
627 | + | ||
628 | + for (i = 0; i < ARRAY_SIZE(s->ppc_irq_splitter); i++) { | ||
629 | + Object *splitter = OBJECT(&s->ppc_irq_splitter[i]); | ||
630 | + | ||
631 | + object_property_set_int(splitter, 2, "num-lines", &err); | ||
632 | + if (err) { | ||
633 | + error_propagate(errp, err); | ||
139 | + return; | 634 | + return; |
140 | + } | 635 | + } |
141 | + /* FRINTxx is only in the vector form */ | 636 | + object_property_set_bool(splitter, true, "realized", &err); |
142 | + if (only_in_vector) { | 637 | + if (err) { |
143 | + unallocated_encoding(s); | 638 | + error_propagate(errp, err); |
144 | + return; | 639 | + return; |
145 | + } | 640 | + } |
146 | + } | 641 | + } |
147 | + | 642 | + |
148 | + if (!fp_access_check(s)) { | 643 | + for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) { |
149 | + return; | 644 | + char *ppcname = g_strdup_printf("ahb_ppcexp%d", i); |
150 | + } | 645 | + |
151 | + | 646 | + iotkit_forward_ppc(s, ppcname, i); |
152 | + if (need_rmode) { | 647 | + g_free(ppcname); |
153 | + tcg_fpstatus = get_fpstatus_ptr(true); | 648 | + } |
154 | + } | 649 | + |
155 | + | 650 | + for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) { |
156 | + if (need_rmode) { | 651 | + char *ppcname = g_strdup_printf("apb_ppcexp%d", i); |
157 | + tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | 652 | + |
158 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | 653 | + iotkit_forward_ppc(s, ppcname, i + IOTS_NUM_AHB_EXP_PPC); |
159 | + } | 654 | + g_free(ppcname); |
160 | + | 655 | + } |
161 | + if (is_scalar) { | 656 | + |
162 | + /* no operations yet */ | 657 | + for (i = NUM_EXTERNAL_PPCS; i < NUM_PPCS; i++) { |
163 | + } else { | 658 | + /* Wire up IRQ splitter for internal PPCs */ |
164 | + for (pass = 0; pass < (is_q ? 8 : 4); pass++) { | 659 | + DeviceState *devs = DEVICE(&s->ppc_irq_splitter[i]); |
165 | + TCGv_i32 tcg_op = tcg_temp_new_i32(); | 660 | + char *gpioname = g_strdup_printf("apb_ppc%d_irq_status", |
166 | + TCGv_i32 tcg_res = tcg_temp_new_i32(); | 661 | + i - NUM_EXTERNAL_PPCS); |
167 | + | 662 | + TZPPC *ppc = (i == NUM_EXTERNAL_PPCS) ? &s->apb_ppc0 : &s->apb_ppc1; |
168 | + read_vec_element_i32(s, tcg_op, rn, pass, MO_16); | 663 | + |
169 | + | 664 | + qdev_connect_gpio_out(devs, 0, |
170 | + switch (fpop) { | 665 | + qdev_get_gpio_in_named(dev_secctl, gpioname, 0)); |
171 | + case 0x18: /* FRINTN */ | 666 | + qdev_connect_gpio_out(devs, 1, |
172 | + case 0x19: /* FRINTM */ | 667 | + qdev_get_gpio_in(DEVICE(&s->ppc_irq_orgate), i)); |
173 | + case 0x38: /* FRINTP */ | 668 | + qdev_connect_gpio_out_named(DEVICE(ppc), "irq", 0, |
174 | + case 0x39: /* FRINTZ */ | 669 | + qdev_get_gpio_in(devs, 0)); |
175 | + case 0x58: /* FRINTA */ | 670 | + } |
176 | + case 0x79: /* FRINTI */ | 671 | + |
177 | + gen_helper_advsimd_rinth(tcg_res, tcg_op, tcg_fpstatus); | 672 | + iotkit_forward_sec_resp_cfg(s); |
178 | + break; | 673 | + |
179 | + case 0x59: /* FRINTX */ | 674 | + system_clock_scale = NANOSECONDS_PER_SECOND / s->mainclk_frq; |
180 | + gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, tcg_fpstatus); | 675 | +} |
181 | + break; | 676 | + |
182 | + default: | 677 | +static void iotkit_idau_check(IDAUInterface *ii, uint32_t address, |
183 | + g_assert_not_reached(); | 678 | + int *iregion, bool *exempt, bool *ns, bool *nsc) |
184 | + } | 679 | +{ |
185 | + | 680 | + /* For IoTKit systems the IDAU responses are simple logical functions |
186 | + write_vec_element_i32(s, tcg_res, rd, pass, MO_16); | 681 | + * of the address bits. The NSC attribute is guest-adjustable via the |
187 | + | 682 | + * NSCCFG register in the security controller. |
188 | + tcg_temp_free_i32(tcg_res); | 683 | + */ |
189 | + tcg_temp_free_i32(tcg_op); | 684 | + IoTKit *s = IOTKIT(ii); |
190 | + } | 685 | + int region = extract32(address, 28, 4); |
191 | + | 686 | + |
192 | + clear_vec_high(s, is_q, rd); | 687 | + *ns = !(region & 1); |
193 | + } | 688 | + *nsc = (region == 1 && (s->nsccfg & 1)) || (region == 3 && (s->nsccfg & 2)); |
194 | + | 689 | + /* 0xe0000000..0xe00fffff and 0xf0000000..0xf00fffff are exempt */ |
195 | + if (tcg_rmode) { | 690 | + *exempt = (address & 0xeff00000) == 0xe0000000; |
196 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | 691 | + *iregion = region; |
197 | + tcg_temp_free_i32(tcg_rmode); | 692 | +} |
198 | + } | 693 | + |
199 | + | 694 | +static const VMStateDescription iotkit_vmstate = { |
200 | + if (tcg_fpstatus) { | 695 | + .name = "iotkit", |
201 | + tcg_temp_free_ptr(tcg_fpstatus); | 696 | + .version_id = 1, |
202 | + } | 697 | + .minimum_version_id = 1, |
203 | } | 698 | + .fields = (VMStateField[]) { |
204 | 699 | + VMSTATE_UINT32(nsccfg, IoTKit), | |
205 | /* AdvSIMD scalar x indexed element | 700 | + VMSTATE_END_OF_LIST() |
701 | + } | ||
702 | +}; | ||
703 | + | ||
704 | +static Property iotkit_properties[] = { | ||
705 | + DEFINE_PROP_LINK("memory", IoTKit, board_memory, TYPE_MEMORY_REGION, | ||
706 | + MemoryRegion *), | ||
707 | + DEFINE_PROP_UINT32("EXP_NUMIRQ", IoTKit, exp_numirq, 64), | ||
708 | + DEFINE_PROP_UINT32("MAINCLK", IoTKit, mainclk_frq, 0), | ||
709 | + DEFINE_PROP_END_OF_LIST() | ||
710 | +}; | ||
711 | + | ||
712 | +static void iotkit_reset(DeviceState *dev) | ||
713 | +{ | ||
714 | + IoTKit *s = IOTKIT(dev); | ||
715 | + | ||
716 | + s->nsccfg = 0; | ||
717 | +} | ||
718 | + | ||
719 | +static void iotkit_class_init(ObjectClass *klass, void *data) | ||
720 | +{ | ||
721 | + DeviceClass *dc = DEVICE_CLASS(klass); | ||
722 | + IDAUInterfaceClass *iic = IDAU_INTERFACE_CLASS(klass); | ||
723 | + | ||
724 | + dc->realize = iotkit_realize; | ||
725 | + dc->vmsd = &iotkit_vmstate; | ||
726 | + dc->props = iotkit_properties; | ||
727 | + dc->reset = iotkit_reset; | ||
728 | + iic->check = iotkit_idau_check; | ||
729 | +} | ||
730 | + | ||
731 | +static const TypeInfo iotkit_info = { | ||
732 | + .name = TYPE_IOTKIT, | ||
733 | + .parent = TYPE_SYS_BUS_DEVICE, | ||
734 | + .instance_size = sizeof(IoTKit), | ||
735 | + .instance_init = iotkit_init, | ||
736 | + .class_init = iotkit_class_init, | ||
737 | + .interfaces = (InterfaceInfo[]) { | ||
738 | + { TYPE_IDAU_INTERFACE }, | ||
739 | + { } | ||
740 | + } | ||
741 | +}; | ||
742 | + | ||
743 | +static void iotkit_register_types(void) | ||
744 | +{ | ||
745 | + type_register_static(&iotkit_info); | ||
746 | +} | ||
747 | + | ||
748 | +type_init(iotkit_register_types); | ||
749 | diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak | ||
750 | index XXXXXXX..XXXXXXX 100644 | ||
751 | --- a/default-configs/arm-softmmu.mak | ||
752 | +++ b/default-configs/arm-softmmu.mak | ||
753 | @@ -XXX,XX +XXX,XX @@ CONFIG_MPS2_FPGAIO=y | ||
754 | CONFIG_MPS2_SCC=y | ||
755 | |||
756 | CONFIG_TZ_PPC=y | ||
757 | +CONFIG_IOTKIT=y | ||
758 | CONFIG_IOTKIT_SECCTL=y | ||
759 | |||
760 | CONFIG_VERSATILE_PCI=y | ||
206 | -- | 761 | -- |
207 | 2.16.2 | 762 | 2.16.2 |
208 | 763 | ||
209 | 764 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | Define a new board model for the MPS2 with an AN505 FPGA image |
---|---|---|---|
2 | containing a Cortex-M33. Since the FPGA images for TrustZone | ||
3 | cores (AN505, and the similar AN519 for Cortex-M23) have a | ||
4 | significantly different layout of devices to the non-TrustZone | ||
5 | images, we use a new source file rather than shoehorning them | ||
6 | into the existing mps2.c. | ||
2 | 7 | ||
3 | It looks like the ARM ARM has simplified the pseudo code for the | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
4 | calculation which is done on a fixed point 9 bit integer maths. So | 9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> |
5 | while adding f16 we can also clean this up to be a little less heavy | 10 | Message-id: 20180220180325.29818-20-peter.maydell@linaro.org |
6 | on the floating point and just return the fractional part and leave | 11 | --- |
7 | the calle's to do the final packing of the result. | 12 | hw/arm/Makefile.objs | 1 + |
13 | hw/arm/mps2-tz.c | 503 +++++++++++++++++++++++++++++++++++++++++++++++++++ | ||
14 | 2 files changed, 504 insertions(+) | ||
15 | create mode 100644 hw/arm/mps2-tz.c | ||
8 | 16 | ||
9 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 17 | diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs |
10 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20180227143852.11175-23-alex.bennee@linaro.org | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
13 | --- | ||
14 | target/arm/helper.h | 1 + | ||
15 | target/arm/helper.c | 226 +++++++++++++++++++++++++++++----------------------- | ||
16 | 2 files changed, 129 insertions(+), 98 deletions(-) | ||
17 | |||
18 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
19 | index XXXXXXX..XXXXXXX 100644 | 18 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/helper.h | 19 | --- a/hw/arm/Makefile.objs |
21 | +++ b/target/arm/helper.h | 20 | +++ b/hw/arm/Makefile.objs |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(vfp_muladds, f32, f32, f32, f32, ptr) | 21 | @@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_FSL_IMX31) += fsl-imx31.o kzm.o |
23 | 22 | obj-$(CONFIG_FSL_IMX6) += fsl-imx6.o sabrelite.o | |
24 | DEF_HELPER_3(recps_f32, f32, f32, f32, env) | 23 | obj-$(CONFIG_ASPEED_SOC) += aspeed_soc.o aspeed.o |
25 | DEF_HELPER_3(rsqrts_f32, f32, f32, f32, env) | 24 | obj-$(CONFIG_MPS2) += mps2.o |
26 | +DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr) | 25 | +obj-$(CONFIG_MPS2) += mps2-tz.o |
27 | DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr) | 26 | obj-$(CONFIG_MSF2) += msf2-soc.o msf2-som.o |
28 | DEF_HELPER_FLAGS_2(recpe_f64, TCG_CALL_NO_RWG, f64, f64, ptr) | 27 | obj-$(CONFIG_IOTKIT) += iotkit.o |
29 | DEF_HELPER_FLAGS_2(rsqrte_f32, TCG_CALL_NO_RWG, f32, f32, ptr) | 28 | diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c |
30 | diff --git a/target/arm/helper.c b/target/arm/helper.c | 29 | new file mode 100644 |
31 | index XXXXXXX..XXXXXXX 100644 | 30 | index XXXXXXX..XXXXXXX |
32 | --- a/target/arm/helper.c | 31 | --- /dev/null |
33 | +++ b/target/arm/helper.c | 32 | +++ b/hw/arm/mps2-tz.c |
34 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrts_f32)(float32 a, float32 b, CPUARMState *env) | 33 | @@ -XXX,XX +XXX,XX @@ |
35 | * int->float conversions at run-time. */ | 34 | +/* |
36 | #define float64_256 make_float64(0x4070000000000000LL) | 35 | + * ARM V2M MPS2 board emulation, trustzone aware FPGA images |
37 | #define float64_512 make_float64(0x4080000000000000LL) | ||
38 | +#define float16_maxnorm make_float16(0x7bff) | ||
39 | #define float32_maxnorm make_float32(0x7f7fffff) | ||
40 | #define float64_maxnorm make_float64(0x7fefffffffffffffLL) | ||
41 | |||
42 | /* Reciprocal functions | ||
43 | * | ||
44 | * The algorithm that must be used to calculate the estimate | ||
45 | - * is specified by the ARM ARM, see FPRecipEstimate() | ||
46 | + * is specified by the ARM ARM, see FPRecipEstimate()/RecipEstimate | ||
47 | */ | ||
48 | |||
49 | -static float64 recip_estimate(float64 a, float_status *real_fp_status) | ||
50 | +/* See RecipEstimate() | ||
51 | + * | 36 | + * |
52 | + * input is a 9 bit fixed point number | 37 | + * Copyright (c) 2017 Linaro Limited |
53 | + * input range 256 .. 511 for a number from 0.5 <= x < 1.0. | 38 | + * Written by Peter Maydell |
54 | + * result range 256 .. 511 for a number from 1.0 to 511/256. | 39 | + * |
40 | + * This program is free software; you can redistribute it and/or modify | ||
41 | + * it under the terms of the GNU General Public License version 2 or | ||
42 | + * (at your option) any later version. | ||
55 | + */ | 43 | + */ |
56 | + | 44 | + |
57 | +static int recip_estimate(int input) | 45 | +/* The MPS2 and MPS2+ dev boards are FPGA based (the 2+ has a bigger |
58 | { | 46 | + * FPGA but is otherwise the same as the 2). Since the CPU itself |
59 | - /* These calculations mustn't set any fp exception flags, | 47 | + * and most of the devices are in the FPGA, the details of the board |
60 | - * so we use a local copy of the fp_status. | 48 | + * as seen by the guest depend significantly on the FPGA image. |
61 | - */ | 49 | + * This source file covers the following FPGA images, for TrustZone cores: |
62 | - float_status dummy_status = *real_fp_status; | 50 | + * "mps2-an505" -- Cortex-M33 as documented in ARM Application Note AN505 |
63 | - float_status *s = &dummy_status; | ||
64 | - /* q = (int)(a * 512.0) */ | ||
65 | - float64 q = float64_mul(float64_512, a, s); | ||
66 | - int64_t q_int = float64_to_int64_round_to_zero(q, s); | ||
67 | - | ||
68 | - /* r = 1.0 / (((double)q + 0.5) / 512.0) */ | ||
69 | - q = int64_to_float64(q_int, s); | ||
70 | - q = float64_add(q, float64_half, s); | ||
71 | - q = float64_div(q, float64_512, s); | ||
72 | - q = float64_div(float64_one, q, s); | ||
73 | - | ||
74 | - /* s = (int)(256.0 * r + 0.5) */ | ||
75 | - q = float64_mul(q, float64_256, s); | ||
76 | - q = float64_add(q, float64_half, s); | ||
77 | - q_int = float64_to_int64_round_to_zero(q, s); | ||
78 | - | ||
79 | - /* return (double)s / 256.0 */ | ||
80 | - return float64_div(int64_to_float64(q_int, s), float64_256, s); | ||
81 | + int a, b, r; | ||
82 | + assert(256 <= input && input < 512); | ||
83 | + a = (input * 2) + 1; | ||
84 | + b = (1 << 19) / a; | ||
85 | + r = (b + 1) >> 1; | ||
86 | + assert(256 <= r && r < 512); | ||
87 | + return r; | ||
88 | } | ||
89 | |||
90 | -/* Common wrapper to call recip_estimate */ | ||
91 | -static float64 call_recip_estimate(float64 num, int off, float_status *fpst) | ||
92 | -{ | ||
93 | - uint64_t val64 = float64_val(num); | ||
94 | - uint64_t frac = extract64(val64, 0, 52); | ||
95 | - int64_t exp = extract64(val64, 52, 11); | ||
96 | - uint64_t sbit; | ||
97 | - float64 scaled, estimate; | ||
98 | +/* | ||
99 | + * Common wrapper to call recip_estimate | ||
100 | + * | 51 | + * |
101 | + * The parameters are exponent and 64 bit fraction (without implicit | 52 | + * Links to the TRM for the board itself and to the various Application |
102 | + * bit) where the binary point is nominally at bit 52. Returns a | 53 | + * Notes which document the FPGA images can be found here: |
103 | + * float64 which can then be rounded to the appropriate size by the | 54 | + * https://developer.arm.com/products/system-design/development-boards/fpga-prototyping-boards/mps2 |
104 | + * callee. | 55 | + * |
56 | + * Board TRM: | ||
57 | + * http://infocenter.arm.com/help/topic/com.arm.doc.100112_0200_06_en/versatile_express_cortex_m_prototyping_systems_v2m_mps2_and_v2m_mps2plus_technical_reference_100112_0200_06_en.pdf | ||
58 | + * Application Note AN505: | ||
59 | + * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html | ||
60 | + * | ||
61 | + * The AN505 defers to the Cortex-M33 processor ARMv8M IoT Kit FVP User Guide | ||
62 | + * (ARM ECM0601256) for the details of some of the device layout: | ||
63 | + * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html | ||
105 | + */ | 64 | + */ |
106 | 65 | + | |
107 | - /* Generate the scaled number for the estimate function */ | 66 | +#include "qemu/osdep.h" |
108 | - if (exp == 0) { | 67 | +#include "qapi/error.h" |
109 | +static uint64_t call_recip_estimate(int *exp, int exp_off, uint64_t frac) | 68 | +#include "qemu/error-report.h" |
110 | +{ | 69 | +#include "hw/arm/arm.h" |
111 | + uint32_t scaled, estimate; | 70 | +#include "hw/arm/armv7m.h" |
112 | + uint64_t result_frac; | 71 | +#include "hw/or-irq.h" |
113 | + int result_exp; | 72 | +#include "hw/boards.h" |
114 | + | 73 | +#include "exec/address-spaces.h" |
115 | + /* Handle sub-normals */ | 74 | +#include "sysemu/sysemu.h" |
116 | + if (*exp == 0) { | 75 | +#include "hw/misc/unimp.h" |
117 | if (extract64(frac, 51, 1) == 0) { | 76 | +#include "hw/char/cmsdk-apb-uart.h" |
118 | - exp = -1; | 77 | +#include "hw/timer/cmsdk-apb-timer.h" |
119 | - frac = extract64(frac, 0, 50) << 2; | 78 | +#include "hw/misc/mps2-scc.h" |
120 | + *exp = -1; | 79 | +#include "hw/misc/mps2-fpgaio.h" |
121 | + frac <<= 2; | 80 | +#include "hw/arm/iotkit.h" |
122 | } else { | 81 | +#include "hw/devices.h" |
123 | - frac = extract64(frac, 0, 51) << 1; | 82 | +#include "net/net.h" |
124 | + frac <<= 1; | 83 | +#include "hw/core/split-irq.h" |
125 | } | 84 | + |
126 | } | 85 | +typedef enum MPS2TZFPGAType { |
127 | 86 | + FPGA_AN505, | |
128 | - /* scaled = '0' : '01111111110' : fraction<51:44> : Zeros(44); */ | 87 | +} MPS2TZFPGAType; |
129 | - scaled = make_float64((0x3feULL << 52) | 88 | + |
130 | - | extract64(frac, 44, 8) << 44); | 89 | +typedef struct { |
131 | + /* scaled = UInt('1':fraction<51:44>) */ | 90 | + MachineClass parent; |
132 | + scaled = deposit32(1 << 8, 0, 8, extract64(frac, 44, 8)); | 91 | + MPS2TZFPGAType fpga_type; |
133 | + estimate = recip_estimate(scaled); | 92 | + uint32_t scc_id; |
134 | 93 | +} MPS2TZMachineClass; | |
135 | - estimate = recip_estimate(scaled, fpst); | 94 | + |
136 | - | 95 | +typedef struct { |
137 | - /* Build new result */ | 96 | + MachineState parent; |
138 | - val64 = float64_val(estimate); | 97 | + |
139 | - sbit = 0x8000000000000000ULL & val64; | 98 | + IoTKit iotkit; |
140 | - exp = off - exp; | 99 | + MemoryRegion psram; |
141 | - frac = extract64(val64, 0, 52); | 100 | + MemoryRegion ssram1; |
142 | - | 101 | + MemoryRegion ssram1_m; |
143 | - if (exp == 0) { | 102 | + MemoryRegion ssram23; |
144 | - frac = 1ULL << 51 | extract64(frac, 1, 51); | 103 | + MPS2SCC scc; |
145 | - } else if (exp == -1) { | 104 | + MPS2FPGAIO fpgaio; |
146 | - frac = 1ULL << 50 | extract64(frac, 2, 50); | 105 | + TZPPC ppc[5]; |
147 | - exp = 0; | 106 | + UnimplementedDeviceState ssram_mpc[3]; |
148 | + result_exp = exp_off - *exp; | 107 | + UnimplementedDeviceState spi[5]; |
149 | + result_frac = deposit64(0, 44, 8, estimate); | 108 | + UnimplementedDeviceState i2c[4]; |
150 | + if (result_exp == 0) { | 109 | + UnimplementedDeviceState i2s_audio; |
151 | + result_frac = deposit64(result_frac >> 1, 51, 1, 1); | 110 | + UnimplementedDeviceState gpio[5]; |
152 | + } else if (result_exp == -1) { | 111 | + UnimplementedDeviceState dma[4]; |
153 | + result_frac = deposit64(result_frac >> 2, 50, 2, 1); | 112 | + UnimplementedDeviceState gfx; |
154 | + result_exp = 0; | 113 | + CMSDKAPBUART uart[5]; |
155 | } | 114 | + SplitIRQ sec_resp_splitter; |
156 | 115 | + qemu_or_irq uart_irq_orgate; | |
157 | - return make_float64(sbit | (exp << 52) | frac); | 116 | +} MPS2TZMachineState; |
158 | + *exp = result_exp; | 117 | + |
159 | + | 118 | +#define TYPE_MPS2TZ_MACHINE "mps2tz" |
160 | + return result_frac; | 119 | +#define TYPE_MPS2TZ_AN505_MACHINE MACHINE_TYPE_NAME("mps2-an505") |
161 | } | 120 | + |
162 | 121 | +#define MPS2TZ_MACHINE(obj) \ | |
163 | static bool round_to_inf(float_status *fpst, bool sign_bit) | 122 | + OBJECT_CHECK(MPS2TZMachineState, obj, TYPE_MPS2TZ_MACHINE) |
164 | @@ -XXX,XX +XXX,XX @@ static bool round_to_inf(float_status *fpst, bool sign_bit) | 123 | +#define MPS2TZ_MACHINE_GET_CLASS(obj) \ |
165 | g_assert_not_reached(); | 124 | + OBJECT_GET_CLASS(MPS2TZMachineClass, obj, TYPE_MPS2TZ_MACHINE) |
166 | } | 125 | +#define MPS2TZ_MACHINE_CLASS(klass) \ |
167 | 126 | + OBJECT_CLASS_CHECK(MPS2TZMachineClass, klass, TYPE_MPS2TZ_MACHINE) | |
168 | +float16 HELPER(recpe_f16)(float16 input, void *fpstp) | 127 | + |
169 | +{ | 128 | +/* Main SYSCLK frequency in Hz */ |
170 | + float_status *fpst = fpstp; | 129 | +#define SYSCLK_FRQ 20000000 |
171 | + float16 f16 = float16_squash_input_denormal(input, fpst); | 130 | + |
172 | + uint32_t f16_val = float16_val(f16); | 131 | +/* Initialize the auxiliary RAM region @mr and map it into |
173 | + uint32_t f16_sign = float16_is_neg(f16); | 132 | + * the memory map at @base. |
174 | + int f16_exp = extract32(f16_val, 10, 5); | 133 | + */ |
175 | + uint32_t f16_frac = extract32(f16_val, 0, 10); | 134 | +static void make_ram(MemoryRegion *mr, const char *name, |
176 | + uint64_t f64_frac; | 135 | + hwaddr base, hwaddr size) |
177 | + | 136 | +{ |
178 | + if (float16_is_any_nan(f16)) { | 137 | + memory_region_init_ram(mr, NULL, name, size, &error_fatal); |
179 | + float16 nan = f16; | 138 | + memory_region_add_subregion(get_system_memory(), base, mr); |
180 | + if (float16_is_signaling_nan(f16, fpst)) { | 139 | +} |
181 | + float_raise(float_flag_invalid, fpst); | 140 | + |
182 | + nan = float16_maybe_silence_nan(f16, fpst); | 141 | +/* Create an alias of an entire original MemoryRegion @orig |
142 | + * located at @base in the memory map. | ||
143 | + */ | ||
144 | +static void make_ram_alias(MemoryRegion *mr, const char *name, | ||
145 | + MemoryRegion *orig, hwaddr base) | ||
146 | +{ | ||
147 | + memory_region_init_alias(mr, NULL, name, orig, 0, | ||
148 | + memory_region_size(orig)); | ||
149 | + memory_region_add_subregion(get_system_memory(), base, mr); | ||
150 | +} | ||
151 | + | ||
152 | +static void init_sysbus_child(Object *parent, const char *childname, | ||
153 | + void *child, size_t childsize, | ||
154 | + const char *childtype) | ||
155 | +{ | ||
156 | + object_initialize(child, childsize, childtype); | ||
157 | + object_property_add_child(parent, childname, OBJECT(child), &error_abort); | ||
158 | + qdev_set_parent_bus(DEVICE(child), sysbus_get_default()); | ||
159 | + | ||
160 | +} | ||
161 | + | ||
162 | +/* Most of the devices in the AN505 FPGA image sit behind | ||
163 | + * Peripheral Protection Controllers. These data structures | ||
164 | + * define the layout of which devices sit behind which PPCs. | ||
165 | + * The devfn for each port is a function which creates, configures | ||
166 | + * and initializes the device, returning the MemoryRegion which | ||
167 | + * needs to be plugged into the downstream end of the PPC port. | ||
168 | + */ | ||
169 | +typedef MemoryRegion *MakeDevFn(MPS2TZMachineState *mms, void *opaque, | ||
170 | + const char *name, hwaddr size); | ||
171 | + | ||
172 | +typedef struct PPCPortInfo { | ||
173 | + const char *name; | ||
174 | + MakeDevFn *devfn; | ||
175 | + void *opaque; | ||
176 | + hwaddr addr; | ||
177 | + hwaddr size; | ||
178 | +} PPCPortInfo; | ||
179 | + | ||
180 | +typedef struct PPCInfo { | ||
181 | + const char *name; | ||
182 | + PPCPortInfo ports[TZ_NUM_PORTS]; | ||
183 | +} PPCInfo; | ||
184 | + | ||
185 | +static MemoryRegion *make_unimp_dev(MPS2TZMachineState *mms, | ||
186 | + void *opaque, | ||
187 | + const char *name, hwaddr size) | ||
188 | +{ | ||
189 | + /* Initialize, configure and realize a TYPE_UNIMPLEMENTED_DEVICE, | ||
190 | + * and return a pointer to its MemoryRegion. | ||
191 | + */ | ||
192 | + UnimplementedDeviceState *uds = opaque; | ||
193 | + | ||
194 | + init_sysbus_child(OBJECT(mms), name, uds, | ||
195 | + sizeof(UnimplementedDeviceState), | ||
196 | + TYPE_UNIMPLEMENTED_DEVICE); | ||
197 | + qdev_prop_set_string(DEVICE(uds), "name", name); | ||
198 | + qdev_prop_set_uint64(DEVICE(uds), "size", size); | ||
199 | + object_property_set_bool(OBJECT(uds), true, "realized", &error_fatal); | ||
200 | + return sysbus_mmio_get_region(SYS_BUS_DEVICE(uds), 0); | ||
201 | +} | ||
202 | + | ||
203 | +static MemoryRegion *make_uart(MPS2TZMachineState *mms, void *opaque, | ||
204 | + const char *name, hwaddr size) | ||
205 | +{ | ||
206 | + CMSDKAPBUART *uart = opaque; | ||
207 | + int i = uart - &mms->uart[0]; | ||
208 | + Chardev *uartchr = i < MAX_SERIAL_PORTS ? serial_hds[i] : NULL; | ||
209 | + int rxirqno = i * 2; | ||
210 | + int txirqno = i * 2 + 1; | ||
211 | + int combirqno = i + 10; | ||
212 | + SysBusDevice *s; | ||
213 | + DeviceState *iotkitdev = DEVICE(&mms->iotkit); | ||
214 | + DeviceState *orgate_dev = DEVICE(&mms->uart_irq_orgate); | ||
215 | + | ||
216 | + init_sysbus_child(OBJECT(mms), name, uart, | ||
217 | + sizeof(mms->uart[0]), TYPE_CMSDK_APB_UART); | ||
218 | + qdev_prop_set_chr(DEVICE(uart), "chardev", uartchr); | ||
219 | + qdev_prop_set_uint32(DEVICE(uart), "pclk-frq", SYSCLK_FRQ); | ||
220 | + object_property_set_bool(OBJECT(uart), true, "realized", &error_fatal); | ||
221 | + s = SYS_BUS_DEVICE(uart); | ||
222 | + sysbus_connect_irq(s, 0, qdev_get_gpio_in_named(iotkitdev, | ||
223 | + "EXP_IRQ", txirqno)); | ||
224 | + sysbus_connect_irq(s, 1, qdev_get_gpio_in_named(iotkitdev, | ||
225 | + "EXP_IRQ", rxirqno)); | ||
226 | + sysbus_connect_irq(s, 2, qdev_get_gpio_in(orgate_dev, i * 2)); | ||
227 | + sysbus_connect_irq(s, 3, qdev_get_gpio_in(orgate_dev, i * 2 + 1)); | ||
228 | + sysbus_connect_irq(s, 4, qdev_get_gpio_in_named(iotkitdev, | ||
229 | + "EXP_IRQ", combirqno)); | ||
230 | + return sysbus_mmio_get_region(SYS_BUS_DEVICE(uart), 0); | ||
231 | +} | ||
232 | + | ||
233 | +static MemoryRegion *make_scc(MPS2TZMachineState *mms, void *opaque, | ||
234 | + const char *name, hwaddr size) | ||
235 | +{ | ||
236 | + MPS2SCC *scc = opaque; | ||
237 | + DeviceState *sccdev; | ||
238 | + MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_GET_CLASS(mms); | ||
239 | + | ||
240 | + object_initialize(scc, sizeof(mms->scc), TYPE_MPS2_SCC); | ||
241 | + sccdev = DEVICE(scc); | ||
242 | + qdev_set_parent_bus(sccdev, sysbus_get_default()); | ||
243 | + qdev_prop_set_uint32(sccdev, "scc-cfg4", 0x2); | ||
244 | + qdev_prop_set_uint32(sccdev, "scc-aid", 0x02000008); | ||
245 | + qdev_prop_set_uint32(sccdev, "scc-id", mmc->scc_id); | ||
246 | + object_property_set_bool(OBJECT(scc), true, "realized", &error_fatal); | ||
247 | + return sysbus_mmio_get_region(SYS_BUS_DEVICE(sccdev), 0); | ||
248 | +} | ||
249 | + | ||
250 | +static MemoryRegion *make_fpgaio(MPS2TZMachineState *mms, void *opaque, | ||
251 | + const char *name, hwaddr size) | ||
252 | +{ | ||
253 | + MPS2FPGAIO *fpgaio = opaque; | ||
254 | + | ||
255 | + object_initialize(fpgaio, sizeof(mms->fpgaio), TYPE_MPS2_FPGAIO); | ||
256 | + qdev_set_parent_bus(DEVICE(fpgaio), sysbus_get_default()); | ||
257 | + object_property_set_bool(OBJECT(fpgaio), true, "realized", &error_fatal); | ||
258 | + return sysbus_mmio_get_region(SYS_BUS_DEVICE(fpgaio), 0); | ||
259 | +} | ||
260 | + | ||
261 | +static void mps2tz_common_init(MachineState *machine) | ||
262 | +{ | ||
263 | + MPS2TZMachineState *mms = MPS2TZ_MACHINE(machine); | ||
264 | + MachineClass *mc = MACHINE_GET_CLASS(machine); | ||
265 | + MemoryRegion *system_memory = get_system_memory(); | ||
266 | + DeviceState *iotkitdev; | ||
267 | + DeviceState *dev_splitter; | ||
268 | + int i; | ||
269 | + | ||
270 | + if (strcmp(machine->cpu_type, mc->default_cpu_type) != 0) { | ||
271 | + error_report("This board can only be used with CPU %s", | ||
272 | + mc->default_cpu_type); | ||
273 | + exit(1); | ||
274 | + } | ||
275 | + | ||
276 | + init_sysbus_child(OBJECT(machine), "iotkit", &mms->iotkit, | ||
277 | + sizeof(mms->iotkit), TYPE_IOTKIT); | ||
278 | + iotkitdev = DEVICE(&mms->iotkit); | ||
279 | + object_property_set_link(OBJECT(&mms->iotkit), OBJECT(system_memory), | ||
280 | + "memory", &error_abort); | ||
281 | + qdev_prop_set_uint32(iotkitdev, "EXP_NUMIRQ", 92); | ||
282 | + qdev_prop_set_uint32(iotkitdev, "MAINCLK", SYSCLK_FRQ); | ||
283 | + object_property_set_bool(OBJECT(&mms->iotkit), true, "realized", | ||
284 | + &error_fatal); | ||
285 | + | ||
286 | + /* The sec_resp_cfg output from the IoTKit must be split into multiple | ||
287 | + * lines, one for each of the PPCs we create here. | ||
288 | + */ | ||
289 | + object_initialize(&mms->sec_resp_splitter, sizeof(mms->sec_resp_splitter), | ||
290 | + TYPE_SPLIT_IRQ); | ||
291 | + object_property_add_child(OBJECT(machine), "sec-resp-splitter", | ||
292 | + OBJECT(&mms->sec_resp_splitter), &error_abort); | ||
293 | + object_property_set_int(OBJECT(&mms->sec_resp_splitter), 5, | ||
294 | + "num-lines", &error_fatal); | ||
295 | + object_property_set_bool(OBJECT(&mms->sec_resp_splitter), true, | ||
296 | + "realized", &error_fatal); | ||
297 | + dev_splitter = DEVICE(&mms->sec_resp_splitter); | ||
298 | + qdev_connect_gpio_out_named(iotkitdev, "sec_resp_cfg", 0, | ||
299 | + qdev_get_gpio_in(dev_splitter, 0)); | ||
300 | + | ||
301 | + /* The IoTKit sets up much of the memory layout, including | ||
302 | + * the aliases between secure and non-secure regions in the | ||
303 | + * address space. The FPGA itself contains: | ||
304 | + * | ||
305 | + * 0x00000000..0x003fffff SSRAM1 | ||
306 | + * 0x00400000..0x007fffff alias of SSRAM1 | ||
307 | + * 0x28000000..0x283fffff 4MB SSRAM2 + SSRAM3 | ||
308 | + * 0x40100000..0x4fffffff AHB Master Expansion 1 interface devices | ||
309 | + * 0x80000000..0x80ffffff 16MB PSRAM | ||
310 | + */ | ||
311 | + | ||
312 | + /* The FPGA images have an odd combination of different RAMs, | ||
313 | + * because in hardware they are different implementations and | ||
314 | + * connected to different buses, giving varying performance/size | ||
315 | + * tradeoffs. For QEMU they're all just RAM, though. We arbitrarily | ||
316 | + * call the 16MB our "system memory", as it's the largest lump. | ||
317 | + */ | ||
318 | + memory_region_allocate_system_memory(&mms->psram, | ||
319 | + NULL, "mps.ram", 0x01000000); | ||
320 | + memory_region_add_subregion(system_memory, 0x80000000, &mms->psram); | ||
321 | + | ||
322 | + /* The SSRAM memories should all be behind Memory Protection Controllers, | ||
323 | + * but we don't implement that yet. | ||
324 | + */ | ||
325 | + make_ram(&mms->ssram1, "mps.ssram1", 0x00000000, 0x00400000); | ||
326 | + make_ram_alias(&mms->ssram1_m, "mps.ssram1_m", &mms->ssram1, 0x00400000); | ||
327 | + | ||
328 | + make_ram(&mms->ssram23, "mps.ssram23", 0x28000000, 0x00400000); | ||
329 | + | ||
330 | + /* The overflow IRQs for all UARTs are ORed together. | ||
331 | + * Tx, Rx and "combined" IRQs are sent to the NVIC separately. | ||
332 | + * Create the OR gate for this. | ||
333 | + */ | ||
334 | + object_initialize(&mms->uart_irq_orgate, sizeof(mms->uart_irq_orgate), | ||
335 | + TYPE_OR_IRQ); | ||
336 | + object_property_add_child(OBJECT(mms), "uart-irq-orgate", | ||
337 | + OBJECT(&mms->uart_irq_orgate), &error_abort); | ||
338 | + object_property_set_int(OBJECT(&mms->uart_irq_orgate), 10, "num-lines", | ||
339 | + &error_fatal); | ||
340 | + object_property_set_bool(OBJECT(&mms->uart_irq_orgate), true, | ||
341 | + "realized", &error_fatal); | ||
342 | + qdev_connect_gpio_out(DEVICE(&mms->uart_irq_orgate), 0, | ||
343 | + qdev_get_gpio_in_named(iotkitdev, "EXP_IRQ", 15)); | ||
344 | + | ||
345 | + /* Most of the devices in the FPGA are behind Peripheral Protection | ||
346 | + * Controllers. The required order for initializing things is: | ||
347 | + * + initialize the PPC | ||
348 | + * + initialize, configure and realize downstream devices | ||
349 | + * + connect downstream device MemoryRegions to the PPC | ||
350 | + * + realize the PPC | ||
351 | + * + map the PPC's MemoryRegions to the places in the address map | ||
352 | + * where the downstream devices should appear | ||
353 | + * + wire up the PPC's control lines to the IoTKit object | ||
354 | + */ | ||
355 | + | ||
356 | + const PPCInfo ppcs[] = { { | ||
357 | + .name = "apb_ppcexp0", | ||
358 | + .ports = { | ||
359 | + { "ssram-mpc0", make_unimp_dev, &mms->ssram_mpc[0], | ||
360 | + 0x58007000, 0x1000 }, | ||
361 | + { "ssram-mpc1", make_unimp_dev, &mms->ssram_mpc[1], | ||
362 | + 0x58008000, 0x1000 }, | ||
363 | + { "ssram-mpc2", make_unimp_dev, &mms->ssram_mpc[2], | ||
364 | + 0x58009000, 0x1000 }, | ||
365 | + }, | ||
366 | + }, { | ||
367 | + .name = "apb_ppcexp1", | ||
368 | + .ports = { | ||
369 | + { "spi0", make_unimp_dev, &mms->spi[0], 0x40205000, 0x1000 }, | ||
370 | + { "spi1", make_unimp_dev, &mms->spi[1], 0x40206000, 0x1000 }, | ||
371 | + { "spi2", make_unimp_dev, &mms->spi[2], 0x40209000, 0x1000 }, | ||
372 | + { "spi3", make_unimp_dev, &mms->spi[3], 0x4020a000, 0x1000 }, | ||
373 | + { "spi4", make_unimp_dev, &mms->spi[4], 0x4020b000, 0x1000 }, | ||
374 | + { "uart0", make_uart, &mms->uart[0], 0x40200000, 0x1000 }, | ||
375 | + { "uart1", make_uart, &mms->uart[1], 0x40201000, 0x1000 }, | ||
376 | + { "uart2", make_uart, &mms->uart[2], 0x40202000, 0x1000 }, | ||
377 | + { "uart3", make_uart, &mms->uart[3], 0x40203000, 0x1000 }, | ||
378 | + { "uart4", make_uart, &mms->uart[4], 0x40204000, 0x1000 }, | ||
379 | + { "i2c0", make_unimp_dev, &mms->i2c[0], 0x40207000, 0x1000 }, | ||
380 | + { "i2c1", make_unimp_dev, &mms->i2c[1], 0x40208000, 0x1000 }, | ||
381 | + { "i2c2", make_unimp_dev, &mms->i2c[2], 0x4020c000, 0x1000 }, | ||
382 | + { "i2c3", make_unimp_dev, &mms->i2c[3], 0x4020d000, 0x1000 }, | ||
383 | + }, | ||
384 | + }, { | ||
385 | + .name = "apb_ppcexp2", | ||
386 | + .ports = { | ||
387 | + { "scc", make_scc, &mms->scc, 0x40300000, 0x1000 }, | ||
388 | + { "i2s-audio", make_unimp_dev, &mms->i2s_audio, | ||
389 | + 0x40301000, 0x1000 }, | ||
390 | + { "fpgaio", make_fpgaio, &mms->fpgaio, 0x40302000, 0x1000 }, | ||
391 | + }, | ||
392 | + }, { | ||
393 | + .name = "ahb_ppcexp0", | ||
394 | + .ports = { | ||
395 | + { "gfx", make_unimp_dev, &mms->gfx, 0x41000000, 0x140000 }, | ||
396 | + { "gpio0", make_unimp_dev, &mms->gpio[0], 0x40100000, 0x1000 }, | ||
397 | + { "gpio1", make_unimp_dev, &mms->gpio[1], 0x40101000, 0x1000 }, | ||
398 | + { "gpio2", make_unimp_dev, &mms->gpio[2], 0x40102000, 0x1000 }, | ||
399 | + { "gpio3", make_unimp_dev, &mms->gpio[3], 0x40103000, 0x1000 }, | ||
400 | + { "gpio4", make_unimp_dev, &mms->gpio[4], 0x40104000, 0x1000 }, | ||
401 | + }, | ||
402 | + }, { | ||
403 | + .name = "ahb_ppcexp1", | ||
404 | + .ports = { | ||
405 | + { "dma0", make_unimp_dev, &mms->dma[0], 0x40110000, 0x1000 }, | ||
406 | + { "dma1", make_unimp_dev, &mms->dma[1], 0x40111000, 0x1000 }, | ||
407 | + { "dma2", make_unimp_dev, &mms->dma[2], 0x40112000, 0x1000 }, | ||
408 | + { "dma3", make_unimp_dev, &mms->dma[3], 0x40113000, 0x1000 }, | ||
409 | + }, | ||
410 | + }, | ||
411 | + }; | ||
412 | + | ||
413 | + for (i = 0; i < ARRAY_SIZE(ppcs); i++) { | ||
414 | + const PPCInfo *ppcinfo = &ppcs[i]; | ||
415 | + TZPPC *ppc = &mms->ppc[i]; | ||
416 | + DeviceState *ppcdev; | ||
417 | + int port; | ||
418 | + char *gpioname; | ||
419 | + | ||
420 | + init_sysbus_child(OBJECT(machine), ppcinfo->name, ppc, | ||
421 | + sizeof(TZPPC), TYPE_TZ_PPC); | ||
422 | + ppcdev = DEVICE(ppc); | ||
423 | + | ||
424 | + for (port = 0; port < TZ_NUM_PORTS; port++) { | ||
425 | + const PPCPortInfo *pinfo = &ppcinfo->ports[port]; | ||
426 | + MemoryRegion *mr; | ||
427 | + char *portname; | ||
428 | + | ||
429 | + if (!pinfo->devfn) { | ||
430 | + continue; | ||
431 | + } | ||
432 | + | ||
433 | + mr = pinfo->devfn(mms, pinfo->opaque, pinfo->name, pinfo->size); | ||
434 | + portname = g_strdup_printf("port[%d]", port); | ||
435 | + object_property_set_link(OBJECT(ppc), OBJECT(mr), | ||
436 | + portname, &error_fatal); | ||
437 | + g_free(portname); | ||
183 | + } | 438 | + } |
184 | + if (fpst->default_nan_mode) { | 439 | + |
185 | + nan = float16_default_nan(fpst); | 440 | + object_property_set_bool(OBJECT(ppc), true, "realized", &error_fatal); |
441 | + | ||
442 | + for (port = 0; port < TZ_NUM_PORTS; port++) { | ||
443 | + const PPCPortInfo *pinfo = &ppcinfo->ports[port]; | ||
444 | + | ||
445 | + if (!pinfo->devfn) { | ||
446 | + continue; | ||
447 | + } | ||
448 | + sysbus_mmio_map(SYS_BUS_DEVICE(ppc), port, pinfo->addr); | ||
449 | + | ||
450 | + gpioname = g_strdup_printf("%s_nonsec", ppcinfo->name); | ||
451 | + qdev_connect_gpio_out_named(iotkitdev, gpioname, port, | ||
452 | + qdev_get_gpio_in_named(ppcdev, | ||
453 | + "cfg_nonsec", | ||
454 | + port)); | ||
455 | + g_free(gpioname); | ||
456 | + gpioname = g_strdup_printf("%s_ap", ppcinfo->name); | ||
457 | + qdev_connect_gpio_out_named(iotkitdev, gpioname, port, | ||
458 | + qdev_get_gpio_in_named(ppcdev, | ||
459 | + "cfg_ap", port)); | ||
460 | + g_free(gpioname); | ||
186 | + } | 461 | + } |
187 | + return nan; | 462 | + |
188 | + } else if (float16_is_infinity(f16)) { | 463 | + gpioname = g_strdup_printf("%s_irq_enable", ppcinfo->name); |
189 | + return float16_set_sign(float16_zero, float16_is_neg(f16)); | 464 | + qdev_connect_gpio_out_named(iotkitdev, gpioname, 0, |
190 | + } else if (float16_is_zero(f16)) { | 465 | + qdev_get_gpio_in_named(ppcdev, |
191 | + float_raise(float_flag_divbyzero, fpst); | 466 | + "irq_enable", 0)); |
192 | + return float16_set_sign(float16_infinity, float16_is_neg(f16)); | 467 | + g_free(gpioname); |
193 | + } else if (float16_abs(f16) < (1 << 8)) { | 468 | + gpioname = g_strdup_printf("%s_irq_clear", ppcinfo->name); |
194 | + /* Abs(value) < 2.0^-16 */ | 469 | + qdev_connect_gpio_out_named(iotkitdev, gpioname, 0, |
195 | + float_raise(float_flag_overflow | float_flag_inexact, fpst); | 470 | + qdev_get_gpio_in_named(ppcdev, |
196 | + if (round_to_inf(fpst, f16_sign)) { | 471 | + "irq_clear", 0)); |
197 | + return float16_set_sign(float16_infinity, f16_sign); | 472 | + g_free(gpioname); |
198 | + } else { | 473 | + gpioname = g_strdup_printf("%s_irq_status", ppcinfo->name); |
199 | + return float16_set_sign(float16_maxnorm, f16_sign); | 474 | + qdev_connect_gpio_out_named(ppcdev, "irq", 0, |
200 | + } | 475 | + qdev_get_gpio_in_named(iotkitdev, |
201 | + } else if (f16_exp >= 29 && fpst->flush_to_zero) { | 476 | + gpioname, 0)); |
202 | + float_raise(float_flag_underflow, fpst); | 477 | + g_free(gpioname); |
203 | + return float16_set_sign(float16_zero, float16_is_neg(f16)); | 478 | + |
479 | + qdev_connect_gpio_out(dev_splitter, i, | ||
480 | + qdev_get_gpio_in_named(ppcdev, | ||
481 | + "cfg_sec_resp", 0)); | ||
204 | + } | 482 | + } |
205 | + | 483 | + |
206 | + f64_frac = call_recip_estimate(&f16_exp, 29, | 484 | + /* In hardware this is a LAN9220; the LAN9118 is software compatible |
207 | + ((uint64_t) f16_frac) << (52 - 10)); | 485 | + * except that it doesn't support the checksum-offload feature. |
208 | + | 486 | + * The ethernet controller is not behind a PPC. |
209 | + /* result = sign : result_exp<4:0> : fraction<51:42> */ | 487 | + */ |
210 | + f16_val = deposit32(0, 15, 1, f16_sign); | 488 | + lan9118_init(&nd_table[0], 0x42000000, |
211 | + f16_val = deposit32(f16_val, 10, 5, f16_exp); | 489 | + qdev_get_gpio_in_named(iotkitdev, "EXP_IRQ", 16)); |
212 | + f16_val = deposit32(f16_val, 0, 10, extract64(f64_frac, 52 - 10, 10)); | 490 | + |
213 | + return make_float16(f16_val); | 491 | + create_unimplemented_device("FPGA NS PC", 0x48007000, 0x1000); |
214 | +} | 492 | + |
215 | + | 493 | + armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename, 0x400000); |
216 | float32 HELPER(recpe_f32)(float32 input, void *fpstp) | 494 | +} |
217 | { | 495 | + |
218 | float_status *fpst = fpstp; | 496 | +static void mps2tz_class_init(ObjectClass *oc, void *data) |
219 | float32 f32 = float32_squash_input_denormal(input, fpst); | 497 | +{ |
220 | uint32_t f32_val = float32_val(f32); | 498 | + MachineClass *mc = MACHINE_CLASS(oc); |
221 | - uint32_t f32_sbit = 0x80000000ULL & f32_val; | 499 | + |
222 | - int32_t f32_exp = extract32(f32_val, 23, 8); | 500 | + mc->init = mps2tz_common_init; |
223 | + bool f32_sign = float32_is_neg(f32); | 501 | + mc->max_cpus = 1; |
224 | + int f32_exp = extract32(f32_val, 23, 8); | 502 | +} |
225 | uint32_t f32_frac = extract32(f32_val, 0, 23); | 503 | + |
226 | - float64 f64, r64; | 504 | +static void mps2tz_an505_class_init(ObjectClass *oc, void *data) |
227 | - uint64_t r64_val; | 505 | +{ |
228 | - int64_t r64_exp; | 506 | + MachineClass *mc = MACHINE_CLASS(oc); |
229 | - uint64_t r64_frac; | 507 | + MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_CLASS(oc); |
230 | + uint64_t f64_frac; | 508 | + |
231 | 509 | + mc->desc = "ARM MPS2 with AN505 FPGA image for Cortex-M33"; | |
232 | if (float32_is_any_nan(f32)) { | 510 | + mmc->fpga_type = FPGA_AN505; |
233 | float32 nan = f32; | 511 | + mc->default_cpu_type = ARM_CPU_TYPE_NAME("cortex-m33"); |
234 | @@ -XXX,XX +XXX,XX @@ float32 HELPER(recpe_f32)(float32 input, void *fpstp) | 512 | + mmc->scc_id = 0x41040000 | (505 << 4); |
235 | } else if (float32_is_zero(f32)) { | 513 | +} |
236 | float_raise(float_flag_divbyzero, fpst); | 514 | + |
237 | return float32_set_sign(float32_infinity, float32_is_neg(f32)); | 515 | +static const TypeInfo mps2tz_info = { |
238 | - } else if ((f32_val & ~(1ULL << 31)) < (1ULL << 21)) { | 516 | + .name = TYPE_MPS2TZ_MACHINE, |
239 | + } else if (float32_abs(f32) < (1ULL << 21)) { | 517 | + .parent = TYPE_MACHINE, |
240 | /* Abs(value) < 2.0^-128 */ | 518 | + .abstract = true, |
241 | float_raise(float_flag_overflow | float_flag_inexact, fpst); | 519 | + .instance_size = sizeof(MPS2TZMachineState), |
242 | - if (round_to_inf(fpst, f32_sbit)) { | 520 | + .class_size = sizeof(MPS2TZMachineClass), |
243 | - return float32_set_sign(float32_infinity, float32_is_neg(f32)); | 521 | + .class_init = mps2tz_class_init, |
244 | + if (round_to_inf(fpst, f32_sign)) { | 522 | +}; |
245 | + return float32_set_sign(float32_infinity, f32_sign); | 523 | + |
246 | } else { | 524 | +static const TypeInfo mps2tz_an505_info = { |
247 | - return float32_set_sign(float32_maxnorm, float32_is_neg(f32)); | 525 | + .name = TYPE_MPS2TZ_AN505_MACHINE, |
248 | + return float32_set_sign(float32_maxnorm, f32_sign); | 526 | + .parent = TYPE_MPS2TZ_MACHINE, |
249 | } | 527 | + .class_init = mps2tz_an505_class_init, |
250 | } else if (f32_exp >= 253 && fpst->flush_to_zero) { | 528 | +}; |
251 | float_raise(float_flag_underflow, fpst); | 529 | + |
252 | return float32_set_sign(float32_zero, float32_is_neg(f32)); | 530 | +static void mps2tz_machine_init(void) |
253 | } | 531 | +{ |
254 | 532 | + type_register_static(&mps2tz_info); | |
255 | + f64_frac = call_recip_estimate(&f32_exp, 253, | 533 | + type_register_static(&mps2tz_an505_info); |
256 | + ((uint64_t) f32_frac) << (52 - 23)); | 534 | +} |
257 | 535 | + | |
258 | - f64 = make_float64(((int64_t)(f32_exp) << 52) | (int64_t)(f32_frac) << 29); | 536 | +type_init(mps2tz_machine_init); |
259 | - r64 = call_recip_estimate(f64, 253, fpst); | ||
260 | - r64_val = float64_val(r64); | ||
261 | - r64_exp = extract64(r64_val, 52, 11); | ||
262 | - r64_frac = extract64(r64_val, 0, 52); | ||
263 | - | ||
264 | - /* result = sign : result_exp<7:0> : fraction<51:29>; */ | ||
265 | - return make_float32(f32_sbit | | ||
266 | - (r64_exp & 0xff) << 23 | | ||
267 | - extract64(r64_frac, 29, 24)); | ||
268 | + /* result = sign : result_exp<7:0> : fraction<51:29> */ | ||
269 | + f32_val = deposit32(0, 31, 1, f32_sign); | ||
270 | + f32_val = deposit32(f32_val, 23, 8, f32_exp); | ||
271 | + f32_val = deposit32(f32_val, 0, 23, extract64(f64_frac, 52 - 23, 23)); | ||
272 | + return make_float32(f32_val); | ||
273 | } | ||
274 | |||
275 | float64 HELPER(recpe_f64)(float64 input, void *fpstp) | ||
276 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp) | ||
277 | float_status *fpst = fpstp; | ||
278 | float64 f64 = float64_squash_input_denormal(input, fpst); | ||
279 | uint64_t f64_val = float64_val(f64); | ||
280 | - uint64_t f64_sbit = 0x8000000000000000ULL & f64_val; | ||
281 | - int64_t f64_exp = extract64(f64_val, 52, 11); | ||
282 | - float64 r64; | ||
283 | - uint64_t r64_val; | ||
284 | - int64_t r64_exp; | ||
285 | - uint64_t r64_frac; | ||
286 | + bool f64_sign = float64_is_neg(f64); | ||
287 | + int f64_exp = extract64(f64_val, 52, 11); | ||
288 | + uint64_t f64_frac = extract64(f64_val, 0, 52); | ||
289 | |||
290 | /* Deal with any special cases */ | ||
291 | if (float64_is_any_nan(f64)) { | ||
292 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp) | ||
293 | } else if ((f64_val & ~(1ULL << 63)) < (1ULL << 50)) { | ||
294 | /* Abs(value) < 2.0^-1024 */ | ||
295 | float_raise(float_flag_overflow | float_flag_inexact, fpst); | ||
296 | - if (round_to_inf(fpst, f64_sbit)) { | ||
297 | - return float64_set_sign(float64_infinity, float64_is_neg(f64)); | ||
298 | + if (round_to_inf(fpst, f64_sign)) { | ||
299 | + return float64_set_sign(float64_infinity, f64_sign); | ||
300 | } else { | ||
301 | - return float64_set_sign(float64_maxnorm, float64_is_neg(f64)); | ||
302 | + return float64_set_sign(float64_maxnorm, f64_sign); | ||
303 | } | ||
304 | } else if (f64_exp >= 2045 && fpst->flush_to_zero) { | ||
305 | float_raise(float_flag_underflow, fpst); | ||
306 | return float64_set_sign(float64_zero, float64_is_neg(f64)); | ||
307 | } | ||
308 | |||
309 | - r64 = call_recip_estimate(f64, 2045, fpst); | ||
310 | - r64_val = float64_val(r64); | ||
311 | - r64_exp = extract64(r64_val, 52, 11); | ||
312 | - r64_frac = extract64(r64_val, 0, 52); | ||
313 | + f64_frac = call_recip_estimate(&f64_exp, 2045, f64_frac); | ||
314 | |||
315 | - /* result = sign : result_exp<10:0> : fraction<51:0> */ | ||
316 | - return make_float64(f64_sbit | | ||
317 | - ((r64_exp & 0x7ff) << 52) | | ||
318 | - r64_frac); | ||
319 | + /* result = sign : result_exp<10:0> : fraction<51:0>; */ | ||
320 | + f64_val = deposit64(0, 63, 1, f64_sign); | ||
321 | + f64_val = deposit64(f64_val, 52, 11, f64_exp); | ||
322 | + f64_val = deposit64(f64_val, 0, 52, f64_frac); | ||
323 | + return make_float64(f64_val); | ||
324 | } | ||
325 | |||
326 | /* The algorithm that must be used to calculate the estimate | ||
327 | @@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp) | ||
328 | |||
329 | uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp) | ||
330 | { | ||
331 | - float_status *s = fpstp; | ||
332 | - float64 f64; | ||
333 | + /* float_status *s = fpstp; */ | ||
334 | + int input, estimate; | ||
335 | |||
336 | if ((a & 0x80000000) == 0) { | ||
337 | return 0xffffffff; | ||
338 | } | ||
339 | |||
340 | - f64 = make_float64((0x3feULL << 52) | ||
341 | - | ((int64_t)(a & 0x7fffffff) << 21)); | ||
342 | + input = extract32(a, 23, 9); | ||
343 | + estimate = recip_estimate(input); | ||
344 | |||
345 | - f64 = recip_estimate(f64, s); | ||
346 | - | ||
347 | - return 0x80000000 | ((float64_val(f64) >> 21) & 0x7fffffff); | ||
348 | + return deposit32(0, (32 - 9), 9, estimate); | ||
349 | } | ||
350 | |||
351 | uint32_t HELPER(rsqrte_u32)(uint32_t a, void *fpstp) | ||
352 | -- | 537 | -- |
353 | 2.16.2 | 538 | 2.16.2 |
354 | 539 | ||
355 | 540 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 3 | Not enabled anywhere yet. |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 4 | |
5 | Message-id: 20180227143852.11175-3-alex.bennee@linaro.org | 5 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> |
6 | [PMM: postpone actually enabling feature until end of the | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | patch series] | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Message-id: 20180228193125.20577-2-richard.henderson@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 10 | --- |
10 | target/arm/cpu.h | 1 + | 11 | target/arm/cpu.h | 1 + |
11 | 1 file changed, 1 insertion(+) | 12 | linux-user/elfload.c | 1 + |
13 | 2 files changed, 2 insertions(+) | ||
12 | 14 | ||
13 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | 15 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h |
14 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/cpu.h | 17 | --- a/target/arm/cpu.h |
16 | +++ b/target/arm/cpu.h | 18 | +++ b/target/arm/cpu.h |
17 | @@ -XXX,XX +XXX,XX @@ enum arm_features { | 19 | @@ -XXX,XX +XXX,XX @@ enum arm_features { |
18 | ARM_FEATURE_V8_SHA3, /* implements SHA3 part of v8 Crypto Extensions */ | 20 | ARM_FEATURE_V8_SHA3, /* implements SHA3 part of v8 Crypto Extensions */ |
19 | ARM_FEATURE_V8_SM3, /* implements SM3 part of v8 Crypto Extensions */ | 21 | ARM_FEATURE_V8_SM3, /* implements SM3 part of v8 Crypto Extensions */ |
20 | ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */ | 22 | ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */ |
21 | + ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */ | 23 | + ARM_FEATURE_V8_RDM, /* implements v8.1 simd round multiply */ |
24 | ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */ | ||
22 | }; | 25 | }; |
23 | 26 | ||
24 | static inline int arm_feature(CPUARMState *env, int feature) | 27 | diff --git a/linux-user/elfload.c b/linux-user/elfload.c |
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/linux-user/elfload.c | ||
30 | +++ b/linux-user/elfload.c | ||
31 | @@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void) | ||
32 | GET_FEATURE(ARM_FEATURE_V8_SHA512, ARM_HWCAP_A64_SHA512); | ||
33 | GET_FEATURE(ARM_FEATURE_V8_FP16, | ||
34 | ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP); | ||
35 | + GET_FEATURE(ARM_FEATURE_V8_RDM, ARM_HWCAP_A64_ASIMDRDM); | ||
36 | #undef GET_FEATURE | ||
37 | |||
38 | return hwcaps; | ||
25 | -- | 39 | -- |
26 | 2.16.2 | 40 | 2.16.2 |
27 | 41 | ||
28 | 42 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | The helpers use the new re-factored muladd support in SoftFloat for | 3 | Include the U bit in the switches rather than testing separately. |
4 | the float16 work. | 4 | |
5 | 5 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | |
6 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Message-id: 20180227143852.11175-15-alex.bennee@linaro.org | 7 | Message-id: 20180228193125.20577-3-richard.henderson@linaro.org |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
10 | --- | 9 | --- |
11 | target/arm/translate-a64.c | 82 +++++++++++++++++++++++++++++++++++++--------- | 10 | target/arm/translate-a64.c | 129 +++++++++++++++++++++------------------------ |
12 | 1 file changed, 66 insertions(+), 16 deletions(-) | 11 | 1 file changed, 61 insertions(+), 68 deletions(-) |
13 | 12 | ||
14 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 13 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
15 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
16 | --- a/target/arm/translate-a64.c | 15 | --- a/target/arm/translate-a64.c |
17 | +++ b/target/arm/translate-a64.c | 16 | +++ b/target/arm/translate-a64.c |
18 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | 17 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
19 | int rd = extract32(insn, 0, 5); | ||
20 | bool is_long = false; | ||
21 | bool is_fp = false; | ||
22 | + bool is_fp16 = false; | ||
23 | int index; | 18 | int index; |
24 | TCGv_ptr fpst; | 19 | TCGv_ptr fpst; |
25 | 20 | ||
26 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | 21 | - switch (opcode) { |
27 | } | 22 | - case 0x0: /* MLA */ |
28 | /* fall through */ | 23 | - case 0x4: /* MLS */ |
29 | case 0x9: /* FMUL, FMULX */ | 24 | - if (!u || is_scalar) { |
30 | - if (!extract32(size, 1, 1)) { | 25 | + switch (16 * u + opcode) { |
31 | + if (size == 1) { | 26 | + case 0x08: /* MUL */ |
27 | + case 0x10: /* MLA */ | ||
28 | + case 0x14: /* MLS */ | ||
29 | + if (is_scalar) { | ||
32 | unallocated_encoding(s); | 30 | unallocated_encoding(s); |
33 | return; | 31 | return; |
34 | } | 32 | } |
35 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | 33 | break; |
36 | } | 34 | - case 0x2: /* SMLAL, SMLAL2, UMLAL, UMLAL2 */ |
37 | 35 | - case 0x6: /* SMLSL, SMLSL2, UMLSL, UMLSL2 */ | |
38 | if (is_fp) { | 36 | - case 0xa: /* SMULL, SMULL2, UMULL, UMULL2 */ |
39 | - /* low bit of size indicates single/double */ | 37 | + case 0x02: /* SMLAL, SMLAL2 */ |
40 | - size = extract32(size, 0, 1) ? 3 : 2; | 38 | + case 0x12: /* UMLAL, UMLAL2 */ |
41 | - if (size == 2) { | 39 | + case 0x06: /* SMLSL, SMLSL2 */ |
42 | + /* convert insn encoded size to TCGMemOp size */ | 40 | + case 0x16: /* UMLSL, UMLSL2 */ |
43 | + switch (size) { | 41 | + case 0x0a: /* SMULL, SMULL2 */ |
44 | + case 2: /* single precision */ | 42 | + case 0x1a: /* UMULL, UMULL2 */ |
45 | + size = MO_32; | 43 | if (is_scalar) { |
46 | index = h << 1 | l; | 44 | unallocated_encoding(s); |
47 | - } else { | 45 | return; |
48 | + rm |= (m << 4); | 46 | } |
49 | + break; | 47 | is_long = true; |
50 | + case 3: /* double precision */ | 48 | break; |
51 | + size = MO_64; | 49 | - case 0x3: /* SQDMLAL, SQDMLAL2 */ |
52 | if (l || !is_q) { | 50 | - case 0x7: /* SQDMLSL, SQDMLSL2 */ |
53 | unallocated_encoding(s); | 51 | - case 0xb: /* SQDMULL, SQDMULL2 */ |
54 | return; | 52 | + case 0x03: /* SQDMLAL, SQDMLAL2 */ |
53 | + case 0x07: /* SQDMLSL, SQDMLSL2 */ | ||
54 | + case 0x0b: /* SQDMULL, SQDMULL2 */ | ||
55 | is_long = true; | ||
56 | - /* fall through */ | ||
57 | - case 0xc: /* SQDMULH */ | ||
58 | - case 0xd: /* SQRDMULH */ | ||
59 | - if (u) { | ||
60 | - unallocated_encoding(s); | ||
61 | - return; | ||
62 | - } | ||
63 | break; | ||
64 | - case 0x8: /* MUL */ | ||
65 | - if (u || is_scalar) { | ||
66 | - unallocated_encoding(s); | ||
67 | - return; | ||
68 | - } | ||
69 | + case 0x0c: /* SQDMULH */ | ||
70 | + case 0x0d: /* SQRDMULH */ | ||
71 | break; | ||
72 | - case 0x1: /* FMLA */ | ||
73 | - case 0x5: /* FMLS */ | ||
74 | - if (u) { | ||
75 | - unallocated_encoding(s); | ||
76 | - return; | ||
77 | - } | ||
78 | - /* fall through */ | ||
79 | - case 0x9: /* FMUL, FMULX */ | ||
80 | + case 0x01: /* FMLA */ | ||
81 | + case 0x05: /* FMLS */ | ||
82 | + case 0x09: /* FMUL */ | ||
83 | + case 0x19: /* FMULX */ | ||
84 | if (size == 1) { | ||
85 | unallocated_encoding(s); | ||
86 | return; | ||
87 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
88 | |||
89 | read_vec_element(s, tcg_op, rn, pass, MO_64); | ||
90 | |||
91 | - switch (opcode) { | ||
92 | - case 0x5: /* FMLS */ | ||
93 | + switch (16 * u + opcode) { | ||
94 | + case 0x05: /* FMLS */ | ||
95 | /* As usual for ARM, separate negation for fused multiply-add */ | ||
96 | gen_helper_vfp_negd(tcg_op, tcg_op); | ||
97 | /* fall through */ | ||
98 | - case 0x1: /* FMLA */ | ||
99 | + case 0x01: /* FMLA */ | ||
100 | read_vec_element(s, tcg_res, rd, pass, MO_64); | ||
101 | gen_helper_vfp_muladdd(tcg_res, tcg_op, tcg_idx, tcg_res, fpst); | ||
102 | break; | ||
103 | - case 0x9: /* FMUL, FMULX */ | ||
104 | - if (u) { | ||
105 | - gen_helper_vfp_mulxd(tcg_res, tcg_op, tcg_idx, fpst); | ||
106 | - } else { | ||
107 | - gen_helper_vfp_muld(tcg_res, tcg_op, tcg_idx, fpst); | ||
108 | - } | ||
109 | + case 0x09: /* FMUL */ | ||
110 | + gen_helper_vfp_muld(tcg_res, tcg_op, tcg_idx, fpst); | ||
111 | + break; | ||
112 | + case 0x19: /* FMULX */ | ||
113 | + gen_helper_vfp_mulxd(tcg_res, tcg_op, tcg_idx, fpst); | ||
114 | break; | ||
115 | default: | ||
116 | g_assert_not_reached(); | ||
117 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
118 | |||
119 | read_vec_element_i32(s, tcg_op, rn, pass, is_scalar ? size : MO_32); | ||
120 | |||
121 | - switch (opcode) { | ||
122 | - case 0x0: /* MLA */ | ||
123 | - case 0x4: /* MLS */ | ||
124 | - case 0x8: /* MUL */ | ||
125 | + switch (16 * u + opcode) { | ||
126 | + case 0x08: /* MUL */ | ||
127 | + case 0x10: /* MLA */ | ||
128 | + case 0x14: /* MLS */ | ||
129 | { | ||
130 | static NeonGenTwoOpFn * const fns[2][2] = { | ||
131 | { gen_helper_neon_add_u16, gen_helper_neon_sub_u16 }, | ||
132 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
133 | genfn(tcg_res, tcg_op, tcg_res); | ||
134 | break; | ||
55 | } | 135 | } |
56 | index = h; | 136 | - case 0x5: /* FMLS */ |
57 | + rm |= (m << 4); | 137 | - case 0x1: /* FMLA */ |
58 | + break; | 138 | + case 0x05: /* FMLS */ |
59 | + case 0: /* half precision */ | 139 | + case 0x01: /* FMLA */ |
60 | + size = MO_16; | 140 | read_vec_element_i32(s, tcg_res, rd, pass, |
61 | + index = h << 2 | l << 1 | m; | 141 | is_scalar ? size : MO_32); |
62 | + is_fp16 = true; | 142 | switch (size) { |
63 | + if (arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 143 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
64 | + break; | 144 | g_assert_not_reached(); |
65 | + } | 145 | } |
66 | + /* fallthru */ | 146 | break; |
67 | + default: /* unallocated */ | 147 | - case 0x9: /* FMUL, FMULX */ |
68 | + unallocated_encoding(s); | 148 | + case 0x09: /* FMUL */ |
69 | + return; | 149 | switch (size) { |
70 | } | 150 | case 1: |
71 | - rm |= (m << 4); | 151 | - if (u) { |
72 | } else { | 152 | - if (is_scalar) { |
73 | switch (size) { | 153 | - gen_helper_advsimd_mulxh(tcg_res, tcg_op, |
74 | case 1: | 154 | - tcg_idx, fpst); |
75 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | 155 | - } else { |
76 | } | 156 | - gen_helper_advsimd_mulx2h(tcg_res, tcg_op, |
77 | 157 | - tcg_idx, fpst); | |
78 | if (is_fp) { | 158 | - } |
79 | - fpst = get_fpstatus_ptr(false); | 159 | + if (is_scalar) { |
80 | + fpst = get_fpstatus_ptr(is_fp16); | 160 | + gen_helper_advsimd_mulh(tcg_res, tcg_op, |
81 | } else { | 161 | + tcg_idx, fpst); |
82 | fpst = NULL; | 162 | } else { |
83 | } | 163 | - if (is_scalar) { |
84 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | 164 | - gen_helper_advsimd_mulh(tcg_res, tcg_op, |
85 | break; | 165 | - tcg_idx, fpst); |
86 | } | 166 | - } else { |
87 | case 0x5: /* FMLS */ | 167 | - gen_helper_advsimd_mul2h(tcg_res, tcg_op, |
88 | - /* As usual for ARM, separate negation for fused multiply-add */ | 168 | - tcg_idx, fpst); |
89 | - gen_helper_vfp_negs(tcg_op, tcg_op); | 169 | - } |
90 | - /* fall through */ | 170 | + gen_helper_advsimd_mul2h(tcg_res, tcg_op, |
91 | case 0x1: /* FMLA */ | 171 | + tcg_idx, fpst); |
92 | - read_vec_element_i32(s, tcg_res, rd, pass, MO_32); | 172 | } |
93 | - gen_helper_vfp_muladds(tcg_res, tcg_op, tcg_idx, tcg_res, fpst); | 173 | break; |
94 | + read_vec_element_i32(s, tcg_res, rd, pass, | 174 | case 2: |
95 | + is_scalar ? size : MO_32); | 175 | - if (u) { |
176 | - gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst); | ||
177 | - } else { | ||
178 | - gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst); | ||
179 | - } | ||
180 | + gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst); | ||
181 | break; | ||
182 | default: | ||
183 | g_assert_not_reached(); | ||
184 | } | ||
185 | break; | ||
186 | - case 0xc: /* SQDMULH */ | ||
187 | + case 0x19: /* FMULX */ | ||
96 | + switch (size) { | 188 | + switch (size) { |
97 | + case 1: | 189 | + case 1: |
98 | + if (opcode == 0x5) { | 190 | + if (is_scalar) { |
99 | + /* As usual for ARM, separate negation for fused | 191 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op, |
100 | + * multiply-add */ | 192 | + tcg_idx, fpst); |
101 | + tcg_gen_xori_i32(tcg_op, tcg_op, 0x80008000); | 193 | + } else { |
194 | + gen_helper_advsimd_mulx2h(tcg_res, tcg_op, | ||
195 | + tcg_idx, fpst); | ||
102 | + } | 196 | + } |
103 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx, | ||
104 | + tcg_res, fpst); | ||
105 | + break; | 197 | + break; |
106 | + case 2: | 198 | + case 2: |
107 | + if (opcode == 0x5) { | 199 | + gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst); |
108 | + /* As usual for ARM, separate negation for | ||
109 | + * fused multiply-add */ | ||
110 | + tcg_gen_xori_i32(tcg_op, tcg_op, 0x80000000); | ||
111 | + } | ||
112 | + gen_helper_vfp_muladds(tcg_res, tcg_op, tcg_idx, | ||
113 | + tcg_res, fpst); | ||
114 | + break; | 200 | + break; |
115 | + default: | 201 | + default: |
116 | + g_assert_not_reached(); | 202 | + g_assert_not_reached(); |
117 | + } | 203 | + } |
118 | break; | 204 | + break; |
119 | case 0x9: /* FMUL, FMULX */ | 205 | + case 0x0c: /* SQDMULH */ |
120 | - if (u) { | 206 | if (size == 1) { |
121 | - gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst); | 207 | gen_helper_neon_qdmulh_s16(tcg_res, cpu_env, |
122 | - } else { | 208 | tcg_op, tcg_idx); |
123 | - gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst); | 209 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
124 | + switch (size) { | 210 | tcg_op, tcg_idx); |
125 | + case 1: | ||
126 | + if (u) { | ||
127 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op, tcg_idx, | ||
128 | + fpst); | ||
129 | + } else { | ||
130 | + g_assert_not_reached(); | ||
131 | + } | ||
132 | + break; | ||
133 | + case 2: | ||
134 | + if (u) { | ||
135 | + gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst); | ||
136 | + } else { | ||
137 | + gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst); | ||
138 | + } | ||
139 | + break; | ||
140 | + default: | ||
141 | + g_assert_not_reached(); | ||
142 | } | 211 | } |
143 | break; | 212 | break; |
144 | case 0xc: /* SQDMULH */ | 213 | - case 0xd: /* SQRDMULH */ |
214 | + case 0x0d: /* SQRDMULH */ | ||
215 | if (size == 1) { | ||
216 | gen_helper_neon_qrdmulh_s16(tcg_res, cpu_env, | ||
217 | tcg_op, tcg_idx); | ||
145 | -- | 218 | -- |
146 | 2.16.2 | 219 | 2.16.2 |
147 | 220 | ||
148 | 221 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Only one half-precision instruction has been added to this group. | 3 | The integer size check was already outside of the opcode switch; |
4 | move the floating-point size check outside as well. Unify the | ||
5 | size vs index adjustment between fp and integer paths. | ||
4 | 6 | ||
5 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 7 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
7 | Message-id: 20180227143852.11175-29-alex.bennee@linaro.org | 9 | Message-id: 20180228193125.20577-4-richard.henderson@linaro.org |
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 11 | --- |
10 | target/arm/translate-a64.c | 35 +++++++++++++++++++++++++---------- | 12 | target/arm/translate-a64.c | 65 +++++++++++++++++++++++----------------------- |
11 | 1 file changed, 25 insertions(+), 10 deletions(-) | 13 | 1 file changed, 32 insertions(+), 33 deletions(-) |
12 | 14 | ||
13 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 15 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
14 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/translate-a64.c | 17 | --- a/target/arm/translate-a64.c |
16 | +++ b/target/arm/translate-a64.c | 18 | +++ b/target/arm/translate-a64.c |
17 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_copy(DisasContext *s, uint32_t insn) | 19 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
18 | * MVNI - move inverted (shifted) imm into register | 20 | case 0x05: /* FMLS */ |
19 | * ORR - bitwise OR of (shifted) imm with register | 21 | case 0x09: /* FMUL */ |
20 | * BIC - bitwise clear of (shifted) imm with register | 22 | case 0x19: /* FMULX */ |
21 | + * With ARMv8.2 we also have: | 23 | - if (size == 1) { |
22 | + * FMOV half-precision | 24 | - unallocated_encoding(s); |
23 | */ | 25 | - return; |
24 | static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | 26 | - } |
25 | { | 27 | is_fp = true; |
26 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | 28 | break; |
27 | uint64_t imm = 0; | 29 | default: |
28 | 30 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | |
29 | if (o2 != 0 || ((cmode == 0xf) && is_neg && !is_q)) { | 31 | if (is_fp) { |
30 | - unallocated_encoding(s); | 32 | /* convert insn encoded size to TCGMemOp size */ |
31 | - return; | 33 | switch (size) { |
32 | + /* Check for FMOV (vector, immediate) - half-precision */ | 34 | - case 2: /* single precision */ |
33 | + if (!(arm_dc_feature(s, ARM_FEATURE_V8_FP16) && o2 && cmode == 0xf)) { | 35 | - size = MO_32; |
36 | - index = h << 1 | l; | ||
37 | - rm |= (m << 4); | ||
38 | - break; | ||
39 | - case 3: /* double precision */ | ||
40 | - size = MO_64; | ||
41 | - if (l || !is_q) { | ||
42 | + case 0: /* half-precision */ | ||
43 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
44 | unallocated_encoding(s); | ||
45 | return; | ||
46 | } | ||
47 | - index = h; | ||
48 | - rm |= (m << 4); | ||
49 | - break; | ||
50 | - case 0: /* half precision */ | ||
51 | size = MO_16; | ||
52 | - index = h << 2 | l << 1 | m; | ||
53 | - is_fp16 = true; | ||
54 | - if (arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
55 | - break; | ||
56 | - } | ||
57 | - /* fallthru */ | ||
58 | - default: /* unallocated */ | ||
59 | - unallocated_encoding(s); | ||
60 | - return; | ||
61 | - } | ||
62 | - } else { | ||
63 | - switch (size) { | ||
64 | - case 1: | ||
65 | - index = h << 2 | l << 1 | m; | ||
66 | break; | ||
67 | - case 2: | ||
68 | - index = h << 1 | l; | ||
69 | - rm |= (m << 4); | ||
70 | + case MO_32: /* single precision */ | ||
71 | + case MO_64: /* double precision */ | ||
72 | break; | ||
73 | default: | ||
74 | unallocated_encoding(s); | ||
75 | return; | ||
76 | } | ||
77 | + } else { | ||
78 | + switch (size) { | ||
79 | + case MO_8: | ||
80 | + case MO_64: | ||
34 | + unallocated_encoding(s); | 81 | + unallocated_encoding(s); |
35 | + return; | 82 | + return; |
36 | + } | 83 | + } |
37 | } | 84 | + } |
38 | 85 | + | |
39 | if (!fp_access_check(s)) { | 86 | + /* Given TCGMemOp size, adjust register and indexing. */ |
40 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn) | 87 | + switch (size) { |
41 | imm |= 0x4000000000000000ULL; | 88 | + case MO_16: |
42 | } | 89 | + index = h << 2 | l << 1 | m; |
43 | } else { | 90 | + break; |
44 | - imm = (abcdefgh & 0x3f) << 19; | 91 | + case MO_32: |
45 | - if (abcdefgh & 0x80) { | 92 | + index = h << 1 | l; |
46 | - imm |= 0x80000000; | 93 | + rm |= m << 4; |
47 | - } | 94 | + break; |
48 | - if (abcdefgh & 0x40) { | 95 | + case MO_64: |
49 | - imm |= 0x3e000000; | 96 | + if (l || !is_q) { |
50 | + if (o2) { | 97 | + unallocated_encoding(s); |
51 | + /* FMOV (vector, immediate) - half-precision */ | 98 | + return; |
52 | + imm = vfp_expand_imm(MO_16, abcdefgh); | 99 | + } |
53 | + /* now duplicate across the lanes */ | 100 | + index = h; |
54 | + imm = bitfield_replicate(imm, 16); | 101 | + rm |= m << 4; |
55 | } else { | 102 | + break; |
56 | - imm |= 0x40000000; | ||
57 | + imm = (abcdefgh & 0x3f) << 19; | ||
58 | + if (abcdefgh & 0x80) { | ||
59 | + imm |= 0x80000000; | ||
60 | + } | ||
61 | + if (abcdefgh & 0x40) { | ||
62 | + imm |= 0x3e000000; | ||
63 | + } else { | ||
64 | + imm |= 0x40000000; | ||
65 | + } | ||
66 | + imm |= (imm << 32); | ||
67 | } | ||
68 | - imm |= (imm << 32); | ||
69 | } | ||
70 | } | ||
71 | break; | ||
72 | + default: | 103 | + default: |
73 | + fprintf(stderr, "%s: cmode_3_1: %x\n", __func__, cmode_3_1); | ||
74 | + g_assert_not_reached(); | 104 | + g_assert_not_reached(); |
75 | } | 105 | } |
76 | 106 | ||
77 | if (cmode_3_1 != 7 && is_neg) { | 107 | if (!fp_access_check(s)) { |
78 | -- | 108 | -- |
79 | 2.16.2 | 109 | 2.16.2 |
80 | 110 | ||
81 | 111 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This covers the encoding group: | 3 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> |
4 | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | |
5 | Advanced SIMD scalar three same FP16 | 5 | Message-id: 20180228193125.20577-5-richard.henderson@linaro.org |
6 | |||
7 | As all the helpers are already there it is simply a case of calling the | ||
8 | existing helpers in the scalar context. | ||
9 | |||
10 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | ||
11 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
12 | Message-id: 20180227143852.11175-31-alex.bennee@linaro.org | ||
13 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
14 | --- | 7 | --- |
15 | target/arm/translate-a64.c | 99 ++++++++++++++++++++++++++++++++++++++++++++++ | 8 | target/arm/Makefile.objs | 2 +- |
16 | 1 file changed, 99 insertions(+) | 9 | target/arm/helper.h | 4 ++ |
17 | 10 | target/arm/translate-a64.c | 84 ++++++++++++++++++++++++++++++++++ | |
11 | target/arm/vec_helper.c | 109 +++++++++++++++++++++++++++++++++++++++++++++ | ||
12 | 4 files changed, 198 insertions(+), 1 deletion(-) | ||
13 | create mode 100644 target/arm/vec_helper.c | ||
14 | |||
15 | diff --git a/target/arm/Makefile.objs b/target/arm/Makefile.objs | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/target/arm/Makefile.objs | ||
18 | +++ b/target/arm/Makefile.objs | ||
19 | @@ -XXX,XX +XXX,XX @@ obj-$(call land,$(CONFIG_KVM),$(call lnot,$(TARGET_AARCH64))) += kvm32.o | ||
20 | obj-$(call land,$(CONFIG_KVM),$(TARGET_AARCH64)) += kvm64.o | ||
21 | obj-$(call lnot,$(CONFIG_KVM)) += kvm-stub.o | ||
22 | obj-y += translate.o op_helper.o helper.o cpu.o | ||
23 | -obj-y += neon_helper.o iwmmxt_helper.o | ||
24 | +obj-y += neon_helper.o iwmmxt_helper.o vec_helper.o | ||
25 | obj-y += gdbstub.o | ||
26 | obj-$(TARGET_AARCH64) += cpu64.o translate-a64.o helper-a64.o gdbstub64.o | ||
27 | obj-y += crypto_helper.o | ||
28 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
29 | index XXXXXXX..XXXXXXX 100644 | ||
30 | --- a/target/arm/helper.h | ||
31 | +++ b/target/arm/helper.h | ||
32 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_1(neon_rbit_u8, TCG_CALL_NO_RWG_SE, i32, i32) | ||
33 | |||
34 | DEF_HELPER_3(neon_qdmulh_s16, i32, env, i32, i32) | ||
35 | DEF_HELPER_3(neon_qrdmulh_s16, i32, env, i32, i32) | ||
36 | +DEF_HELPER_4(neon_qrdmlah_s16, i32, env, i32, i32, i32) | ||
37 | +DEF_HELPER_4(neon_qrdmlsh_s16, i32, env, i32, i32, i32) | ||
38 | DEF_HELPER_3(neon_qdmulh_s32, i32, env, i32, i32) | ||
39 | DEF_HELPER_3(neon_qrdmulh_s32, i32, env, i32, i32) | ||
40 | +DEF_HELPER_4(neon_qrdmlah_s32, i32, env, s32, s32, s32) | ||
41 | +DEF_HELPER_4(neon_qrdmlsh_s32, i32, env, s32, s32, s32) | ||
42 | |||
43 | DEF_HELPER_1(neon_narrow_u8, i32, i64) | ||
44 | DEF_HELPER_1(neon_narrow_u16, i32, i64) | ||
18 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 45 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
19 | index XXXXXXX..XXXXXXX 100644 | 46 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/translate-a64.c | 47 | --- a/target/arm/translate-a64.c |
21 | +++ b/target/arm/translate-a64.c | 48 | +++ b/target/arm/translate-a64.c |
22 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_three_reg_same(DisasContext *s, uint32_t insn) | 49 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_three_reg_same_fp16(DisasContext *s, |
23 | tcg_temp_free_i64(tcg_rd); | 50 | tcg_temp_free_ptr(fpst); |
24 | } | 51 | } |
25 | 52 | ||
26 | +/* AdvSIMD scalar three same FP16 | 53 | +/* AdvSIMD scalar three same extra |
27 | + * 31 30 29 28 24 23 22 21 20 16 15 14 13 11 10 9 5 4 0 | 54 | + * 31 30 29 28 24 23 22 21 20 16 15 14 11 10 9 5 4 0 |
28 | + * +-----+---+-----------+---+-----+------+-----+--------+---+----+----+ | 55 | + * +-----+---+-----------+------+---+------+---+--------+---+----+----+ |
29 | + * | 0 1 | U | 1 1 1 1 0 | a | 1 0 | Rm | 0 0 | opcode | 1 | Rn | Rd | | 56 | + * | 0 1 | U | 1 1 1 1 0 | size | 0 | Rm | 1 | opcode | 1 | Rn | Rd | |
30 | + * +-----+---+-----------+---+-----+------+-----+--------+---+----+----+ | 57 | + * +-----+---+-----------+------+---+------+---+--------+---+----+----+ |
31 | + * v: 0101 1110 0100 0000 0000 0100 0000 0000 => 5e400400 | ||
32 | + * m: 1101 1111 0110 0000 1100 0100 0000 0000 => df60c400 | ||
33 | + */ | 58 | + */ |
34 | +static void disas_simd_scalar_three_reg_same_fp16(DisasContext *s, | 59 | +static void disas_simd_scalar_three_reg_same_extra(DisasContext *s, |
35 | + uint32_t insn) | 60 | + uint32_t insn) |
36 | +{ | 61 | +{ |
37 | + int rd = extract32(insn, 0, 5); | 62 | + int rd = extract32(insn, 0, 5); |
38 | + int rn = extract32(insn, 5, 5); | 63 | + int rn = extract32(insn, 5, 5); |
39 | + int opcode = extract32(insn, 11, 3); | 64 | + int opcode = extract32(insn, 11, 4); |
40 | + int rm = extract32(insn, 16, 5); | 65 | + int rm = extract32(insn, 16, 5); |
66 | + int size = extract32(insn, 22, 2); | ||
41 | + bool u = extract32(insn, 29, 1); | 67 | + bool u = extract32(insn, 29, 1); |
42 | + bool a = extract32(insn, 23, 1); | 68 | + TCGv_i32 ele1, ele2, ele3; |
43 | + int fpopcode = opcode | (a << 3) | (u << 4); | 69 | + TCGv_i64 res; |
44 | + TCGv_ptr fpst; | 70 | + int feature; |
45 | + TCGv_i32 tcg_op1; | 71 | + |
46 | + TCGv_i32 tcg_op2; | 72 | + switch (u * 16 + opcode) { |
47 | + TCGv_i32 tcg_res; | 73 | + case 0x10: /* SQRDMLAH (vector) */ |
48 | + | 74 | + case 0x11: /* SQRDMLSH (vector) */ |
49 | + switch (fpopcode) { | 75 | + if (size != 1 && size != 2) { |
50 | + case 0x03: /* FMULX */ | 76 | + unallocated_encoding(s); |
51 | + case 0x04: /* FCMEQ (reg) */ | 77 | + return; |
52 | + case 0x07: /* FRECPS */ | 78 | + } |
53 | + case 0x0f: /* FRSQRTS */ | 79 | + feature = ARM_FEATURE_V8_RDM; |
54 | + case 0x14: /* FCMGE (reg) */ | ||
55 | + case 0x15: /* FACGE */ | ||
56 | + case 0x1a: /* FABD */ | ||
57 | + case 0x1c: /* FCMGT (reg) */ | ||
58 | + case 0x1d: /* FACGT */ | ||
59 | + break; | 80 | + break; |
60 | + default: | 81 | + default: |
61 | + unallocated_encoding(s); | 82 | + unallocated_encoding(s); |
62 | + return; | 83 | + return; |
63 | + } | 84 | + } |
64 | + | 85 | + if (!arm_dc_feature(s, feature)) { |
65 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
66 | + unallocated_encoding(s); | 86 | + unallocated_encoding(s); |
67 | + } | 87 | + return; |
68 | + | 88 | + } |
69 | + if (!fp_access_check(s)) { | 89 | + if (!fp_access_check(s)) { |
70 | + return; | 90 | + return; |
71 | + } | 91 | + } |
72 | + | 92 | + |
73 | + fpst = get_fpstatus_ptr(true); | 93 | + /* Do a single operation on the lowest element in the vector. |
74 | + | 94 | + * We use the standard Neon helpers and rely on 0 OP 0 == 0 |
75 | + tcg_op1 = tcg_temp_new_i32(); | 95 | + * with no side effects for all these operations. |
76 | + tcg_op2 = tcg_temp_new_i32(); | 96 | + * OPTME: special-purpose helpers would avoid doing some |
77 | + tcg_res = tcg_temp_new_i32(); | 97 | + * unnecessary work in the helper for the 16 bit cases. |
78 | + | 98 | + */ |
79 | + read_vec_element_i32(s, tcg_op1, rn, 0, MO_16); | 99 | + ele1 = tcg_temp_new_i32(); |
80 | + read_vec_element_i32(s, tcg_op2, rm, 0, MO_16); | 100 | + ele2 = tcg_temp_new_i32(); |
81 | + | 101 | + ele3 = tcg_temp_new_i32(); |
82 | + switch (fpopcode) { | 102 | + |
83 | + case 0x03: /* FMULX */ | 103 | + read_vec_element_i32(s, ele1, rn, 0, size); |
84 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst); | 104 | + read_vec_element_i32(s, ele2, rm, 0, size); |
105 | + read_vec_element_i32(s, ele3, rd, 0, size); | ||
106 | + | ||
107 | + switch (opcode) { | ||
108 | + case 0x0: /* SQRDMLAH */ | ||
109 | + if (size == 1) { | ||
110 | + gen_helper_neon_qrdmlah_s16(ele3, cpu_env, ele1, ele2, ele3); | ||
111 | + } else { | ||
112 | + gen_helper_neon_qrdmlah_s32(ele3, cpu_env, ele1, ele2, ele3); | ||
113 | + } | ||
85 | + break; | 114 | + break; |
86 | + case 0x04: /* FCMEQ (reg) */ | 115 | + case 0x1: /* SQRDMLSH */ |
87 | + gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 116 | + if (size == 1) { |
88 | + break; | 117 | + gen_helper_neon_qrdmlsh_s16(ele3, cpu_env, ele1, ele2, ele3); |
89 | + case 0x07: /* FRECPS */ | 118 | + } else { |
90 | + gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | 119 | + gen_helper_neon_qrdmlsh_s32(ele3, cpu_env, ele1, ele2, ele3); |
91 | + break; | 120 | + } |
92 | + case 0x0f: /* FRSQRTS */ | ||
93 | + gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
94 | + break; | ||
95 | + case 0x14: /* FCMGE (reg) */ | ||
96 | + gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
97 | + break; | ||
98 | + case 0x15: /* FACGE */ | ||
99 | + gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
100 | + break; | ||
101 | + case 0x1a: /* FABD */ | ||
102 | + gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
103 | + tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff); | ||
104 | + break; | ||
105 | + case 0x1c: /* FCMGT (reg) */ | ||
106 | + gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
107 | + break; | ||
108 | + case 0x1d: /* FACGT */ | ||
109 | + gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
110 | + break; | 121 | + break; |
111 | + default: | 122 | + default: |
112 | + g_assert_not_reached(); | 123 | + g_assert_not_reached(); |
113 | + } | 124 | + } |
114 | + | 125 | + tcg_temp_free_i32(ele1); |
115 | + write_fp_sreg(s, rd, tcg_res); | 126 | + tcg_temp_free_i32(ele2); |
116 | + | 127 | + |
117 | + | 128 | + res = tcg_temp_new_i64(); |
118 | + tcg_temp_free_i32(tcg_res); | 129 | + tcg_gen_extu_i32_i64(res, ele3); |
119 | + tcg_temp_free_i32(tcg_op1); | 130 | + tcg_temp_free_i32(ele3); |
120 | + tcg_temp_free_i32(tcg_op2); | 131 | + |
121 | + tcg_temp_free_ptr(fpst); | 132 | + write_fp_dreg(s, rd, res); |
133 | + tcg_temp_free_i64(res); | ||
122 | +} | 134 | +} |
123 | + | 135 | + |
124 | static void handle_2misc_64(DisasContext *s, int opcode, bool u, | 136 | static void handle_2misc_64(DisasContext *s, int opcode, bool u, |
125 | TCGv_i64 tcg_rd, TCGv_i64 tcg_rn, | 137 | TCGv_i64 tcg_rd, TCGv_i64 tcg_rn, |
126 | TCGv_i32 tcg_rmode, TCGv_ptr tcg_fpstatus) | 138 | TCGv_i32 tcg_rmode, TCGv_ptr tcg_fpstatus) |
127 | @@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = { | 139 | @@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = { |
128 | { 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 }, | 140 | { 0x0e000800, 0xbf208c00, disas_simd_zip_trn }, |
129 | { 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 }, | 141 | { 0x2e000000, 0xbf208400, disas_simd_ext }, |
130 | { 0x0e780800, 0x8f7e0c00, disas_simd_two_reg_misc_fp16 }, | 142 | { 0x5e200400, 0xdf200400, disas_simd_scalar_three_reg_same }, |
131 | + { 0x5e400400, 0xdf60c400, disas_simd_scalar_three_reg_same_fp16 }, | 143 | + { 0x5e008400, 0xdf208400, disas_simd_scalar_three_reg_same_extra }, |
132 | { 0x00000000, 0x00000000, NULL } | 144 | { 0x5e200000, 0xdf200c00, disas_simd_scalar_three_reg_diff }, |
133 | }; | 145 | { 0x5e200800, 0xdf3e0c00, disas_simd_scalar_two_reg_misc }, |
134 | 146 | { 0x5e300800, 0xdf3e0c00, disas_simd_scalar_pairwise }, | |
147 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
148 | new file mode 100644 | ||
149 | index XXXXXXX..XXXXXXX | ||
150 | --- /dev/null | ||
151 | +++ b/target/arm/vec_helper.c | ||
152 | @@ -XXX,XX +XXX,XX @@ | ||
153 | +/* | ||
154 | + * ARM AdvSIMD / SVE Vector Operations | ||
155 | + * | ||
156 | + * Copyright (c) 2018 Linaro | ||
157 | + * | ||
158 | + * This library is free software; you can redistribute it and/or | ||
159 | + * modify it under the terms of the GNU Lesser General Public | ||
160 | + * License as published by the Free Software Foundation; either | ||
161 | + * version 2 of the License, or (at your option) any later version. | ||
162 | + * | ||
163 | + * This library is distributed in the hope that it will be useful, | ||
164 | + * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
165 | + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
166 | + * Lesser General Public License for more details. | ||
167 | + * | ||
168 | + * You should have received a copy of the GNU Lesser General Public | ||
169 | + * License along with this library; if not, see <http://www.gnu.org/licenses/>. | ||
170 | + */ | ||
171 | + | ||
172 | +#include "qemu/osdep.h" | ||
173 | +#include "cpu.h" | ||
174 | +#include "exec/exec-all.h" | ||
175 | +#include "exec/helper-proto.h" | ||
176 | +#include "tcg/tcg-gvec-desc.h" | ||
177 | + | ||
178 | + | ||
179 | +#define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q | ||
180 | + | ||
181 | +/* Signed saturating rounding doubling multiply-accumulate high half, 16-bit */ | ||
182 | +static uint16_t inl_qrdmlah_s16(CPUARMState *env, int16_t src1, | ||
183 | + int16_t src2, int16_t src3) | ||
184 | +{ | ||
185 | + /* Simplify: | ||
186 | + * = ((a3 << 16) + ((e1 * e2) << 1) + (1 << 15)) >> 16 | ||
187 | + * = ((a3 << 15) + (e1 * e2) + (1 << 14)) >> 15 | ||
188 | + */ | ||
189 | + int32_t ret = (int32_t)src1 * src2; | ||
190 | + ret = ((int32_t)src3 << 15) + ret + (1 << 14); | ||
191 | + ret >>= 15; | ||
192 | + if (ret != (int16_t)ret) { | ||
193 | + SET_QC(); | ||
194 | + ret = (ret < 0 ? -0x8000 : 0x7fff); | ||
195 | + } | ||
196 | + return ret; | ||
197 | +} | ||
198 | + | ||
199 | +uint32_t HELPER(neon_qrdmlah_s16)(CPUARMState *env, uint32_t src1, | ||
200 | + uint32_t src2, uint32_t src3) | ||
201 | +{ | ||
202 | + uint16_t e1 = inl_qrdmlah_s16(env, src1, src2, src3); | ||
203 | + uint16_t e2 = inl_qrdmlah_s16(env, src1 >> 16, src2 >> 16, src3 >> 16); | ||
204 | + return deposit32(e1, 16, 16, e2); | ||
205 | +} | ||
206 | + | ||
207 | +/* Signed saturating rounding doubling multiply-subtract high half, 16-bit */ | ||
208 | +static uint16_t inl_qrdmlsh_s16(CPUARMState *env, int16_t src1, | ||
209 | + int16_t src2, int16_t src3) | ||
210 | +{ | ||
211 | + /* Similarly, using subtraction: | ||
212 | + * = ((a3 << 16) - ((e1 * e2) << 1) + (1 << 15)) >> 16 | ||
213 | + * = ((a3 << 15) - (e1 * e2) + (1 << 14)) >> 15 | ||
214 | + */ | ||
215 | + int32_t ret = (int32_t)src1 * src2; | ||
216 | + ret = ((int32_t)src3 << 15) - ret + (1 << 14); | ||
217 | + ret >>= 15; | ||
218 | + if (ret != (int16_t)ret) { | ||
219 | + SET_QC(); | ||
220 | + ret = (ret < 0 ? -0x8000 : 0x7fff); | ||
221 | + } | ||
222 | + return ret; | ||
223 | +} | ||
224 | + | ||
225 | +uint32_t HELPER(neon_qrdmlsh_s16)(CPUARMState *env, uint32_t src1, | ||
226 | + uint32_t src2, uint32_t src3) | ||
227 | +{ | ||
228 | + uint16_t e1 = inl_qrdmlsh_s16(env, src1, src2, src3); | ||
229 | + uint16_t e2 = inl_qrdmlsh_s16(env, src1 >> 16, src2 >> 16, src3 >> 16); | ||
230 | + return deposit32(e1, 16, 16, e2); | ||
231 | +} | ||
232 | + | ||
233 | +/* Signed saturating rounding doubling multiply-accumulate high half, 32-bit */ | ||
234 | +uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1, | ||
235 | + int32_t src2, int32_t src3) | ||
236 | +{ | ||
237 | + /* Simplify similarly to int_qrdmlah_s16 above. */ | ||
238 | + int64_t ret = (int64_t)src1 * src2; | ||
239 | + ret = ((int64_t)src3 << 31) + ret + (1 << 30); | ||
240 | + ret >>= 31; | ||
241 | + if (ret != (int32_t)ret) { | ||
242 | + SET_QC(); | ||
243 | + ret = (ret < 0 ? INT32_MIN : INT32_MAX); | ||
244 | + } | ||
245 | + return ret; | ||
246 | +} | ||
247 | + | ||
248 | +/* Signed saturating rounding doubling multiply-subtract high half, 32-bit */ | ||
249 | +uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1, | ||
250 | + int32_t src2, int32_t src3) | ||
251 | +{ | ||
252 | + /* Simplify similarly to int_qrdmlsh_s16 above. */ | ||
253 | + int64_t ret = (int64_t)src1 * src2; | ||
254 | + ret = ((int64_t)src3 << 31) - ret + (1 << 30); | ||
255 | + ret >>= 31; | ||
256 | + if (ret != (int32_t)ret) { | ||
257 | + SET_QC(); | ||
258 | + ret = (ret < 0 ? INT32_MIN : INT32_MAX); | ||
259 | + } | ||
260 | + return ret; | ||
261 | +} | ||
135 | -- | 262 | -- |
136 | 2.16.2 | 263 | 2.16.2 |
137 | 264 | ||
138 | 265 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This is the initial decode skeleton for the Advanced SIMD three same | 3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
4 | instruction group. | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
5 | 5 | Message-id: 20180228193125.20577-6-richard.henderson@linaro.org | |
6 | The fprintf is purely to aid debugging as the additional instructions | ||
7 | are added. It will be removed once the group is complete. | ||
8 | |||
9 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | ||
10 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
11 | Message-id: 20180227143852.11175-9-alex.bennee@linaro.org | ||
12 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
13 | --- | 7 | --- |
14 | target/arm/translate-a64.c | 73 ++++++++++++++++++++++++++++++++++++++++++++++ | 8 | target/arm/helper.h | 9 +++++ |
15 | 1 file changed, 73 insertions(+) | 9 | target/arm/translate-a64.c | 83 ++++++++++++++++++++++++++++++++++++++++++++++ |
16 | 10 | target/arm/vec_helper.c | 74 +++++++++++++++++++++++++++++++++++++++++ | |
11 | 3 files changed, 166 insertions(+) | ||
12 | |||
13 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
14 | index XXXXXXX..XXXXXXX 100644 | ||
15 | --- a/target/arm/helper.h | ||
16 | +++ b/target/arm/helper.h | ||
17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_2(dc_zva, void, env, i64) | ||
18 | DEF_HELPER_FLAGS_2(neon_pmull_64_lo, TCG_CALL_NO_RWG_SE, i64, i64, i64) | ||
19 | DEF_HELPER_FLAGS_2(neon_pmull_64_hi, TCG_CALL_NO_RWG_SE, i64, i64, i64) | ||
20 | |||
21 | +DEF_HELPER_FLAGS_5(gvec_qrdmlah_s16, TCG_CALL_NO_RWG, | ||
22 | + void, ptr, ptr, ptr, ptr, i32) | ||
23 | +DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s16, TCG_CALL_NO_RWG, | ||
24 | + void, ptr, ptr, ptr, ptr, i32) | ||
25 | +DEF_HELPER_FLAGS_5(gvec_qrdmlah_s32, TCG_CALL_NO_RWG, | ||
26 | + void, ptr, ptr, ptr, ptr, i32) | ||
27 | +DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s32, TCG_CALL_NO_RWG, | ||
28 | + void, ptr, ptr, ptr, ptr, i32) | ||
29 | + | ||
30 | #ifdef TARGET_AARCH64 | ||
31 | #include "helper-a64.h" | ||
32 | #endif | ||
17 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 33 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
18 | index XXXXXXX..XXXXXXX 100644 | 34 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/translate-a64.c | 35 | --- a/target/arm/translate-a64.c |
20 | +++ b/target/arm/translate-a64.c | 36 | +++ b/target/arm/translate-a64.c |
21 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same(DisasContext *s, uint32_t insn) | 37 | @@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3(DisasContext *s, bool is_q, int rd, |
22 | } | 38 | vec_full_reg_size(s), gvec_op); |
23 | } | 39 | } |
24 | 40 | ||
25 | +/* | 41 | +/* Expand a 3-operand + env pointer operation using |
26 | + * Advanced SIMD three same (ARMv8.2 FP16 variants) | 42 | + * an out-of-line helper. |
27 | + * | ||
28 | + * 31 30 29 28 24 23 22 21 20 16 15 14 13 11 10 9 5 4 0 | ||
29 | + * +---+---+---+-----------+---------+------+-----+--------+---+------+------+ | ||
30 | + * | 0 | Q | U | 0 1 1 1 0 | a | 1 0 | Rm | 0 0 | opcode | 1 | Rn | Rd | | ||
31 | + * +---+---+---+-----------+---------+------+-----+--------+---+------+------+ | ||
32 | + * | ||
33 | + * This includes FMULX, FCMEQ (register), FRECPS, FRSQRTS, FCMGE | ||
34 | + * (register), FACGE, FABD, FCMGT (register) and FACGT. | ||
35 | + * | ||
36 | + */ | 43 | + */ |
37 | +static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 44 | +static void gen_gvec_op3_env(DisasContext *s, bool is_q, int rd, |
38 | +{ | 45 | + int rn, int rm, gen_helper_gvec_3_ptr *fn) |
39 | + int opcode, fpopcode; | 46 | +{ |
40 | + int is_q, u, a, rm, rn, rd; | 47 | + tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd), |
41 | + int datasize, elements; | 48 | + vec_full_reg_offset(s, rn), |
42 | + int pass; | 49 | + vec_full_reg_offset(s, rm), cpu_env, |
43 | + TCGv_ptr fpst; | 50 | + is_q ? 16 : 8, vec_full_reg_size(s), 0, fn); |
44 | + | 51 | +} |
45 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 52 | + |
53 | /* Set ZF and NF based on a 64 bit result. This is alas fiddlier | ||
54 | * than the 32 bit equivalent. | ||
55 | */ | ||
56 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
57 | clear_vec_high(s, is_q, rd); | ||
58 | } | ||
59 | |||
60 | +/* AdvSIMD three same extra | ||
61 | + * 31 30 29 28 24 23 22 21 20 16 15 14 11 10 9 5 4 0 | ||
62 | + * +---+---+---+-----------+------+---+------+---+--------+---+----+----+ | ||
63 | + * | 0 | Q | U | 0 1 1 1 0 | size | 0 | Rm | 1 | opcode | 1 | Rn | Rd | | ||
64 | + * +---+---+---+-----------+------+---+------+---+--------+---+----+----+ | ||
65 | + */ | ||
66 | +static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) | ||
67 | +{ | ||
68 | + int rd = extract32(insn, 0, 5); | ||
69 | + int rn = extract32(insn, 5, 5); | ||
70 | + int opcode = extract32(insn, 11, 4); | ||
71 | + int rm = extract32(insn, 16, 5); | ||
72 | + int size = extract32(insn, 22, 2); | ||
73 | + bool u = extract32(insn, 29, 1); | ||
74 | + bool is_q = extract32(insn, 30, 1); | ||
75 | + int feature; | ||
76 | + | ||
77 | + switch (u * 16 + opcode) { | ||
78 | + case 0x10: /* SQRDMLAH (vector) */ | ||
79 | + case 0x11: /* SQRDMLSH (vector) */ | ||
80 | + if (size != 1 && size != 2) { | ||
81 | + unallocated_encoding(s); | ||
82 | + return; | ||
83 | + } | ||
84 | + feature = ARM_FEATURE_V8_RDM; | ||
85 | + break; | ||
86 | + default: | ||
46 | + unallocated_encoding(s); | 87 | + unallocated_encoding(s); |
47 | + return; | 88 | + return; |
48 | + } | 89 | + } |
49 | + | 90 | + if (!arm_dc_feature(s, feature)) { |
91 | + unallocated_encoding(s); | ||
92 | + return; | ||
93 | + } | ||
50 | + if (!fp_access_check(s)) { | 94 | + if (!fp_access_check(s)) { |
51 | + return; | 95 | + return; |
52 | + } | 96 | + } |
53 | + | 97 | + |
54 | + /* For these floating point ops, the U, a and opcode bits | 98 | + switch (opcode) { |
55 | + * together indicate the operation. | 99 | + case 0x0: /* SQRDMLAH (vector) */ |
56 | + */ | 100 | + switch (size) { |
57 | + opcode = extract32(insn, 11, 3); | 101 | + case 1: |
58 | + u = extract32(insn, 29, 1); | 102 | + gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlah_s16); |
59 | + a = extract32(insn, 23, 1); | 103 | + break; |
60 | + is_q = extract32(insn, 30, 1); | 104 | + case 2: |
61 | + rm = extract32(insn, 16, 5); | 105 | + gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlah_s32); |
62 | + rn = extract32(insn, 5, 5); | 106 | + break; |
63 | + rd = extract32(insn, 0, 5); | ||
64 | + | ||
65 | + fpopcode = opcode | (a << 3) | (u << 4); | ||
66 | + datasize = is_q ? 128 : 64; | ||
67 | + elements = datasize / 16; | ||
68 | + | ||
69 | + fpst = get_fpstatus_ptr(true); | ||
70 | + | ||
71 | + for (pass = 0; pass < elements; pass++) { | ||
72 | + TCGv_i32 tcg_op1 = tcg_temp_new_i32(); | ||
73 | + TCGv_i32 tcg_op2 = tcg_temp_new_i32(); | ||
74 | + TCGv_i32 tcg_res = tcg_temp_new_i32(); | ||
75 | + | ||
76 | + read_vec_element_i32(s, tcg_op1, rn, pass, MO_16); | ||
77 | + read_vec_element_i32(s, tcg_op2, rm, pass, MO_16); | ||
78 | + | ||
79 | + switch (fpopcode) { | ||
80 | + default: | 107 | + default: |
81 | + fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n", | ||
82 | + __func__, insn, fpopcode, s->pc); | ||
83 | + g_assert_not_reached(); | 108 | + g_assert_not_reached(); |
84 | + } | 109 | + } |
85 | + | 110 | + return; |
86 | + write_vec_element_i32(s, tcg_res, rd, pass, MO_16); | 111 | + |
87 | + tcg_temp_free_i32(tcg_res); | 112 | + case 0x1: /* SQRDMLSH (vector) */ |
88 | + tcg_temp_free_i32(tcg_op1); | 113 | + switch (size) { |
89 | + tcg_temp_free_i32(tcg_op2); | 114 | + case 1: |
90 | + } | 115 | + gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlsh_s16); |
91 | + | 116 | + break; |
92 | + tcg_temp_free_ptr(fpst); | 117 | + case 2: |
93 | + | 118 | + gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlsh_s32); |
94 | + clear_vec_high(s, is_q, rd); | 119 | + break; |
120 | + default: | ||
121 | + g_assert_not_reached(); | ||
122 | + } | ||
123 | + return; | ||
124 | + | ||
125 | + default: | ||
126 | + g_assert_not_reached(); | ||
127 | + } | ||
95 | +} | 128 | +} |
96 | + | 129 | + |
97 | static void handle_2misc_widening(DisasContext *s, int opcode, bool is_q, | 130 | static void handle_2misc_widening(DisasContext *s, int opcode, bool is_q, |
98 | int size, int rn, int rd) | 131 | int size, int rn, int rd) |
99 | { | 132 | { |
100 | @@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = { | 133 | @@ -XXX,XX +XXX,XX @@ static void disas_crypto_three_reg_imm2(DisasContext *s, uint32_t insn) |
101 | { 0xce000000, 0xff808000, disas_crypto_four_reg }, | 134 | static const AArch64DecodeTable data_proc_simd[] = { |
102 | { 0xce800000, 0xffe00000, disas_crypto_xar }, | 135 | /* pattern , mask , fn */ |
103 | { 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 }, | 136 | { 0x0e200400, 0x9f200400, disas_simd_three_reg_same }, |
104 | + { 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 }, | 137 | + { 0x0e008400, 0x9f208400, disas_simd_three_reg_same_extra }, |
105 | { 0x00000000, 0x00000000, NULL } | 138 | { 0x0e200000, 0x9f200c00, disas_simd_three_reg_diff }, |
106 | }; | 139 | { 0x0e200800, 0x9f3e0c00, disas_simd_two_reg_misc }, |
107 | 140 | { 0x0e300800, 0x9f3e0c00, disas_simd_across_lanes }, | |
141 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
142 | index XXXXXXX..XXXXXXX 100644 | ||
143 | --- a/target/arm/vec_helper.c | ||
144 | +++ b/target/arm/vec_helper.c | ||
145 | @@ -XXX,XX +XXX,XX @@ | ||
146 | |||
147 | #define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q | ||
148 | |||
149 | +static void clear_tail(void *vd, uintptr_t opr_sz, uintptr_t max_sz) | ||
150 | +{ | ||
151 | + uint64_t *d = vd + opr_sz; | ||
152 | + uintptr_t i; | ||
153 | + | ||
154 | + for (i = opr_sz; i < max_sz; i += 8) { | ||
155 | + *d++ = 0; | ||
156 | + } | ||
157 | +} | ||
158 | + | ||
159 | /* Signed saturating rounding doubling multiply-accumulate high half, 16-bit */ | ||
160 | static uint16_t inl_qrdmlah_s16(CPUARMState *env, int16_t src1, | ||
161 | int16_t src2, int16_t src3) | ||
162 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlah_s16)(CPUARMState *env, uint32_t src1, | ||
163 | return deposit32(e1, 16, 16, e2); | ||
164 | } | ||
165 | |||
166 | +void HELPER(gvec_qrdmlah_s16)(void *vd, void *vn, void *vm, | ||
167 | + void *ve, uint32_t desc) | ||
168 | +{ | ||
169 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
170 | + int16_t *d = vd; | ||
171 | + int16_t *n = vn; | ||
172 | + int16_t *m = vm; | ||
173 | + CPUARMState *env = ve; | ||
174 | + uintptr_t i; | ||
175 | + | ||
176 | + for (i = 0; i < opr_sz / 2; ++i) { | ||
177 | + d[i] = inl_qrdmlah_s16(env, n[i], m[i], d[i]); | ||
178 | + } | ||
179 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
180 | +} | ||
181 | + | ||
182 | /* Signed saturating rounding doubling multiply-subtract high half, 16-bit */ | ||
183 | static uint16_t inl_qrdmlsh_s16(CPUARMState *env, int16_t src1, | ||
184 | int16_t src2, int16_t src3) | ||
185 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlsh_s16)(CPUARMState *env, uint32_t src1, | ||
186 | return deposit32(e1, 16, 16, e2); | ||
187 | } | ||
188 | |||
189 | +void HELPER(gvec_qrdmlsh_s16)(void *vd, void *vn, void *vm, | ||
190 | + void *ve, uint32_t desc) | ||
191 | +{ | ||
192 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
193 | + int16_t *d = vd; | ||
194 | + int16_t *n = vn; | ||
195 | + int16_t *m = vm; | ||
196 | + CPUARMState *env = ve; | ||
197 | + uintptr_t i; | ||
198 | + | ||
199 | + for (i = 0; i < opr_sz / 2; ++i) { | ||
200 | + d[i] = inl_qrdmlsh_s16(env, n[i], m[i], d[i]); | ||
201 | + } | ||
202 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
203 | +} | ||
204 | + | ||
205 | /* Signed saturating rounding doubling multiply-accumulate high half, 32-bit */ | ||
206 | uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1, | ||
207 | int32_t src2, int32_t src3) | ||
208 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1, | ||
209 | return ret; | ||
210 | } | ||
211 | |||
212 | +void HELPER(gvec_qrdmlah_s32)(void *vd, void *vn, void *vm, | ||
213 | + void *ve, uint32_t desc) | ||
214 | +{ | ||
215 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
216 | + int32_t *d = vd; | ||
217 | + int32_t *n = vn; | ||
218 | + int32_t *m = vm; | ||
219 | + CPUARMState *env = ve; | ||
220 | + uintptr_t i; | ||
221 | + | ||
222 | + for (i = 0; i < opr_sz / 4; ++i) { | ||
223 | + d[i] = helper_neon_qrdmlah_s32(env, n[i], m[i], d[i]); | ||
224 | + } | ||
225 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
226 | +} | ||
227 | + | ||
228 | /* Signed saturating rounding doubling multiply-subtract high half, 32-bit */ | ||
229 | uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1, | ||
230 | int32_t src2, int32_t src3) | ||
231 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1, | ||
232 | } | ||
233 | return ret; | ||
234 | } | ||
235 | + | ||
236 | +void HELPER(gvec_qrdmlsh_s32)(void *vd, void *vn, void *vm, | ||
237 | + void *ve, uint32_t desc) | ||
238 | +{ | ||
239 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
240 | + int32_t *d = vd; | ||
241 | + int32_t *n = vn; | ||
242 | + int32_t *m = vm; | ||
243 | + CPUARMState *env = ve; | ||
244 | + uintptr_t i; | ||
245 | + | ||
246 | + for (i = 0; i < opr_sz / 4; ++i) { | ||
247 | + d[i] = helper_neon_qrdmlsh_s32(env, n[i], m[i], d[i]); | ||
248 | + } | ||
249 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
250 | +} | ||
108 | -- | 251 | -- |
109 | 2.16.2 | 252 | 2.16.2 |
110 | 253 | ||
111 | 254 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 3 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20180227143852.11175-26-alex.bennee@linaro.org | 5 | Message-id: 20180228193125.20577-7-richard.henderson@linaro.org |
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 7 | --- |
8 | target/arm/helper-a64.h | 1 + | 8 | target/arm/translate-a64.c | 29 +++++++++++++++++++++++++++++ |
9 | target/arm/helper-a64.c | 13 +++++++++++++ | 9 | 1 file changed, 29 insertions(+) |
10 | target/arm/translate-a64.c | 5 +++++ | ||
11 | 3 files changed, 19 insertions(+) | ||
12 | 10 | ||
13 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | ||
14 | index XXXXXXX..XXXXXXX 100644 | ||
15 | --- a/target/arm/helper-a64.h | ||
16 | +++ b/target/arm/helper-a64.h | ||
17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr) | ||
18 | DEF_HELPER_2(advsimd_rinth, f16, f16, ptr) | ||
19 | DEF_HELPER_2(advsimd_f16tosinth, i32, f16, ptr) | ||
20 | DEF_HELPER_2(advsimd_f16touinth, i32, f16, ptr) | ||
21 | +DEF_HELPER_2(sqrt_f16, f16, f16, ptr) | ||
22 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | ||
23 | index XXXXXXX..XXXXXXX 100644 | ||
24 | --- a/target/arm/helper-a64.c | ||
25 | +++ b/target/arm/helper-a64.c | ||
26 | @@ -XXX,XX +XXX,XX @@ uint32_t HELPER(advsimd_f16touinth)(float16 a, void *fpstp) | ||
27 | } | ||
28 | return float16_to_uint16(a, fpst); | ||
29 | } | ||
30 | + | ||
31 | +/* | ||
32 | + * Square Root and Reciprocal square root | ||
33 | + */ | ||
34 | + | ||
35 | +float16 HELPER(sqrt_f16)(float16 a, void *fpstp) | ||
36 | +{ | ||
37 | + float_status *s = fpstp; | ||
38 | + | ||
39 | + return float16_sqrt(a, s); | ||
40 | +} | ||
41 | + | ||
42 | + | ||
43 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 11 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
44 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
45 | --- a/target/arm/translate-a64.c | 13 | --- a/target/arm/translate-a64.c |
46 | +++ b/target/arm/translate-a64.c | 14 | +++ b/target/arm/translate-a64.c |
47 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 15 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
48 | case 0x6f: /* FNEG */ | 16 | case 0x19: /* FMULX */ |
49 | need_fpst = false; | 17 | is_fp = true; |
50 | break; | 18 | break; |
51 | + case 0x7f: /* FSQRT (vector) */ | 19 | + case 0x1d: /* SQRDMLAH */ |
20 | + case 0x1f: /* SQRDMLSH */ | ||
21 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_RDM)) { | ||
22 | + unallocated_encoding(s); | ||
23 | + return; | ||
24 | + } | ||
52 | + break; | 25 | + break; |
53 | default: | 26 | default: |
54 | fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop); | 27 | unallocated_encoding(s); |
55 | g_assert_not_reached(); | 28 | return; |
56 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 29 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
57 | case 0x6f: /* FNEG */ | 30 | tcg_op, tcg_idx); |
58 | tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000); | 31 | } |
59 | break; | 32 | break; |
60 | + case 0x7f: /* FSQRT */ | 33 | + case 0x1d: /* SQRDMLAH */ |
61 | + gen_helper_sqrt_f16(tcg_res, tcg_op, tcg_fpstatus); | 34 | + read_vec_element_i32(s, tcg_res, rd, pass, |
35 | + is_scalar ? size : MO_32); | ||
36 | + if (size == 1) { | ||
37 | + gen_helper_neon_qrdmlah_s16(tcg_res, cpu_env, | ||
38 | + tcg_op, tcg_idx, tcg_res); | ||
39 | + } else { | ||
40 | + gen_helper_neon_qrdmlah_s32(tcg_res, cpu_env, | ||
41 | + tcg_op, tcg_idx, tcg_res); | ||
42 | + } | ||
43 | + break; | ||
44 | + case 0x1f: /* SQRDMLSH */ | ||
45 | + read_vec_element_i32(s, tcg_res, rd, pass, | ||
46 | + is_scalar ? size : MO_32); | ||
47 | + if (size == 1) { | ||
48 | + gen_helper_neon_qrdmlsh_s16(tcg_res, cpu_env, | ||
49 | + tcg_op, tcg_idx, tcg_res); | ||
50 | + } else { | ||
51 | + gen_helper_neon_qrdmlsh_s32(tcg_res, cpu_env, | ||
52 | + tcg_op, tcg_idx, tcg_res); | ||
53 | + } | ||
62 | + break; | 54 | + break; |
63 | default: | 55 | default: |
64 | g_assert_not_reached(); | 56 | g_assert_not_reached(); |
65 | } | 57 | } |
66 | -- | 58 | -- |
67 | 2.16.2 | 59 | 2.16.2 |
68 | 60 | ||
69 | 61 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This covers all the floating point convert operations. | 3 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
4 | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | |
5 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Message-id: 20180228193125.20577-8-richard.henderson@linaro.org |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20180227143852.11175-19-alex.bennee@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 7 | --- |
10 | target/arm/helper-a64.h | 2 ++ | 8 | target/arm/translate.c | 86 +++++++++++++++++++++++++++++++++++++++----------- |
11 | target/arm/helper-a64.c | 32 +++++++++++++++++ | 9 | 1 file changed, 67 insertions(+), 19 deletions(-) |
12 | target/arm/translate-a64.c | 85 +++++++++++++++++++++++++++++++++++++++++++++- | ||
13 | 3 files changed, 118 insertions(+), 1 deletion(-) | ||
14 | 10 | ||
15 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 11 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
16 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-a64.h | 13 | --- a/target/arm/translate.c |
18 | +++ b/target/arm/helper-a64.h | 14 | +++ b/target/arm/translate.c |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr) | 15 | @@ -XXX,XX +XXX,XX @@ |
20 | DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr) | 16 | #include "disas/disas.h" |
21 | DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr) | 17 | #include "exec/exec-all.h" |
22 | DEF_HELPER_2(advsimd_rinth, f16, f16, ptr) | 18 | #include "tcg-op.h" |
23 | +DEF_HELPER_2(advsimd_f16tosinth, i32, f16, ptr) | 19 | +#include "tcg-op-gvec.h" |
24 | +DEF_HELPER_2(advsimd_f16touinth, i32, f16, ptr) | 20 | #include "qemu/log.h" |
25 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 21 | #include "qemu/bitops.h" |
26 | index XXXXXXX..XXXXXXX 100644 | 22 | #include "arm_ldst.h" |
27 | --- a/target/arm/helper-a64.c | 23 | @@ -XXX,XX +XXX,XX @@ static void gen_neon_narrow_op(int op, int u, int size, |
28 | +++ b/target/arm/helper-a64.c | 24 | #define NEON_3R_VPMAX 20 |
29 | @@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_rinth)(float16 x, void *fp_status) | 25 | #define NEON_3R_VPMIN 21 |
30 | 26 | #define NEON_3R_VQDMULH_VQRDMULH 22 | |
31 | return ret; | 27 | -#define NEON_3R_VPADD 23 |
32 | } | 28 | +#define NEON_3R_VPADD_VQRDMLAH 23 |
29 | #define NEON_3R_SHA 24 /* SHA1C,SHA1P,SHA1M,SHA1SU0,SHA256H{2},SHA256SU1 */ | ||
30 | -#define NEON_3R_VFM 25 /* VFMA, VFMS : float fused multiply-add */ | ||
31 | +#define NEON_3R_VFM_VQRDMLSH 25 /* VFMA, VFMS, VQRDMLSH */ | ||
32 | #define NEON_3R_FLOAT_ARITH 26 /* float VADD, VSUB, VPADD, VABD */ | ||
33 | #define NEON_3R_FLOAT_MULTIPLY 27 /* float VMLA, VMLS, VMUL */ | ||
34 | #define NEON_3R_FLOAT_CMP 28 /* float VCEQ, VCGE, VCGT */ | ||
35 | @@ -XXX,XX +XXX,XX @@ static const uint8_t neon_3r_sizes[] = { | ||
36 | [NEON_3R_VPMAX] = 0x7, | ||
37 | [NEON_3R_VPMIN] = 0x7, | ||
38 | [NEON_3R_VQDMULH_VQRDMULH] = 0x6, | ||
39 | - [NEON_3R_VPADD] = 0x7, | ||
40 | + [NEON_3R_VPADD_VQRDMLAH] = 0x7, | ||
41 | [NEON_3R_SHA] = 0xf, /* size field encodes op type */ | ||
42 | - [NEON_3R_VFM] = 0x5, /* size bit 1 encodes op */ | ||
43 | + [NEON_3R_VFM_VQRDMLSH] = 0x7, /* For VFM, size bit 1 encodes op */ | ||
44 | [NEON_3R_FLOAT_ARITH] = 0x5, /* size bit 1 encodes op */ | ||
45 | [NEON_3R_FLOAT_MULTIPLY] = 0x5, /* size bit 1 encodes op */ | ||
46 | [NEON_3R_FLOAT_CMP] = 0x5, /* size bit 1 encodes op */ | ||
47 | @@ -XXX,XX +XXX,XX @@ static const uint8_t neon_2rm_sizes[] = { | ||
48 | [NEON_2RM_VCVT_UF] = 0x4, | ||
49 | }; | ||
50 | |||
33 | + | 51 | + |
34 | +/* | 52 | +/* Expand v8.1 simd helper. */ |
35 | + * Half-precision floating point conversion functions | 53 | +static int do_v81_helper(DisasContext *s, gen_helper_gvec_3_ptr *fn, |
36 | + * | 54 | + int q, int rd, int rn, int rm) |
37 | + * There are a multitude of conversion functions with various | ||
38 | + * different rounding modes. This is dealt with by the calling code | ||
39 | + * setting the mode appropriately before calling the helper. | ||
40 | + */ | ||
41 | + | ||
42 | +uint32_t HELPER(advsimd_f16tosinth)(float16 a, void *fpstp) | ||
43 | +{ | 55 | +{ |
44 | + float_status *fpst = fpstp; | 56 | + if (arm_dc_feature(s, ARM_FEATURE_V8_RDM)) { |
45 | + | 57 | + int opr_sz = (1 + q) * 8; |
46 | + /* Invalid if we are passed a NaN */ | 58 | + tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd), |
47 | + if (float16_is_any_nan(a)) { | 59 | + vfp_reg_offset(1, rn), |
48 | + float_raise(float_flag_invalid, fpst); | 60 | + vfp_reg_offset(1, rm), cpu_env, |
61 | + opr_sz, opr_sz, 0, fn); | ||
49 | + return 0; | 62 | + return 0; |
50 | + } | 63 | + } |
51 | + return float16_to_int16(a, fpst); | 64 | + return 1; |
52 | +} | 65 | +} |
53 | + | 66 | + |
54 | +uint32_t HELPER(advsimd_f16touinth)(float16 a, void *fpstp) | 67 | /* Translate a NEON data processing instruction. Return nonzero if the |
55 | +{ | 68 | instruction is invalid. |
56 | + float_status *fpst = fpstp; | 69 | We process data in a mixture of 32-bit and 64-bit chunks. |
70 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
71 | if (q && ((rd | rn | rm) & 1)) { | ||
72 | return 1; | ||
73 | } | ||
74 | - /* | ||
75 | - * The SHA-1/SHA-256 3-register instructions require special treatment | ||
76 | - * here, as their size field is overloaded as an op type selector, and | ||
77 | - * they all consume their input in a single pass. | ||
78 | - */ | ||
79 | - if (op == NEON_3R_SHA) { | ||
80 | + switch (op) { | ||
81 | + case NEON_3R_SHA: | ||
82 | + /* The SHA-1/SHA-256 3-register instructions require special | ||
83 | + * treatment here, as their size field is overloaded as an | ||
84 | + * op type selector, and they all consume their input in a | ||
85 | + * single pass. | ||
86 | + */ | ||
87 | if (!q) { | ||
88 | return 1; | ||
89 | } | ||
90 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
91 | tcg_temp_free_ptr(ptr2); | ||
92 | tcg_temp_free_ptr(ptr3); | ||
93 | return 0; | ||
57 | + | 94 | + |
58 | + /* Invalid if we are passed a NaN */ | 95 | + case NEON_3R_VPADD_VQRDMLAH: |
59 | + if (float16_is_any_nan(a)) { | 96 | + if (!u) { |
60 | + float_raise(float_flag_invalid, fpst); | 97 | + break; /* VPADD */ |
61 | + return 0; | 98 | + } |
62 | + } | 99 | + /* VQRDMLAH */ |
63 | + return float16_to_uint16(a, fpst); | 100 | + switch (size) { |
64 | +} | 101 | + case 1: |
65 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 102 | + return do_v81_helper(s, gen_helper_gvec_qrdmlah_s16, |
66 | index XXXXXXX..XXXXXXX 100644 | 103 | + q, rd, rn, rm); |
67 | --- a/target/arm/translate-a64.c | 104 | + case 2: |
68 | +++ b/target/arm/translate-a64.c | 105 | + return do_v81_helper(s, gen_helper_gvec_qrdmlah_s32, |
69 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 106 | + q, rd, rn, rm); |
70 | only_in_vector = true; | 107 | + } |
71 | /* current rounding mode */ | 108 | + return 1; |
72 | break; | ||
73 | + case 0x1a: /* FCVTNS */ | ||
74 | + need_rmode = true; | ||
75 | + rmode = FPROUNDING_TIEEVEN; | ||
76 | + break; | ||
77 | + case 0x1b: /* FCVTMS */ | ||
78 | + need_rmode = true; | ||
79 | + rmode = FPROUNDING_NEGINF; | ||
80 | + break; | ||
81 | + case 0x1c: /* FCVTAS */ | ||
82 | + need_rmode = true; | ||
83 | + rmode = FPROUNDING_TIEAWAY; | ||
84 | + break; | ||
85 | + case 0x3a: /* FCVTPS */ | ||
86 | + need_rmode = true; | ||
87 | + rmode = FPROUNDING_POSINF; | ||
88 | + break; | ||
89 | + case 0x3b: /* FCVTZS */ | ||
90 | + need_rmode = true; | ||
91 | + rmode = FPROUNDING_ZERO; | ||
92 | + break; | ||
93 | + case 0x5a: /* FCVTNU */ | ||
94 | + need_rmode = true; | ||
95 | + rmode = FPROUNDING_TIEEVEN; | ||
96 | + break; | ||
97 | + case 0x5b: /* FCVTMU */ | ||
98 | + need_rmode = true; | ||
99 | + rmode = FPROUNDING_NEGINF; | ||
100 | + break; | ||
101 | + case 0x5c: /* FCVTAU */ | ||
102 | + need_rmode = true; | ||
103 | + rmode = FPROUNDING_TIEAWAY; | ||
104 | + break; | ||
105 | + case 0x7a: /* FCVTPU */ | ||
106 | + need_rmode = true; | ||
107 | + rmode = FPROUNDING_POSINF; | ||
108 | + break; | ||
109 | + case 0x7b: /* FCVTZU */ | ||
110 | + need_rmode = true; | ||
111 | + rmode = FPROUNDING_ZERO; | ||
112 | + break; | ||
113 | default: | ||
114 | fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop); | ||
115 | g_assert_not_reached(); | ||
116 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | ||
117 | } | ||
118 | |||
119 | if (is_scalar) { | ||
120 | - /* no operations yet */ | ||
121 | + TCGv_i32 tcg_op = tcg_temp_new_i32(); | ||
122 | + TCGv_i32 tcg_res = tcg_temp_new_i32(); | ||
123 | + | 109 | + |
124 | + read_vec_element_i32(s, tcg_op, rn, 0, MO_16); | 110 | + case NEON_3R_VFM_VQRDMLSH: |
125 | + | 111 | + if (!u) { |
126 | + switch (fpop) { | 112 | + /* VFM, VFMS */ |
127 | + case 0x1a: /* FCVTNS */ | 113 | + if (size == 1) { |
128 | + case 0x1b: /* FCVTMS */ | 114 | + return 1; |
129 | + case 0x1c: /* FCVTAS */ | 115 | + } |
130 | + case 0x3a: /* FCVTPS */ | ||
131 | + case 0x3b: /* FCVTZS */ | ||
132 | + gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus); | ||
133 | + break; | ||
134 | + case 0x5a: /* FCVTNU */ | ||
135 | + case 0x5b: /* FCVTMU */ | ||
136 | + case 0x5c: /* FCVTAU */ | ||
137 | + case 0x7a: /* FCVTPU */ | ||
138 | + case 0x7b: /* FCVTZU */ | ||
139 | + gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus); | ||
140 | + break; | ||
141 | + default: | ||
142 | + g_assert_not_reached(); | ||
143 | + } | ||
144 | + | ||
145 | + /* limit any sign extension going on */ | ||
146 | + tcg_gen_andi_i32(tcg_res, tcg_res, 0xffff); | ||
147 | + write_fp_sreg(s, rd, tcg_res); | ||
148 | + | ||
149 | + tcg_temp_free_i32(tcg_res); | ||
150 | + tcg_temp_free_i32(tcg_op); | ||
151 | } else { | ||
152 | for (pass = 0; pass < (is_q ? 8 : 4); pass++) { | ||
153 | TCGv_i32 tcg_op = tcg_temp_new_i32(); | ||
154 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | ||
155 | read_vec_element_i32(s, tcg_op, rn, pass, MO_16); | ||
156 | |||
157 | switch (fpop) { | ||
158 | + case 0x1a: /* FCVTNS */ | ||
159 | + case 0x1b: /* FCVTMS */ | ||
160 | + case 0x1c: /* FCVTAS */ | ||
161 | + case 0x3a: /* FCVTPS */ | ||
162 | + case 0x3b: /* FCVTZS */ | ||
163 | + gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus); | ||
164 | + break; | 116 | + break; |
165 | + case 0x5a: /* FCVTNU */ | 117 | + } |
166 | + case 0x5b: /* FCVTMU */ | 118 | + /* VQRDMLSH */ |
167 | + case 0x5c: /* FCVTAU */ | 119 | + switch (size) { |
168 | + case 0x7a: /* FCVTPU */ | 120 | + case 1: |
169 | + case 0x7b: /* FCVTZU */ | 121 | + return do_v81_helper(s, gen_helper_gvec_qrdmlsh_s16, |
170 | + gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus); | 122 | + q, rd, rn, rm); |
171 | + break; | 123 | + case 2: |
172 | case 0x18: /* FRINTN */ | 124 | + return do_v81_helper(s, gen_helper_gvec_qrdmlsh_s32, |
173 | case 0x19: /* FRINTM */ | 125 | + q, rd, rn, rm); |
174 | case 0x38: /* FRINTP */ | 126 | + } |
127 | + return 1; | ||
128 | } | ||
129 | if (size == 3 && op != NEON_3R_LOGIC) { | ||
130 | /* 64-bit element instructions. */ | ||
131 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
132 | rm = rtmp; | ||
133 | } | ||
134 | break; | ||
135 | - case NEON_3R_VPADD: | ||
136 | - if (u) { | ||
137 | - return 1; | ||
138 | - } | ||
139 | - /* Fall through */ | ||
140 | + case NEON_3R_VPADD_VQRDMLAH: | ||
141 | case NEON_3R_VPMAX: | ||
142 | case NEON_3R_VPMIN: | ||
143 | pairwise = 1; | ||
144 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
145 | return 1; | ||
146 | } | ||
147 | break; | ||
148 | - case NEON_3R_VFM: | ||
149 | - if (!arm_dc_feature(s, ARM_FEATURE_VFP4) || u) { | ||
150 | + case NEON_3R_VFM_VQRDMLSH: | ||
151 | + if (!arm_dc_feature(s, ARM_FEATURE_VFP4)) { | ||
152 | return 1; | ||
153 | } | ||
154 | break; | ||
155 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
156 | } | ||
157 | } | ||
158 | break; | ||
159 | - case NEON_3R_VPADD: | ||
160 | + case NEON_3R_VPADD_VQRDMLAH: | ||
161 | switch (size) { | ||
162 | case 0: gen_helper_neon_padd_u8(tmp, tmp, tmp2); break; | ||
163 | case 1: gen_helper_neon_padd_u16(tmp, tmp, tmp2); break; | ||
164 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
165 | } | ||
166 | } | ||
167 | break; | ||
168 | - case NEON_3R_VFM: | ||
169 | + case NEON_3R_VFM_VQRDMLSH: | ||
170 | { | ||
171 | /* VFMA, VFMS: fused multiply-add */ | ||
172 | TCGv_ptr fpstatus = get_fpstatus_ptr(1); | ||
175 | -- | 173 | -- |
176 | 2.16.2 | 174 | 2.16.2 |
177 | 175 | ||
178 | 176 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 3 | Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org> |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
5 | Message-id: 20180227143852.11175-12-alex.bennee@linaro.org | 5 | Message-id: 20180228193125.20577-9-richard.henderson@linaro.org |
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 7 | --- |
8 | target/arm/helper-a64.h | 2 ++ | 8 | target/arm/translate.c | 46 ++++++++++++++++++++++++++++++++++++++++++---- |
9 | target/arm/helper-a64.c | 24 ++++++++++++++++++++++++ | 9 | 1 file changed, 42 insertions(+), 4 deletions(-) |
10 | target/arm/translate-a64.c | 15 +++++++++++++++ | ||
11 | 3 files changed, 41 insertions(+) | ||
12 | 10 | ||
13 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 11 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
14 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
15 | --- a/target/arm/helper-a64.h | 13 | --- a/target/arm/translate.c |
16 | +++ b/target/arm/helper-a64.h | 14 | +++ b/target/arm/translate.c |
17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_cge_f16, i32, f16, f16, ptr) | 15 | @@ -XXX,XX +XXX,XX @@ static const char *regnames[] = |
18 | DEF_HELPER_3(advsimd_cgt_f16, i32, f16, f16, ptr) | 16 | { "r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7", |
19 | DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr) | 17 | "r8", "r9", "r10", "r11", "r12", "r13", "r14", "pc" }; |
20 | DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr) | 18 | |
21 | +DEF_HELPER_3(advsimd_mulxh, f16, f16, f16, ptr) | 19 | +/* Function prototypes for gen_ functions calling Neon helpers. */ |
22 | +DEF_HELPER_4(advsimd_muladdh, f16, f16, f16, f16, ptr) | 20 | +typedef void NeonGenThreeOpEnvFn(TCGv_i32, TCGv_env, TCGv_i32, |
23 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 21 | + TCGv_i32, TCGv_i32); |
24 | index XXXXXXX..XXXXXXX 100644 | ||
25 | --- a/target/arm/helper-a64.c | ||
26 | +++ b/target/arm/helper-a64.c | ||
27 | @@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(max) | ||
28 | ADVSIMD_HALFOP(minnum) | ||
29 | ADVSIMD_HALFOP(maxnum) | ||
30 | |||
31 | +/* Data processing - scalar floating-point and advanced SIMD */ | ||
32 | +float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp) | ||
33 | +{ | ||
34 | + float_status *fpst = fpstp; | ||
35 | + | 22 | + |
36 | + a = float16_squash_input_denormal(a, fpst); | 23 | /* initialize TCG globals. */ |
37 | + b = float16_squash_input_denormal(b, fpst); | 24 | void arm_translate_init(void) |
25 | { | ||
26 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) | ||
27 | } | ||
28 | neon_store_reg64(cpu_V0, rd + pass); | ||
29 | } | ||
30 | - | ||
31 | - | ||
32 | break; | ||
33 | - default: /* 14 and 15 are RESERVED */ | ||
34 | - return 1; | ||
35 | + case 14: /* VQRDMLAH scalar */ | ||
36 | + case 15: /* VQRDMLSH scalar */ | ||
37 | + { | ||
38 | + NeonGenThreeOpEnvFn *fn; | ||
38 | + | 39 | + |
39 | + if ((float16_is_zero(a) && float16_is_infinity(b)) || | 40 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_RDM)) { |
40 | + (float16_is_infinity(a) && float16_is_zero(b))) { | 41 | + return 1; |
41 | + /* 2.0 with the sign bit set to sign(A) XOR sign(B) */ | 42 | + } |
42 | + return make_float16((1U << 14) | | 43 | + if (u && ((rd | rn) & 1)) { |
43 | + ((float16_val(a) ^ float16_val(b)) & (1U << 15))); | 44 | + return 1; |
44 | + } | 45 | + } |
45 | + return float16_mul(a, b, fpst); | 46 | + if (op == 14) { |
46 | +} | 47 | + if (size == 1) { |
48 | + fn = gen_helper_neon_qrdmlah_s16; | ||
49 | + } else { | ||
50 | + fn = gen_helper_neon_qrdmlah_s32; | ||
51 | + } | ||
52 | + } else { | ||
53 | + if (size == 1) { | ||
54 | + fn = gen_helper_neon_qrdmlsh_s16; | ||
55 | + } else { | ||
56 | + fn = gen_helper_neon_qrdmlsh_s32; | ||
57 | + } | ||
58 | + } | ||
47 | + | 59 | + |
48 | +/* fused multiply-accumulate */ | 60 | + tmp2 = neon_get_scalar(size, rm); |
49 | +float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp) | 61 | + for (pass = 0; pass < (u ? 4 : 2); pass++) { |
50 | +{ | 62 | + tmp = neon_load_reg(rn, pass); |
51 | + float_status *fpst = fpstp; | 63 | + tmp3 = neon_load_reg(rd, pass); |
52 | + return float16_muladd(a, b, c, 0, fpst); | 64 | + fn(tmp, cpu_env, tmp, tmp2, tmp3); |
53 | +} | 65 | + tcg_temp_free_i32(tmp3); |
54 | + | 66 | + neon_store_reg(rd, pass, tmp); |
55 | /* | 67 | + } |
56 | * Floating point comparisons produce an integer result. Softfloat | 68 | + tcg_temp_free_i32(tmp2); |
57 | * routines return float_relation types which we convert to the 0/-1 | 69 | + } |
58 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 70 | + break; |
59 | index XXXXXXX..XXXXXXX 100644 | 71 | + default: |
60 | --- a/target/arm/translate-a64.c | 72 | + g_assert_not_reached(); |
61 | +++ b/target/arm/translate-a64.c | 73 | } |
62 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | 74 | } |
63 | case 0x0: /* FMAXNM */ | 75 | } else { /* size == 3 */ |
64 | gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
65 | break; | ||
66 | + case 0x1: /* FMLA */ | ||
67 | + read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | ||
68 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | ||
69 | + fpst); | ||
70 | + break; | ||
71 | case 0x2: /* FADD */ | ||
72 | gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
73 | break; | ||
74 | + case 0x3: /* FMULX */ | ||
75 | + gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
76 | + break; | ||
77 | case 0x4: /* FCMEQ */ | ||
78 | gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst); | ||
79 | break; | ||
80 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn) | ||
81 | case 0x8: /* FMINNM */ | ||
82 | gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
83 | break; | ||
84 | + case 0x9: /* FMLS */ | ||
85 | + /* As usual for ARM, separate negation for fused multiply-add */ | ||
86 | + tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000); | ||
87 | + read_vec_element_i32(s, tcg_res, rd, pass, MO_16); | ||
88 | + gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res, | ||
89 | + fpst); | ||
90 | + break; | ||
91 | case 0xa: /* FSUB */ | ||
92 | gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst); | ||
93 | break; | ||
94 | -- | 76 | -- |
95 | 2.16.2 | 77 | 2.16.2 |
96 | 78 | ||
97 | 79 | diff view generated by jsdifflib |
1 | Now we have implemented FP16 we can enable it for the "any" CPU. | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 3 | Enable it for the "any" CPU used by *-linux-user. |
4 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 4 | |
5 | [PMM: split out from an earlier patch in the series] | 5 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
7 | Message-id: 20180228193125.20577-10-richard.henderson@linaro.org | ||
6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
7 | --- | 9 | --- |
10 | target/arm/cpu.c | 1 + | ||
8 | target/arm/cpu64.c | 1 + | 11 | target/arm/cpu64.c | 1 + |
9 | 1 file changed, 1 insertion(+) | 12 | 2 files changed, 2 insertions(+) |
10 | 13 | ||
14 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c | ||
15 | index XXXXXXX..XXXXXXX 100644 | ||
16 | --- a/target/arm/cpu.c | ||
17 | +++ b/target/arm/cpu.c | ||
18 | @@ -XXX,XX +XXX,XX @@ static void arm_any_initfn(Object *obj) | ||
19 | set_feature(&cpu->env, ARM_FEATURE_V8_SHA256); | ||
20 | set_feature(&cpu->env, ARM_FEATURE_V8_PMULL); | ||
21 | set_feature(&cpu->env, ARM_FEATURE_CRC); | ||
22 | + set_feature(&cpu->env, ARM_FEATURE_V8_RDM); | ||
23 | cpu->midr = 0xffffffff; | ||
24 | } | ||
25 | #endif | ||
11 | diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c | 26 | diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c |
12 | index XXXXXXX..XXXXXXX 100644 | 27 | index XXXXXXX..XXXXXXX 100644 |
13 | --- a/target/arm/cpu64.c | 28 | --- a/target/arm/cpu64.c |
14 | +++ b/target/arm/cpu64.c | 29 | +++ b/target/arm/cpu64.c |
15 | @@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj) | 30 | @@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj) |
16 | set_feature(&cpu->env, ARM_FEATURE_V8_SM4); | 31 | set_feature(&cpu->env, ARM_FEATURE_V8_SM4); |
17 | set_feature(&cpu->env, ARM_FEATURE_V8_PMULL); | 32 | set_feature(&cpu->env, ARM_FEATURE_V8_PMULL); |
18 | set_feature(&cpu->env, ARM_FEATURE_CRC); | 33 | set_feature(&cpu->env, ARM_FEATURE_CRC); |
19 | + set_feature(&cpu->env, ARM_FEATURE_V8_FP16); | 34 | + set_feature(&cpu->env, ARM_FEATURE_V8_RDM); |
35 | set_feature(&cpu->env, ARM_FEATURE_V8_FP16); | ||
20 | cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */ | 36 | cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */ |
21 | cpu->dcz_blocksize = 7; /* 512 bytes */ | 37 | cpu->dcz_blocksize = 7; /* 512 bytes */ |
22 | } | ||
23 | -- | 38 | -- |
24 | 2.16.2 | 39 | 2.16.2 |
25 | 40 | ||
26 | 41 | diff view generated by jsdifflib |
1 | Set the appropriate Linux hwcap bits to tell the guest binary if we | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | have implemented half-precision floating point support. | ||
3 | 2 | ||
3 | Not enabled anywhere yet. | ||
4 | |||
5 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> | ||
6 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20180228193125.20577-11-richard.henderson@linaro.org | ||
4 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
5 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
6 | --- | 9 | --- |
7 | linux-user/elfload.c | 2 ++ | 10 | target/arm/cpu.h | 1 + |
8 | 1 file changed, 2 insertions(+) | 11 | linux-user/elfload.c | 1 + |
12 | 2 files changed, 2 insertions(+) | ||
9 | 13 | ||
14 | diff --git a/target/arm/cpu.h b/target/arm/cpu.h | ||
15 | index XXXXXXX..XXXXXXX 100644 | ||
16 | --- a/target/arm/cpu.h | ||
17 | +++ b/target/arm/cpu.h | ||
18 | @@ -XXX,XX +XXX,XX @@ enum arm_features { | ||
19 | ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */ | ||
20 | ARM_FEATURE_V8_RDM, /* implements v8.1 simd round multiply */ | ||
21 | ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */ | ||
22 | + ARM_FEATURE_V8_FCMA, /* has complex number part of v8.3 extensions. */ | ||
23 | }; | ||
24 | |||
25 | static inline int arm_feature(CPUARMState *env, int feature) | ||
10 | diff --git a/linux-user/elfload.c b/linux-user/elfload.c | 26 | diff --git a/linux-user/elfload.c b/linux-user/elfload.c |
11 | index XXXXXXX..XXXXXXX 100644 | 27 | index XXXXXXX..XXXXXXX 100644 |
12 | --- a/linux-user/elfload.c | 28 | --- a/linux-user/elfload.c |
13 | +++ b/linux-user/elfload.c | 29 | +++ b/linux-user/elfload.c |
14 | @@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void) | 30 | @@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void) |
15 | GET_FEATURE(ARM_FEATURE_V8_SM3, ARM_HWCAP_A64_SM3); | 31 | GET_FEATURE(ARM_FEATURE_V8_FP16, |
16 | GET_FEATURE(ARM_FEATURE_V8_SM4, ARM_HWCAP_A64_SM4); | 32 | ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP); |
17 | GET_FEATURE(ARM_FEATURE_V8_SHA512, ARM_HWCAP_A64_SHA512); | 33 | GET_FEATURE(ARM_FEATURE_V8_RDM, ARM_HWCAP_A64_ASIMDRDM); |
18 | + GET_FEATURE(ARM_FEATURE_V8_FP16, | 34 | + GET_FEATURE(ARM_FEATURE_V8_FCMA, ARM_HWCAP_A64_FCMA); |
19 | + ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP); | ||
20 | #undef GET_FEATURE | 35 | #undef GET_FEATURE |
21 | 36 | ||
22 | return hwcaps; | 37 | return hwcaps; |
23 | -- | 38 | -- |
24 | 2.16.2 | 39 | 2.16.2 |
25 | 40 | ||
26 | 41 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | I've re-factored the handle_simd_intfp_conv helper to properly handle | 3 | Reviewed-by: Alex Bennée <alex.bennee@linaro.org> |
4 | half-precision as well as call plain conversion helpers when we are | 4 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
5 | not doing fixed point conversion. | 5 | Message-id: 20180228193125.20577-12-richard.henderson@linaro.org |
6 | |||
7 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | ||
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
9 | Message-id: 20180227143852.11175-21-alex.bennee@linaro.org | ||
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 7 | --- |
12 | target/arm/helper.h | 10 ++++ | 8 | target/arm/helper.h | 7 ++++ |
13 | target/arm/helper.c | 4 ++ | 9 | target/arm/translate-a64.c | 48 ++++++++++++++++++++++- |
14 | target/arm/translate-a64.c | 122 ++++++++++++++++++++++++++++++++++----------- | 10 | target/arm/vec_helper.c | 97 ++++++++++++++++++++++++++++++++++++++++++++++ |
15 | 3 files changed, 108 insertions(+), 28 deletions(-) | 11 | 3 files changed, 151 insertions(+), 1 deletion(-) |
16 | 12 | ||
17 | diff --git a/target/arm/helper.h b/target/arm/helper.h | 13 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
18 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
19 | --- a/target/arm/helper.h | 15 | --- a/target/arm/helper.h |
20 | +++ b/target/arm/helper.h | 16 | +++ b/target/arm/helper.h |
21 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_cmped, void, f64, f64, env) | 17 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_qrdmlah_s32, TCG_CALL_NO_RWG, |
22 | DEF_HELPER_2(vfp_fcvtds, f64, f32, env) | 18 | DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s32, TCG_CALL_NO_RWG, |
23 | DEF_HELPER_2(vfp_fcvtsd, f32, f64, env) | 19 | void, ptr, ptr, ptr, ptr, i32) |
24 | 20 | ||
25 | +DEF_HELPER_2(vfp_uitoh, f16, i32, ptr) | 21 | +DEF_HELPER_FLAGS_5(gvec_fcaddh, TCG_CALL_NO_RWG, |
26 | DEF_HELPER_2(vfp_uitos, f32, i32, ptr) | 22 | + void, ptr, ptr, ptr, ptr, i32) |
27 | DEF_HELPER_2(vfp_uitod, f64, i32, ptr) | 23 | +DEF_HELPER_FLAGS_5(gvec_fcadds, TCG_CALL_NO_RWG, |
28 | +DEF_HELPER_2(vfp_sitoh, f16, i32, ptr) | 24 | + void, ptr, ptr, ptr, ptr, i32) |
29 | DEF_HELPER_2(vfp_sitos, f32, i32, ptr) | 25 | +DEF_HELPER_FLAGS_5(gvec_fcaddd, TCG_CALL_NO_RWG, |
30 | DEF_HELPER_2(vfp_sitod, f64, i32, ptr) | 26 | + void, ptr, ptr, ptr, ptr, i32) |
31 | 27 | + | |
32 | +DEF_HELPER_2(vfp_touih, i32, f16, ptr) | 28 | #ifdef TARGET_AARCH64 |
33 | DEF_HELPER_2(vfp_touis, i32, f32, ptr) | 29 | #include "helper-a64.h" |
34 | DEF_HELPER_2(vfp_touid, i32, f64, ptr) | 30 | #endif |
35 | +DEF_HELPER_2(vfp_touizh, i32, f16, ptr) | ||
36 | DEF_HELPER_2(vfp_touizs, i32, f32, ptr) | ||
37 | DEF_HELPER_2(vfp_touizd, i32, f64, ptr) | ||
38 | +DEF_HELPER_2(vfp_tosih, i32, f16, ptr) | ||
39 | DEF_HELPER_2(vfp_tosis, i32, f32, ptr) | ||
40 | DEF_HELPER_2(vfp_tosid, i32, f64, ptr) | ||
41 | +DEF_HELPER_2(vfp_tosizh, i32, f16, ptr) | ||
42 | DEF_HELPER_2(vfp_tosizs, i32, f32, ptr) | ||
43 | DEF_HELPER_2(vfp_tosizd, i32, f64, ptr) | ||
44 | |||
45 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_toshd_round_to_zero, i64, f64, i32, ptr) | ||
46 | DEF_HELPER_3(vfp_tosld_round_to_zero, i64, f64, i32, ptr) | ||
47 | DEF_HELPER_3(vfp_touhd_round_to_zero, i64, f64, i32, ptr) | ||
48 | DEF_HELPER_3(vfp_tould_round_to_zero, i64, f64, i32, ptr) | ||
49 | +DEF_HELPER_3(vfp_toulh, i32, f16, i32, ptr) | ||
50 | +DEF_HELPER_3(vfp_toslh, i32, f16, i32, ptr) | ||
51 | DEF_HELPER_3(vfp_toshs, i32, f32, i32, ptr) | ||
52 | DEF_HELPER_3(vfp_tosls, i32, f32, i32, ptr) | ||
53 | DEF_HELPER_3(vfp_tosqs, i64, f32, i32, ptr) | ||
54 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_sqtod, f64, i64, i32, ptr) | ||
55 | DEF_HELPER_3(vfp_uhtod, f64, i64, i32, ptr) | ||
56 | DEF_HELPER_3(vfp_ultod, f64, i64, i32, ptr) | ||
57 | DEF_HELPER_3(vfp_uqtod, f64, i64, i32, ptr) | ||
58 | +DEF_HELPER_3(vfp_sltoh, f16, i32, i32, ptr) | ||
59 | +DEF_HELPER_3(vfp_ultoh, f16, i32, i32, ptr) | ||
60 | |||
61 | DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, ptr) | ||
62 | DEF_HELPER_FLAGS_2(set_neon_rmode, TCG_CALL_NO_RWG, i32, i32, env) | ||
63 | diff --git a/target/arm/helper.c b/target/arm/helper.c | ||
64 | index XXXXXXX..XXXXXXX 100644 | ||
65 | --- a/target/arm/helper.c | ||
66 | +++ b/target/arm/helper.c | ||
67 | @@ -XXX,XX +XXX,XX @@ CONV_ITOF(vfp_##name##to##p, fsz, sign) \ | ||
68 | CONV_FTOI(vfp_to##name##p, fsz, sign, ) \ | ||
69 | CONV_FTOI(vfp_to##name##z##p, fsz, sign, _round_to_zero) | ||
70 | |||
71 | +FLOAT_CONVS(si, h, 16, ) | ||
72 | FLOAT_CONVS(si, s, 32, ) | ||
73 | FLOAT_CONVS(si, d, 64, ) | ||
74 | +FLOAT_CONVS(ui, h, 16, u) | ||
75 | FLOAT_CONVS(ui, s, 32, u) | ||
76 | FLOAT_CONVS(ui, d, 64, u) | ||
77 | |||
78 | @@ -XXX,XX +XXX,XX @@ VFP_CONV_FIX_A64(sq, s, 32, 64, int64) | ||
79 | VFP_CONV_FIX(uh, s, 32, 32, uint16) | ||
80 | VFP_CONV_FIX(ul, s, 32, 32, uint32) | ||
81 | VFP_CONV_FIX_A64(uq, s, 32, 64, uint64) | ||
82 | +VFP_CONV_FIX_A64(sl, h, 16, 32, int32) | ||
83 | +VFP_CONV_FIX_A64(ul, h, 16, 32, uint32) | ||
84 | #undef VFP_CONV_FIX | ||
85 | #undef VFP_CONV_FIX_FLOAT | ||
86 | #undef VFP_CONV_FLOAT_FIX_ROUND | ||
87 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 31 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
88 | index XXXXXXX..XXXXXXX 100644 | 32 | index XXXXXXX..XXXXXXX 100644 |
89 | --- a/target/arm/translate-a64.c | 33 | --- a/target/arm/translate-a64.c |
90 | +++ b/target/arm/translate-a64.c | 34 | +++ b/target/arm/translate-a64.c |
91 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn, | 35 | @@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3_env(DisasContext *s, bool is_q, int rd, |
92 | int elements, int is_signed, | 36 | is_q ? 16 : 8, vec_full_reg_size(s), 0, fn); |
93 | int fracbits, int size) | 37 | } |
94 | { | 38 | |
95 | - bool is_double = size == 3 ? true : false; | 39 | +/* Expand a 3-operand + fpstatus pointer + simd data value operation using |
96 | - TCGv_ptr tcg_fpst = get_fpstatus_ptr(false); | 40 | + * an out-of-line helper. |
97 | - TCGv_i32 tcg_shift = tcg_const_i32(fracbits); | 41 | + */ |
98 | - TCGv_i64 tcg_int = tcg_temp_new_i64(); | 42 | +static void gen_gvec_op3_fpst(DisasContext *s, bool is_q, int rd, int rn, |
99 | + TCGv_ptr tcg_fpst = get_fpstatus_ptr(size == MO_16); | 43 | + int rm, bool is_fp16, int data, |
100 | + TCGv_i32 tcg_shift = NULL; | 44 | + gen_helper_gvec_3_ptr *fn) |
101 | + | 45 | +{ |
102 | TCGMemOp mop = size | (is_signed ? MO_SIGN : 0); | 46 | + TCGv_ptr fpst = get_fpstatus_ptr(is_fp16); |
103 | int pass; | 47 | + tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd), |
104 | 48 | + vec_full_reg_offset(s, rn), | |
105 | - for (pass = 0; pass < elements; pass++) { | 49 | + vec_full_reg_offset(s, rm), fpst, |
106 | - read_vec_element(s, tcg_int, rn, pass, mop); | 50 | + is_q ? 16 : 8, vec_full_reg_size(s), data, fn); |
107 | + if (fracbits || size == MO_64) { | 51 | + tcg_temp_free_ptr(fpst); |
108 | + tcg_shift = tcg_const_i32(fracbits); | 52 | +} |
109 | + } | 53 | + |
110 | + | 54 | /* Set ZF and NF based on a 64 bit result. This is alas fiddlier |
111 | + if (size == MO_64) { | 55 | * than the 32 bit equivalent. |
112 | + TCGv_i64 tcg_int64 = tcg_temp_new_i64(); | 56 | */ |
113 | + TCGv_i64 tcg_double = tcg_temp_new_i64(); | 57 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) |
114 | + | 58 | int size = extract32(insn, 22, 2); |
115 | + for (pass = 0; pass < elements; pass++) { | 59 | bool u = extract32(insn, 29, 1); |
116 | + read_vec_element(s, tcg_int64, rn, pass, mop); | 60 | bool is_q = extract32(insn, 30, 1); |
117 | 61 | - int feature; | |
118 | - if (is_double) { | 62 | + int feature, rot; |
119 | - TCGv_i64 tcg_double = tcg_temp_new_i64(); | 63 | |
120 | if (is_signed) { | 64 | switch (u * 16 + opcode) { |
121 | - gen_helper_vfp_sqtod(tcg_double, tcg_int, | 65 | case 0x10: /* SQRDMLAH (vector) */ |
122 | + gen_helper_vfp_sqtod(tcg_double, tcg_int64, | 66 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) |
123 | tcg_shift, tcg_fpst); | ||
124 | } else { | ||
125 | - gen_helper_vfp_uqtod(tcg_double, tcg_int, | ||
126 | + gen_helper_vfp_uqtod(tcg_double, tcg_int64, | ||
127 | tcg_shift, tcg_fpst); | ||
128 | } | ||
129 | if (elements == 1) { | ||
130 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn, | ||
131 | } else { | ||
132 | write_vec_element(s, tcg_double, rd, pass, MO_64); | ||
133 | } | ||
134 | - tcg_temp_free_i64(tcg_double); | ||
135 | - } else { | ||
136 | - TCGv_i32 tcg_single = tcg_temp_new_i32(); | ||
137 | - if (is_signed) { | ||
138 | - gen_helper_vfp_sqtos(tcg_single, tcg_int, | ||
139 | - tcg_shift, tcg_fpst); | ||
140 | - } else { | ||
141 | - gen_helper_vfp_uqtos(tcg_single, tcg_int, | ||
142 | - tcg_shift, tcg_fpst); | ||
143 | - } | ||
144 | - if (elements == 1) { | ||
145 | - write_fp_sreg(s, rd, tcg_single); | ||
146 | - } else { | ||
147 | - write_vec_element_i32(s, tcg_single, rd, pass, MO_32); | ||
148 | - } | ||
149 | - tcg_temp_free_i32(tcg_single); | ||
150 | } | 67 | } |
151 | + | 68 | feature = ARM_FEATURE_V8_RDM; |
152 | + tcg_temp_free_i64(tcg_int64); | 69 | break; |
153 | + tcg_temp_free_i64(tcg_double); | 70 | + case 0xc: /* FCADD, #90 */ |
154 | + | 71 | + case 0xe: /* FCADD, #270 */ |
155 | + } else { | 72 | + if (size == 0 |
156 | + TCGv_i32 tcg_int32 = tcg_temp_new_i32(); | 73 | + || (size == 1 && !arm_dc_feature(s, ARM_FEATURE_V8_FP16)) |
157 | + TCGv_i32 tcg_float = tcg_temp_new_i32(); | 74 | + || (size == 3 && !is_q)) { |
158 | + | 75 | + unallocated_encoding(s); |
159 | + for (pass = 0; pass < elements; pass++) { | ||
160 | + read_vec_element_i32(s, tcg_int32, rn, pass, mop); | ||
161 | + | ||
162 | + switch (size) { | ||
163 | + case MO_32: | ||
164 | + if (fracbits) { | ||
165 | + if (is_signed) { | ||
166 | + gen_helper_vfp_sltos(tcg_float, tcg_int32, | ||
167 | + tcg_shift, tcg_fpst); | ||
168 | + } else { | ||
169 | + gen_helper_vfp_ultos(tcg_float, tcg_int32, | ||
170 | + tcg_shift, tcg_fpst); | ||
171 | + } | ||
172 | + } else { | ||
173 | + if (is_signed) { | ||
174 | + gen_helper_vfp_sitos(tcg_float, tcg_int32, tcg_fpst); | ||
175 | + } else { | ||
176 | + gen_helper_vfp_uitos(tcg_float, tcg_int32, tcg_fpst); | ||
177 | + } | ||
178 | + } | ||
179 | + break; | ||
180 | + case MO_16: | ||
181 | + if (fracbits) { | ||
182 | + if (is_signed) { | ||
183 | + gen_helper_vfp_sltoh(tcg_float, tcg_int32, | ||
184 | + tcg_shift, tcg_fpst); | ||
185 | + } else { | ||
186 | + gen_helper_vfp_ultoh(tcg_float, tcg_int32, | ||
187 | + tcg_shift, tcg_fpst); | ||
188 | + } | ||
189 | + } else { | ||
190 | + if (is_signed) { | ||
191 | + gen_helper_vfp_sitoh(tcg_float, tcg_int32, tcg_fpst); | ||
192 | + } else { | ||
193 | + gen_helper_vfp_uitoh(tcg_float, tcg_int32, tcg_fpst); | ||
194 | + } | ||
195 | + } | ||
196 | + break; | ||
197 | + default: | ||
198 | + g_assert_not_reached(); | ||
199 | + } | ||
200 | + | ||
201 | + if (elements == 1) { | ||
202 | + write_fp_sreg(s, rd, tcg_float); | ||
203 | + } else { | ||
204 | + write_vec_element_i32(s, tcg_float, rd, pass, size); | ||
205 | + } | ||
206 | + } | ||
207 | + | ||
208 | + tcg_temp_free_i32(tcg_int32); | ||
209 | + tcg_temp_free_i32(tcg_float); | ||
210 | } | ||
211 | |||
212 | - tcg_temp_free_i64(tcg_int); | ||
213 | tcg_temp_free_ptr(tcg_fpst); | ||
214 | - tcg_temp_free_i32(tcg_shift); | ||
215 | + if (tcg_shift) { | ||
216 | + tcg_temp_free_i32(tcg_shift); | ||
217 | + } | ||
218 | |||
219 | clear_vec_high(s, elements << size == 16, rd); | ||
220 | } | ||
221 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | ||
222 | rn = extract32(insn, 5, 5); | ||
223 | |||
224 | switch (fpop) { | ||
225 | + case 0x1d: /* SCVTF */ | ||
226 | + case 0x5d: /* UCVTF */ | ||
227 | + { | ||
228 | + int elements; | ||
229 | + | ||
230 | + if (is_scalar) { | ||
231 | + elements = 1; | ||
232 | + } else { | ||
233 | + elements = (is_q ? 8 : 4); | ||
234 | + } | ||
235 | + | ||
236 | + if (!fp_access_check(s)) { | ||
237 | + return; | 76 | + return; |
238 | + } | 77 | + } |
239 | + handle_simd_intfp_conv(s, rd, rn, elements, !u, 0, MO_16); | 78 | + feature = ARM_FEATURE_V8_FCMA; |
79 | + break; | ||
80 | default: | ||
81 | unallocated_encoding(s); | ||
82 | return; | ||
83 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) | ||
84 | } | ||
85 | return; | ||
86 | |||
87 | + case 0xc: /* FCADD, #90 */ | ||
88 | + case 0xe: /* FCADD, #270 */ | ||
89 | + rot = extract32(opcode, 1, 1); | ||
90 | + switch (size) { | ||
91 | + case 1: | ||
92 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot, | ||
93 | + gen_helper_gvec_fcaddh); | ||
94 | + break; | ||
95 | + case 2: | ||
96 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot, | ||
97 | + gen_helper_gvec_fcadds); | ||
98 | + break; | ||
99 | + case 3: | ||
100 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot, | ||
101 | + gen_helper_gvec_fcaddd); | ||
102 | + break; | ||
103 | + default: | ||
104 | + g_assert_not_reached(); | ||
105 | + } | ||
240 | + return; | 106 | + return; |
107 | + | ||
108 | default: | ||
109 | g_assert_not_reached(); | ||
110 | } | ||
111 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
112 | index XXXXXXX..XXXXXXX 100644 | ||
113 | --- a/target/arm/vec_helper.c | ||
114 | +++ b/target/arm/vec_helper.c | ||
115 | @@ -XXX,XX +XXX,XX @@ | ||
116 | #include "exec/exec-all.h" | ||
117 | #include "exec/helper-proto.h" | ||
118 | #include "tcg/tcg-gvec-desc.h" | ||
119 | +#include "fpu/softfloat.h" | ||
120 | |||
121 | |||
122 | +/* Note that vector data is stored in host-endian 64-bit chunks, | ||
123 | + so addressing units smaller than that needs a host-endian fixup. */ | ||
124 | +#ifdef HOST_WORDS_BIGENDIAN | ||
125 | +#define H1(x) ((x) ^ 7) | ||
126 | +#define H2(x) ((x) ^ 3) | ||
127 | +#define H4(x) ((x) ^ 1) | ||
128 | +#else | ||
129 | +#define H1(x) (x) | ||
130 | +#define H2(x) (x) | ||
131 | +#define H4(x) (x) | ||
132 | +#endif | ||
133 | + | ||
134 | #define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q | ||
135 | |||
136 | static void clear_tail(void *vd, uintptr_t opr_sz, uintptr_t max_sz) | ||
137 | @@ -XXX,XX +XXX,XX @@ void HELPER(gvec_qrdmlsh_s32)(void *vd, void *vn, void *vm, | ||
138 | } | ||
139 | clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
140 | } | ||
141 | + | ||
142 | +void HELPER(gvec_fcaddh)(void *vd, void *vn, void *vm, | ||
143 | + void *vfpst, uint32_t desc) | ||
144 | +{ | ||
145 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
146 | + float16 *d = vd; | ||
147 | + float16 *n = vn; | ||
148 | + float16 *m = vm; | ||
149 | + float_status *fpst = vfpst; | ||
150 | + uint32_t neg_real = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
151 | + uint32_t neg_imag = neg_real ^ 1; | ||
152 | + uintptr_t i; | ||
153 | + | ||
154 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
155 | + neg_real <<= 15; | ||
156 | + neg_imag <<= 15; | ||
157 | + | ||
158 | + for (i = 0; i < opr_sz / 2; i += 2) { | ||
159 | + float16 e0 = n[H2(i)]; | ||
160 | + float16 e1 = m[H2(i + 1)] ^ neg_imag; | ||
161 | + float16 e2 = n[H2(i + 1)]; | ||
162 | + float16 e3 = m[H2(i)] ^ neg_real; | ||
163 | + | ||
164 | + d[H2(i)] = float16_add(e0, e1, fpst); | ||
165 | + d[H2(i + 1)] = float16_add(e2, e3, fpst); | ||
241 | + } | 166 | + } |
242 | break; | 167 | + clear_tail(d, opr_sz, simd_maxsz(desc)); |
243 | case 0x2c: /* FCMGT (zero) */ | 168 | +} |
244 | case 0x2d: /* FCMEQ (zero) */ | 169 | + |
170 | +void HELPER(gvec_fcadds)(void *vd, void *vn, void *vm, | ||
171 | + void *vfpst, uint32_t desc) | ||
172 | +{ | ||
173 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
174 | + float32 *d = vd; | ||
175 | + float32 *n = vn; | ||
176 | + float32 *m = vm; | ||
177 | + float_status *fpst = vfpst; | ||
178 | + uint32_t neg_real = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
179 | + uint32_t neg_imag = neg_real ^ 1; | ||
180 | + uintptr_t i; | ||
181 | + | ||
182 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
183 | + neg_real <<= 31; | ||
184 | + neg_imag <<= 31; | ||
185 | + | ||
186 | + for (i = 0; i < opr_sz / 4; i += 2) { | ||
187 | + float32 e0 = n[H4(i)]; | ||
188 | + float32 e1 = m[H4(i + 1)] ^ neg_imag; | ||
189 | + float32 e2 = n[H4(i + 1)]; | ||
190 | + float32 e3 = m[H4(i)] ^ neg_real; | ||
191 | + | ||
192 | + d[H4(i)] = float32_add(e0, e1, fpst); | ||
193 | + d[H4(i + 1)] = float32_add(e2, e3, fpst); | ||
194 | + } | ||
195 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
196 | +} | ||
197 | + | ||
198 | +void HELPER(gvec_fcaddd)(void *vd, void *vn, void *vm, | ||
199 | + void *vfpst, uint32_t desc) | ||
200 | +{ | ||
201 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
202 | + float64 *d = vd; | ||
203 | + float64 *n = vn; | ||
204 | + float64 *m = vm; | ||
205 | + float_status *fpst = vfpst; | ||
206 | + uint64_t neg_real = extract64(desc, SIMD_DATA_SHIFT, 1); | ||
207 | + uint64_t neg_imag = neg_real ^ 1; | ||
208 | + uintptr_t i; | ||
209 | + | ||
210 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
211 | + neg_real <<= 63; | ||
212 | + neg_imag <<= 63; | ||
213 | + | ||
214 | + for (i = 0; i < opr_sz / 8; i += 2) { | ||
215 | + float64 e0 = n[i]; | ||
216 | + float64 e1 = m[i + 1] ^ neg_imag; | ||
217 | + float64 e2 = n[i + 1]; | ||
218 | + float64 e3 = m[i] ^ neg_real; | ||
219 | + | ||
220 | + d[i] = float64_add(e0, e1, fpst); | ||
221 | + d[i + 1] = float64_add(e2, e3, fpst); | ||
222 | + } | ||
223 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
224 | +} | ||
245 | -- | 225 | -- |
246 | 2.16.2 | 226 | 2.16.2 |
247 | 227 | ||
248 | 228 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This implements the half-precision variants of the across vector | 3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
4 | reduction operations. This involves a re-factor of the reduction code | 4 | Message-id: 20180228193125.20577-13-richard.henderson@linaro.org |
5 | which more closely matches the ARM ARM order (and handles 8 element | 5 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
6 | reductions). | 6 | [PMM: renamed e1/e2/e3/e4 to use the same naming as the version |
7 | of the pseudocode in the Arm ARM] | ||
8 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | ||
9 | --- | ||
10 | target/arm/helper.h | 11 ++++ | ||
11 | target/arm/translate-a64.c | 94 +++++++++++++++++++++++++--- | ||
12 | target/arm/vec_helper.c | 149 +++++++++++++++++++++++++++++++++++++++++++++ | ||
13 | 3 files changed, 246 insertions(+), 8 deletions(-) | ||
7 | 14 | ||
8 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 15 | diff --git a/target/arm/helper.h b/target/arm/helper.h |
9 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
10 | Message-id: 20180227143852.11175-7-alex.bennee@linaro.org | ||
11 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | ||
12 | --- | ||
13 | target/arm/helper-a64.h | 4 ++ | ||
14 | target/arm/helper-a64.c | 18 ++++++ | ||
15 | target/arm/translate-a64.c | 140 ++++++++++++++++++++++++++++----------------- | ||
16 | 3 files changed, 109 insertions(+), 53 deletions(-) | ||
17 | |||
18 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | ||
19 | index XXXXXXX..XXXXXXX 100644 | 16 | index XXXXXXX..XXXXXXX 100644 |
20 | --- a/target/arm/helper-a64.h | 17 | --- a/target/arm/helper.h |
21 | +++ b/target/arm/helper-a64.h | 18 | +++ b/target/arm/helper.h |
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(paired_cmpxchg64_le_parallel, TCG_CALL_NO_WG, | 19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fcadds, TCG_CALL_NO_RWG, |
23 | DEF_HELPER_FLAGS_4(paired_cmpxchg64_be, TCG_CALL_NO_WG, i64, env, i64, i64, i64) | 20 | DEF_HELPER_FLAGS_5(gvec_fcaddd, TCG_CALL_NO_RWG, |
24 | DEF_HELPER_FLAGS_4(paired_cmpxchg64_be_parallel, TCG_CALL_NO_WG, | 21 | void, ptr, ptr, ptr, ptr, i32) |
25 | i64, env, i64, i64, i64) | 22 | |
26 | +DEF_HELPER_FLAGS_3(advsimd_maxh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 23 | +DEF_HELPER_FLAGS_5(gvec_fcmlah, TCG_CALL_NO_RWG, |
27 | +DEF_HELPER_FLAGS_3(advsimd_minh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 24 | + void, ptr, ptr, ptr, ptr, i32) |
28 | +DEF_HELPER_FLAGS_3(advsimd_maxnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 25 | +DEF_HELPER_FLAGS_5(gvec_fcmlah_idx, TCG_CALL_NO_RWG, |
29 | +DEF_HELPER_FLAGS_3(advsimd_minnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr) | 26 | + void, ptr, ptr, ptr, ptr, i32) |
30 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | 27 | +DEF_HELPER_FLAGS_5(gvec_fcmlas, TCG_CALL_NO_RWG, |
31 | index XXXXXXX..XXXXXXX 100644 | 28 | + void, ptr, ptr, ptr, ptr, i32) |
32 | --- a/target/arm/helper-a64.c | 29 | +DEF_HELPER_FLAGS_5(gvec_fcmlas_idx, TCG_CALL_NO_RWG, |
33 | +++ b/target/arm/helper-a64.c | 30 | + void, ptr, ptr, ptr, ptr, i32) |
34 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_be_parallel)(CPUARMState *env, uint64_t addr, | 31 | +DEF_HELPER_FLAGS_5(gvec_fcmlad, TCG_CALL_NO_RWG, |
35 | { | 32 | + void, ptr, ptr, ptr, ptr, i32) |
36 | return do_paired_cmpxchg64_be(env, addr, new_lo, new_hi, true, GETPC()); | 33 | + |
37 | } | 34 | #ifdef TARGET_AARCH64 |
38 | + | 35 | #include "helper-a64.h" |
39 | +/* | 36 | #endif |
40 | + * AdvSIMD half-precision | ||
41 | + */ | ||
42 | + | ||
43 | +#define ADVSIMD_HELPER(name, suffix) HELPER(glue(glue(advsimd_, name), suffix)) | ||
44 | + | ||
45 | +#define ADVSIMD_HALFOP(name) \ | ||
46 | +float16 ADVSIMD_HELPER(name, h)(float16 a, float16 b, void *fpstp) \ | ||
47 | +{ \ | ||
48 | + float_status *fpst = fpstp; \ | ||
49 | + return float16_ ## name(a, b, fpst); \ | ||
50 | +} | ||
51 | + | ||
52 | +ADVSIMD_HALFOP(min) | ||
53 | +ADVSIMD_HALFOP(max) | ||
54 | +ADVSIMD_HALFOP(minnum) | ||
55 | +ADVSIMD_HALFOP(maxnum) | ||
56 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 37 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c |
57 | index XXXXXXX..XXXXXXX 100644 | 38 | index XXXXXXX..XXXXXXX 100644 |
58 | --- a/target/arm/translate-a64.c | 39 | --- a/target/arm/translate-a64.c |
59 | +++ b/target/arm/translate-a64.c | 40 | +++ b/target/arm/translate-a64.c |
60 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_zip_trn(DisasContext *s, uint32_t insn) | 41 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) |
61 | tcg_temp_free_i64(tcg_resh); | 42 | } |
62 | } | 43 | feature = ARM_FEATURE_V8_RDM; |
63 | 44 | break; | |
64 | -static void do_minmaxop(DisasContext *s, TCGv_i32 tcg_elt1, TCGv_i32 tcg_elt2, | 45 | + case 0x8: /* FCMLA, #0 */ |
65 | - int opc, bool is_min, TCGv_ptr fpst) | 46 | + case 0x9: /* FCMLA, #90 */ |
66 | +/* | 47 | + case 0xa: /* FCMLA, #180 */ |
67 | + * do_reduction_op helper | 48 | + case 0xb: /* FCMLA, #270 */ |
68 | + * | 49 | case 0xc: /* FCADD, #90 */ |
69 | + * This mirrors the Reduce() pseudocode in the ARM ARM. It is | 50 | case 0xe: /* FCADD, #270 */ |
70 | + * important for correct NaN propagation that we do these | 51 | if (size == 0 |
71 | + * operations in exactly the order specified by the pseudocode. | 52 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn) |
72 | + * | 53 | } |
73 | + * This is a recursive function, TCG temps should be freed by the | 54 | return; |
74 | + * calling function once it is done with the values. | 55 | |
75 | + */ | 56 | + case 0x8: /* FCMLA, #0 */ |
76 | +static TCGv_i32 do_reduction_op(DisasContext *s, int fpopcode, int rn, | 57 | + case 0x9: /* FCMLA, #90 */ |
77 | + int esize, int size, int vmap, TCGv_ptr fpst) | 58 | + case 0xa: /* FCMLA, #180 */ |
78 | { | 59 | + case 0xb: /* FCMLA, #270 */ |
79 | - /* Helper function for disas_simd_across_lanes: do a single precision | 60 | + rot = extract32(opcode, 0, 2); |
80 | - * min/max operation on the specified two inputs, | 61 | + switch (size) { |
81 | - * and return the result in tcg_elt1. | 62 | + case 1: |
82 | - */ | 63 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, true, rot, |
83 | - if (opc == 0xc) { | 64 | + gen_helper_gvec_fcmlah); |
84 | - if (is_min) { | 65 | + break; |
85 | - gen_helper_vfp_minnums(tcg_elt1, tcg_elt1, tcg_elt2, fpst); | 66 | + case 2: |
86 | - } else { | 67 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, false, rot, |
87 | - gen_helper_vfp_maxnums(tcg_elt1, tcg_elt1, tcg_elt2, fpst); | 68 | + gen_helper_gvec_fcmlas); |
88 | - } | 69 | + break; |
89 | + if (esize == size) { | 70 | + case 3: |
90 | + int element; | 71 | + gen_gvec_op3_fpst(s, is_q, rd, rn, rm, false, rot, |
91 | + TCGMemOp msize = esize == 16 ? MO_16 : MO_32; | 72 | + gen_helper_gvec_fcmlad); |
92 | + TCGv_i32 tcg_elem; | ||
93 | + | ||
94 | + /* We should have one register left here */ | ||
95 | + assert(ctpop8(vmap) == 1); | ||
96 | + element = ctz32(vmap); | ||
97 | + assert(element < 8); | ||
98 | + | ||
99 | + tcg_elem = tcg_temp_new_i32(); | ||
100 | + read_vec_element_i32(s, tcg_elem, rn, element, msize); | ||
101 | + return tcg_elem; | ||
102 | } else { | ||
103 | - assert(opc == 0xf); | ||
104 | - if (is_min) { | ||
105 | - gen_helper_vfp_mins(tcg_elt1, tcg_elt1, tcg_elt2, fpst); | ||
106 | - } else { | ||
107 | - gen_helper_vfp_maxs(tcg_elt1, tcg_elt1, tcg_elt2, fpst); | ||
108 | + int bits = size / 2; | ||
109 | + int shift = ctpop8(vmap) / 2; | ||
110 | + int vmap_lo = (vmap >> shift) & vmap; | ||
111 | + int vmap_hi = (vmap & ~vmap_lo); | ||
112 | + TCGv_i32 tcg_hi, tcg_lo, tcg_res; | ||
113 | + | ||
114 | + tcg_hi = do_reduction_op(s, fpopcode, rn, esize, bits, vmap_hi, fpst); | ||
115 | + tcg_lo = do_reduction_op(s, fpopcode, rn, esize, bits, vmap_lo, fpst); | ||
116 | + tcg_res = tcg_temp_new_i32(); | ||
117 | + | ||
118 | + switch (fpopcode) { | ||
119 | + case 0x0c: /* fmaxnmv half-precision */ | ||
120 | + gen_helper_advsimd_maxnumh(tcg_res, tcg_lo, tcg_hi, fpst); | ||
121 | + break; | ||
122 | + case 0x0f: /* fmaxv half-precision */ | ||
123 | + gen_helper_advsimd_maxh(tcg_res, tcg_lo, tcg_hi, fpst); | ||
124 | + break; | ||
125 | + case 0x1c: /* fminnmv half-precision */ | ||
126 | + gen_helper_advsimd_minnumh(tcg_res, tcg_lo, tcg_hi, fpst); | ||
127 | + break; | ||
128 | + case 0x1f: /* fminv half-precision */ | ||
129 | + gen_helper_advsimd_minh(tcg_res, tcg_lo, tcg_hi, fpst); | ||
130 | + break; | ||
131 | + case 0x2c: /* fmaxnmv */ | ||
132 | + gen_helper_vfp_maxnums(tcg_res, tcg_lo, tcg_hi, fpst); | ||
133 | + break; | ||
134 | + case 0x2f: /* fmaxv */ | ||
135 | + gen_helper_vfp_maxs(tcg_res, tcg_lo, tcg_hi, fpst); | ||
136 | + break; | ||
137 | + case 0x3c: /* fminnmv */ | ||
138 | + gen_helper_vfp_minnums(tcg_res, tcg_lo, tcg_hi, fpst); | ||
139 | + break; | ||
140 | + case 0x3f: /* fminv */ | ||
141 | + gen_helper_vfp_mins(tcg_res, tcg_lo, tcg_hi, fpst); | ||
142 | + break; | 73 | + break; |
143 | + default: | 74 | + default: |
144 | + g_assert_not_reached(); | 75 | + g_assert_not_reached(); |
145 | } | 76 | + } |
146 | + | 77 | + return; |
147 | + tcg_temp_free_i32(tcg_hi); | 78 | + |
148 | + tcg_temp_free_i32(tcg_lo); | 79 | case 0xc: /* FCADD, #90 */ |
149 | + return tcg_res; | 80 | case 0xe: /* FCADD, #270 */ |
150 | } | 81 | rot = extract32(opcode, 1, 1); |
151 | } | 82 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
152 | 83 | int rn = extract32(insn, 5, 5); | |
153 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn) | 84 | int rd = extract32(insn, 0, 5); |
85 | bool is_long = false; | ||
86 | - bool is_fp = false; | ||
87 | + int is_fp = 0; | ||
88 | bool is_fp16 = false; | ||
89 | int index; | ||
90 | TCGv_ptr fpst; | ||
91 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
92 | case 0x05: /* FMLS */ | ||
93 | case 0x09: /* FMUL */ | ||
94 | case 0x19: /* FMULX */ | ||
95 | - is_fp = true; | ||
96 | + is_fp = 1; | ||
154 | break; | 97 | break; |
155 | case 0xc: /* FMAXNMV, FMINNMV */ | 98 | case 0x1d: /* SQRDMLAH */ |
156 | case 0xf: /* FMAXV, FMINV */ | 99 | case 0x1f: /* SQRDMLSH */ |
157 | - if (!is_u || !is_q || extract32(size, 0, 1)) { | 100 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) |
158 | - unallocated_encoding(s); | 101 | return; |
159 | - return; | 102 | } |
160 | - } | 103 | break; |
161 | - /* Bit 1 of size field encodes min vs max, and actual size is always | 104 | + case 0x11: /* FCMLA #0 */ |
162 | - * 32 bits: adjust the size variable so following code can rely on it | 105 | + case 0x13: /* FCMLA #90 */ |
163 | + /* Bit 1 of size field encodes min vs max and the actual size | 106 | + case 0x15: /* FCMLA #180 */ |
164 | + * depends on the encoding of the U bit. If not set (and FP16 | 107 | + case 0x17: /* FCMLA #270 */ |
165 | + * enabled) then we do half-precision float instead of single | 108 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA)) { |
166 | + * precision. | ||
167 | */ | ||
168 | is_min = extract32(size, 1, 1); | ||
169 | is_fp = true; | ||
170 | - size = 2; | ||
171 | + if (!is_u && arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
172 | + size = 1; | ||
173 | + } else if (!is_u || !is_q || extract32(size, 0, 1)) { | ||
174 | + unallocated_encoding(s); | 109 | + unallocated_encoding(s); |
175 | + return; | 110 | + return; |
176 | + } else { | ||
177 | + size = 2; | ||
178 | + } | 111 | + } |
179 | break; | 112 | + is_fp = 2; |
113 | + break; | ||
180 | default: | 114 | default: |
181 | unallocated_encoding(s); | 115 | unallocated_encoding(s); |
182 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn) | 116 | return; |
183 | |||
184 | } | ||
185 | } else { | ||
186 | - /* Floating point ops which work on 32 bit (single) intermediates. | ||
187 | + /* Floating point vector reduction ops which work across 32 | ||
188 | + * bit (single) or 16 bit (half-precision) intermediates. | ||
189 | * Note that correct NaN propagation requires that we do these | ||
190 | * operations in exactly the order specified by the pseudocode. | ||
191 | */ | ||
192 | - TCGv_i32 tcg_elt1 = tcg_temp_new_i32(); | ||
193 | - TCGv_i32 tcg_elt2 = tcg_temp_new_i32(); | ||
194 | - TCGv_i32 tcg_elt3 = tcg_temp_new_i32(); | ||
195 | - TCGv_ptr fpst = get_fpstatus_ptr(false); | ||
196 | - | ||
197 | - assert(esize == 32); | ||
198 | - assert(elements == 4); | ||
199 | - | ||
200 | - read_vec_element(s, tcg_elt, rn, 0, MO_32); | ||
201 | - tcg_gen_extrl_i64_i32(tcg_elt1, tcg_elt); | ||
202 | - read_vec_element(s, tcg_elt, rn, 1, MO_32); | ||
203 | - tcg_gen_extrl_i64_i32(tcg_elt2, tcg_elt); | ||
204 | - | ||
205 | - do_minmaxop(s, tcg_elt1, tcg_elt2, opcode, is_min, fpst); | ||
206 | - | ||
207 | - read_vec_element(s, tcg_elt, rn, 2, MO_32); | ||
208 | - tcg_gen_extrl_i64_i32(tcg_elt2, tcg_elt); | ||
209 | - read_vec_element(s, tcg_elt, rn, 3, MO_32); | ||
210 | - tcg_gen_extrl_i64_i32(tcg_elt3, tcg_elt); | ||
211 | - | ||
212 | - do_minmaxop(s, tcg_elt2, tcg_elt3, opcode, is_min, fpst); | ||
213 | - | ||
214 | - do_minmaxop(s, tcg_elt1, tcg_elt2, opcode, is_min, fpst); | ||
215 | - | ||
216 | - tcg_gen_extu_i32_i64(tcg_res, tcg_elt1); | ||
217 | - tcg_temp_free_i32(tcg_elt1); | ||
218 | - tcg_temp_free_i32(tcg_elt2); | ||
219 | - tcg_temp_free_i32(tcg_elt3); | ||
220 | + TCGv_ptr fpst = get_fpstatus_ptr(size == MO_16); | ||
221 | + int fpopcode = opcode | is_min << 4 | is_u << 5; | ||
222 | + int vmap = (1 << elements) - 1; | ||
223 | + TCGv_i32 tcg_res32 = do_reduction_op(s, fpopcode, rn, esize, | ||
224 | + (is_q ? 128 : 64), vmap, fpst); | ||
225 | + tcg_gen_extu_i32_i64(tcg_res, tcg_res32); | ||
226 | + tcg_temp_free_i32(tcg_res32); | ||
227 | tcg_temp_free_ptr(fpst); | ||
228 | } | 117 | } |
229 | 118 | ||
119 | - if (is_fp) { | ||
120 | + switch (is_fp) { | ||
121 | + case 1: /* normal fp */ | ||
122 | /* convert insn encoded size to TCGMemOp size */ | ||
123 | switch (size) { | ||
124 | case 0: /* half-precision */ | ||
125 | - if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
126 | - unallocated_encoding(s); | ||
127 | - return; | ||
128 | - } | ||
129 | size = MO_16; | ||
130 | + is_fp16 = true; | ||
131 | break; | ||
132 | case MO_32: /* single precision */ | ||
133 | case MO_64: /* double precision */ | ||
134 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
135 | unallocated_encoding(s); | ||
136 | return; | ||
137 | } | ||
138 | - } else { | ||
139 | + break; | ||
140 | + | ||
141 | + case 2: /* complex fp */ | ||
142 | + /* Each indexable element is a complex pair. */ | ||
143 | + size <<= 1; | ||
144 | + switch (size) { | ||
145 | + case MO_32: | ||
146 | + if (h && !is_q) { | ||
147 | + unallocated_encoding(s); | ||
148 | + return; | ||
149 | + } | ||
150 | + is_fp16 = true; | ||
151 | + break; | ||
152 | + case MO_64: | ||
153 | + break; | ||
154 | + default: | ||
155 | + unallocated_encoding(s); | ||
156 | + return; | ||
157 | + } | ||
158 | + break; | ||
159 | + | ||
160 | + default: /* integer */ | ||
161 | switch (size) { | ||
162 | case MO_8: | ||
163 | case MO_64: | ||
164 | unallocated_encoding(s); | ||
165 | return; | ||
166 | } | ||
167 | + break; | ||
168 | + } | ||
169 | + if (is_fp16 && !arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | ||
170 | + unallocated_encoding(s); | ||
171 | + return; | ||
172 | } | ||
173 | |||
174 | /* Given TCGMemOp size, adjust register and indexing. */ | ||
175 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn) | ||
176 | fpst = NULL; | ||
177 | } | ||
178 | |||
179 | + switch (16 * u + opcode) { | ||
180 | + case 0x11: /* FCMLA #0 */ | ||
181 | + case 0x13: /* FCMLA #90 */ | ||
182 | + case 0x15: /* FCMLA #180 */ | ||
183 | + case 0x17: /* FCMLA #270 */ | ||
184 | + tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd), | ||
185 | + vec_full_reg_offset(s, rn), | ||
186 | + vec_reg_offset(s, rm, index, size), fpst, | ||
187 | + is_q ? 16 : 8, vec_full_reg_size(s), | ||
188 | + extract32(insn, 13, 2), /* rot */ | ||
189 | + size == MO_64 | ||
190 | + ? gen_helper_gvec_fcmlas_idx | ||
191 | + : gen_helper_gvec_fcmlah_idx); | ||
192 | + tcg_temp_free_ptr(fpst); | ||
193 | + return; | ||
194 | + } | ||
195 | + | ||
196 | if (size == 3) { | ||
197 | TCGv_i64 tcg_idx = tcg_temp_new_i64(); | ||
198 | int pass; | ||
199 | diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c | ||
200 | index XXXXXXX..XXXXXXX 100644 | ||
201 | --- a/target/arm/vec_helper.c | ||
202 | +++ b/target/arm/vec_helper.c | ||
203 | @@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fcaddd)(void *vd, void *vn, void *vm, | ||
204 | } | ||
205 | clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
206 | } | ||
207 | + | ||
208 | +void HELPER(gvec_fcmlah)(void *vd, void *vn, void *vm, | ||
209 | + void *vfpst, uint32_t desc) | ||
210 | +{ | ||
211 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
212 | + float16 *d = vd; | ||
213 | + float16 *n = vn; | ||
214 | + float16 *m = vm; | ||
215 | + float_status *fpst = vfpst; | ||
216 | + intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
217 | + uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1); | ||
218 | + uint32_t neg_real = flip ^ neg_imag; | ||
219 | + uintptr_t i; | ||
220 | + | ||
221 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
222 | + neg_real <<= 15; | ||
223 | + neg_imag <<= 15; | ||
224 | + | ||
225 | + for (i = 0; i < opr_sz / 2; i += 2) { | ||
226 | + float16 e2 = n[H2(i + flip)]; | ||
227 | + float16 e1 = m[H2(i + flip)] ^ neg_real; | ||
228 | + float16 e4 = e2; | ||
229 | + float16 e3 = m[H2(i + 1 - flip)] ^ neg_imag; | ||
230 | + | ||
231 | + d[H2(i)] = float16_muladd(e2, e1, d[H2(i)], 0, fpst); | ||
232 | + d[H2(i + 1)] = float16_muladd(e4, e3, d[H2(i + 1)], 0, fpst); | ||
233 | + } | ||
234 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
235 | +} | ||
236 | + | ||
237 | +void HELPER(gvec_fcmlah_idx)(void *vd, void *vn, void *vm, | ||
238 | + void *vfpst, uint32_t desc) | ||
239 | +{ | ||
240 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
241 | + float16 *d = vd; | ||
242 | + float16 *n = vn; | ||
243 | + float16 *m = vm; | ||
244 | + float_status *fpst = vfpst; | ||
245 | + intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
246 | + uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1); | ||
247 | + uint32_t neg_real = flip ^ neg_imag; | ||
248 | + uintptr_t i; | ||
249 | + float16 e1 = m[H2(flip)]; | ||
250 | + float16 e3 = m[H2(1 - flip)]; | ||
251 | + | ||
252 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
253 | + neg_real <<= 15; | ||
254 | + neg_imag <<= 15; | ||
255 | + e1 ^= neg_real; | ||
256 | + e3 ^= neg_imag; | ||
257 | + | ||
258 | + for (i = 0; i < opr_sz / 2; i += 2) { | ||
259 | + float16 e2 = n[H2(i + flip)]; | ||
260 | + float16 e4 = e2; | ||
261 | + | ||
262 | + d[H2(i)] = float16_muladd(e2, e1, d[H2(i)], 0, fpst); | ||
263 | + d[H2(i + 1)] = float16_muladd(e4, e3, d[H2(i + 1)], 0, fpst); | ||
264 | + } | ||
265 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
266 | +} | ||
267 | + | ||
268 | +void HELPER(gvec_fcmlas)(void *vd, void *vn, void *vm, | ||
269 | + void *vfpst, uint32_t desc) | ||
270 | +{ | ||
271 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
272 | + float32 *d = vd; | ||
273 | + float32 *n = vn; | ||
274 | + float32 *m = vm; | ||
275 | + float_status *fpst = vfpst; | ||
276 | + intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
277 | + uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1); | ||
278 | + uint32_t neg_real = flip ^ neg_imag; | ||
279 | + uintptr_t i; | ||
280 | + | ||
281 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
282 | + neg_real <<= 31; | ||
283 | + neg_imag <<= 31; | ||
284 | + | ||
285 | + for (i = 0; i < opr_sz / 4; i += 2) { | ||
286 | + float32 e2 = n[H4(i + flip)]; | ||
287 | + float32 e1 = m[H4(i + flip)] ^ neg_real; | ||
288 | + float32 e4 = e2; | ||
289 | + float32 e3 = m[H4(i + 1 - flip)] ^ neg_imag; | ||
290 | + | ||
291 | + d[H4(i)] = float32_muladd(e2, e1, d[H4(i)], 0, fpst); | ||
292 | + d[H4(i + 1)] = float32_muladd(e4, e3, d[H4(i + 1)], 0, fpst); | ||
293 | + } | ||
294 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
295 | +} | ||
296 | + | ||
297 | +void HELPER(gvec_fcmlas_idx)(void *vd, void *vn, void *vm, | ||
298 | + void *vfpst, uint32_t desc) | ||
299 | +{ | ||
300 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
301 | + float32 *d = vd; | ||
302 | + float32 *n = vn; | ||
303 | + float32 *m = vm; | ||
304 | + float_status *fpst = vfpst; | ||
305 | + intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
306 | + uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1); | ||
307 | + uint32_t neg_real = flip ^ neg_imag; | ||
308 | + uintptr_t i; | ||
309 | + float32 e1 = m[H4(flip)]; | ||
310 | + float32 e3 = m[H4(1 - flip)]; | ||
311 | + | ||
312 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
313 | + neg_real <<= 31; | ||
314 | + neg_imag <<= 31; | ||
315 | + e1 ^= neg_real; | ||
316 | + e3 ^= neg_imag; | ||
317 | + | ||
318 | + for (i = 0; i < opr_sz / 4; i += 2) { | ||
319 | + float32 e2 = n[H4(i + flip)]; | ||
320 | + float32 e4 = e2; | ||
321 | + | ||
322 | + d[H4(i)] = float32_muladd(e2, e1, d[H4(i)], 0, fpst); | ||
323 | + d[H4(i + 1)] = float32_muladd(e4, e3, d[H4(i + 1)], 0, fpst); | ||
324 | + } | ||
325 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
326 | +} | ||
327 | + | ||
328 | +void HELPER(gvec_fcmlad)(void *vd, void *vn, void *vm, | ||
329 | + void *vfpst, uint32_t desc) | ||
330 | +{ | ||
331 | + uintptr_t opr_sz = simd_oprsz(desc); | ||
332 | + float64 *d = vd; | ||
333 | + float64 *n = vn; | ||
334 | + float64 *m = vm; | ||
335 | + float_status *fpst = vfpst; | ||
336 | + intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1); | ||
337 | + uint64_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1); | ||
338 | + uint64_t neg_real = flip ^ neg_imag; | ||
339 | + uintptr_t i; | ||
340 | + | ||
341 | + /* Shift boolean to the sign bit so we can xor to negate. */ | ||
342 | + neg_real <<= 63; | ||
343 | + neg_imag <<= 63; | ||
344 | + | ||
345 | + for (i = 0; i < opr_sz / 8; i += 2) { | ||
346 | + float64 e2 = n[i + flip]; | ||
347 | + float64 e1 = m[i + flip] ^ neg_real; | ||
348 | + float64 e4 = e2; | ||
349 | + float64 e3 = m[i + 1 - flip] ^ neg_imag; | ||
350 | + | ||
351 | + d[i] = float64_muladd(e2, e1, d[i], 0, fpst); | ||
352 | + d[i + 1] = float64_muladd(e4, e3, d[i + 1], 0, fpst); | ||
353 | + } | ||
354 | + clear_tail(d, opr_sz, simd_maxsz(desc)); | ||
355 | +} | ||
230 | -- | 356 | -- |
231 | 2.16.2 | 357 | 2.16.2 |
232 | 358 | ||
233 | 359 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | We go with the localised helper. | 3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
4 | 4 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> | |
5 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Message-id: 20180228193125.20577-14-richard.henderson@linaro.org |
6 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
7 | Message-id: 20180227143852.11175-25-alex.bennee@linaro.org | ||
8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
9 | --- | 7 | --- |
10 | target/arm/helper-a64.h | 1 + | 8 | target/arm/translate.c | 68 ++++++++++++++++++++++++++++++++++++++++++++++++++ |
11 | target/arm/helper-a64.c | 29 +++++++++++++++++++++++++++++ | 9 | 1 file changed, 68 insertions(+) |
12 | target/arm/translate-a64.c | 4 ++++ | ||
13 | 3 files changed, 34 insertions(+) | ||
14 | 10 | ||
15 | diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h | 11 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
16 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/target/arm/helper-a64.h | 13 | --- a/target/arm/translate.c |
18 | +++ b/target/arm/helper-a64.h | 14 | +++ b/target/arm/translate.c |
19 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_1(neon_addlp_s16, TCG_CALL_NO_RWG_SE, i64, i64) | 15 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn) |
20 | DEF_HELPER_FLAGS_1(neon_addlp_u16, TCG_CALL_NO_RWG_SE, i64, i64) | 16 | return 0; |
21 | DEF_HELPER_FLAGS_2(frecpx_f64, TCG_CALL_NO_RWG, f64, f64, ptr) | ||
22 | DEF_HELPER_FLAGS_2(frecpx_f32, TCG_CALL_NO_RWG, f32, f32, ptr) | ||
23 | +DEF_HELPER_FLAGS_2(frecpx_f16, TCG_CALL_NO_RWG, f16, f16, ptr) | ||
24 | DEF_HELPER_FLAGS_2(fcvtx_f64_to_f32, TCG_CALL_NO_RWG, f32, f64, env) | ||
25 | DEF_HELPER_FLAGS_3(crc32_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32) | ||
26 | DEF_HELPER_FLAGS_3(crc32c_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32) | ||
27 | diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c | ||
28 | index XXXXXXX..XXXXXXX 100644 | ||
29 | --- a/target/arm/helper-a64.c | ||
30 | +++ b/target/arm/helper-a64.c | ||
31 | @@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_addlp_u16)(uint64_t a) | ||
32 | } | 17 | } |
33 | 18 | ||
34 | /* Floating-point reciprocal exponent - see FPRecpX in ARM ARM */ | 19 | +/* Advanced SIMD three registers of the same length extension. |
35 | +float16 HELPER(frecpx_f16)(float16 a, void *fpstp) | 20 | + * 31 25 23 22 20 16 12 11 10 9 8 3 0 |
21 | + * +---------------+-----+---+-----+----+----+---+----+---+----+---------+----+ | ||
22 | + * | 1 1 1 1 1 1 0 | op1 | D | op2 | Vn | Vd | 1 | o3 | 0 | o4 | N Q M U | Vm | | ||
23 | + * +---------------+-----+---+-----+----+----+---+----+---+----+---------+----+ | ||
24 | + */ | ||
25 | +static int disas_neon_insn_3same_ext(DisasContext *s, uint32_t insn) | ||
36 | +{ | 26 | +{ |
37 | + float_status *fpst = fpstp; | 27 | + gen_helper_gvec_3_ptr *fn_gvec_ptr; |
38 | + uint16_t val16, sbit; | 28 | + int rd, rn, rm, rot, size, opr_sz; |
39 | + int16_t exp; | 29 | + TCGv_ptr fpst; |
30 | + bool q; | ||
40 | + | 31 | + |
41 | + if (float16_is_any_nan(a)) { | 32 | + q = extract32(insn, 6, 1); |
42 | + float16 nan = a; | 33 | + VFP_DREG_D(rd, insn); |
43 | + if (float16_is_signaling_nan(a, fpst)) { | 34 | + VFP_DREG_N(rn, insn); |
44 | + float_raise(float_flag_invalid, fpst); | 35 | + VFP_DREG_M(rm, insn); |
45 | + nan = float16_maybe_silence_nan(a, fpst); | 36 | + if ((rd | rn | rm) & q) { |
46 | + } | 37 | + return 1; |
47 | + if (fpst->default_nan_mode) { | ||
48 | + nan = float16_default_nan(fpst); | ||
49 | + } | ||
50 | + return nan; | ||
51 | + } | 38 | + } |
52 | + | 39 | + |
53 | + val16 = float16_val(a); | 40 | + if ((insn & 0xfe200f10) == 0xfc200800) { |
54 | + sbit = 0x8000 & val16; | 41 | + /* VCMLA -- 1111 110R R.1S .... .... 1000 ...0 .... */ |
55 | + exp = extract32(val16, 10, 5); | 42 | + size = extract32(insn, 20, 1); |
43 | + rot = extract32(insn, 23, 2); | ||
44 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA) | ||
45 | + || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) { | ||
46 | + return 1; | ||
47 | + } | ||
48 | + fn_gvec_ptr = size ? gen_helper_gvec_fcmlas : gen_helper_gvec_fcmlah; | ||
49 | + } else if ((insn & 0xfea00f10) == 0xfc800800) { | ||
50 | + /* VCADD -- 1111 110R 1.0S .... .... 1000 ...0 .... */ | ||
51 | + size = extract32(insn, 20, 1); | ||
52 | + rot = extract32(insn, 24, 1); | ||
53 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA) | ||
54 | + || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) { | ||
55 | + return 1; | ||
56 | + } | ||
57 | + fn_gvec_ptr = size ? gen_helper_gvec_fcadds : gen_helper_gvec_fcaddh; | ||
58 | + } else { | ||
59 | + return 1; | ||
60 | + } | ||
56 | + | 61 | + |
57 | + if (exp == 0) { | 62 | + if (s->fp_excp_el) { |
58 | + return make_float16(deposit32(sbit, 10, 5, 0x1e)); | 63 | + gen_exception_insn(s, 4, EXCP_UDEF, |
59 | + } else { | 64 | + syn_fp_access_trap(1, 0xe, false), s->fp_excp_el); |
60 | + return make_float16(deposit32(sbit, 10, 5, ~exp)); | 65 | + return 0; |
61 | + } | 66 | + } |
67 | + if (!s->vfp_enabled) { | ||
68 | + return 1; | ||
69 | + } | ||
70 | + | ||
71 | + opr_sz = (1 + q) * 8; | ||
72 | + fpst = get_fpstatus_ptr(1); | ||
73 | + tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd), | ||
74 | + vfp_reg_offset(1, rn), | ||
75 | + vfp_reg_offset(1, rm), fpst, | ||
76 | + opr_sz, opr_sz, rot, fn_gvec_ptr); | ||
77 | + tcg_temp_free_ptr(fpst); | ||
78 | + return 0; | ||
62 | +} | 79 | +} |
63 | + | 80 | + |
64 | float32 HELPER(frecpx_f32)(float32 a, void *fpstp) | 81 | static int disas_coproc_insn(DisasContext *s, uint32_t insn) |
65 | { | 82 | { |
66 | float_status *fpst = fpstp; | 83 | int cpnum, is64, crn, crm, opc1, opc2, isread, rt, rt2; |
67 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 84 | @@ -XXX,XX +XXX,XX @@ static void disas_arm_insn(DisasContext *s, unsigned int insn) |
68 | index XXXXXXX..XXXXXXX 100644 | 85 | } |
69 | --- a/target/arm/translate-a64.c | 86 | } |
70 | +++ b/target/arm/translate-a64.c | 87 | } |
71 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 88 | + } else if ((insn & 0x0e000a00) == 0x0c000800 |
72 | handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd); | 89 | + && arm_dc_feature(s, ARM_FEATURE_V8)) { |
73 | return; | 90 | + if (disas_neon_insn_3same_ext(s, insn)) { |
74 | case 0x3d: /* FRECPE */ | 91 | + goto illegal_op; |
75 | + case 0x3f: /* FRECPX */ | 92 | + } |
76 | break; | 93 | + return; |
77 | case 0x18: /* FRINTN */ | 94 | } else if ((insn & 0x0fe00000) == 0x0c400000) { |
78 | need_rmode = true; | 95 | /* Coprocessor double register transfer. */ |
79 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 96 | ARCH(5TE); |
80 | case 0x3d: /* FRECPE */ | ||
81 | gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus); | ||
82 | break; | ||
83 | + case 0x3f: /* FRECPX */ | ||
84 | + gen_helper_frecpx_f16(tcg_res, tcg_op, tcg_fpstatus); | ||
85 | + break; | ||
86 | case 0x5a: /* FCVTNU */ | ||
87 | case 0x5b: /* FCVTMU */ | ||
88 | case 0x5c: /* FCVTAU */ | ||
89 | -- | 97 | -- |
90 | 2.16.2 | 98 | 2.16.2 |
91 | 99 | ||
92 | 100 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This actually covers two different sections of the encoding table: | 3 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
4 | 4 | Message-id: 20180228193125.20577-15-richard.henderson@linaro.org | |
5 | Advanced SIMD scalar two-register miscellaneous FP16 | 5 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
6 | Advanced SIMD two-register miscellaneous (FP16) | ||
7 | |||
8 | The difference between the two is covered by a combination of Q (bit | ||
9 | 30) and S (bit 28). Notably the FRINTx instructions are only | ||
10 | available in the vector form. | ||
11 | |||
12 | This is just the decode skeleton which will be filled out by later | ||
13 | patches. | ||
14 | |||
15 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | ||
16 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | ||
17 | Message-id: 20180227143852.11175-17-alex.bennee@linaro.org | ||
18 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 6 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
19 | --- | 7 | --- |
20 | target/arm/translate-a64.c | 40 ++++++++++++++++++++++++++++++++++++++++ | 8 | target/arm/translate.c | 61 ++++++++++++++++++++++++++++++++++++++++++++++++++ |
21 | 1 file changed, 40 insertions(+) | 9 | 1 file changed, 61 insertions(+) |
22 | 10 | ||
23 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | 11 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
24 | index XXXXXXX..XXXXXXX 100644 | 12 | index XXXXXXX..XXXXXXX 100644 |
25 | --- a/target/arm/translate-a64.c | 13 | --- a/target/arm/translate.c |
26 | +++ b/target/arm/translate-a64.c | 14 | +++ b/target/arm/translate.c |
27 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn) | 15 | @@ -XXX,XX +XXX,XX @@ static int disas_neon_insn_3same_ext(DisasContext *s, uint32_t insn) |
28 | } | 16 | return 0; |
29 | } | 17 | } |
30 | 18 | ||
31 | +/* AdvSIMD [scalar] two register miscellaneous (FP16) | 19 | +/* Advanced SIMD two registers and a scalar extension. |
20 | + * 31 24 23 22 20 16 12 11 10 9 8 3 0 | ||
21 | + * +-----------------+----+---+----+----+----+---+----+---+----+---------+----+ | ||
22 | + * | 1 1 1 1 1 1 1 0 | o1 | D | o2 | Vn | Vd | 1 | o3 | 0 | o4 | N Q M U | Vm | | ||
23 | + * +-----------------+----+---+----+----+----+---+----+---+----+---------+----+ | ||
32 | + * | 24 | + * |
33 | + * 31 30 29 28 27 24 23 22 21 17 16 12 11 10 9 5 4 0 | ||
34 | + * +---+---+---+---+---------+---+-------------+--------+-----+------+------+ | ||
35 | + * | 0 | Q | U | S | 1 1 1 0 | a | 1 1 1 1 0 0 | opcode | 1 0 | Rn | Rd | | ||
36 | + * +---+---+---+---+---------+---+-------------+--------+-----+------+------+ | ||
37 | + * mask: 1000 1111 0111 1110 0000 1100 0000 0000 0x8f7e 0c00 | ||
38 | + * val: 0000 1110 0111 1000 0000 1000 0000 0000 0x0e78 0800 | ||
39 | + * | ||
40 | + * This actually covers two groups where scalar access is governed by | ||
41 | + * bit 28. A bunch of the instructions (float to integral) only exist | ||
42 | + * in the vector form and are un-allocated for the scalar decode. Also | ||
43 | + * in the scalar decode Q is always 1. | ||
44 | + */ | 25 | + */ |
45 | +static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn) | 26 | + |
27 | +static int disas_neon_insn_2reg_scalar_ext(DisasContext *s, uint32_t insn) | ||
46 | +{ | 28 | +{ |
47 | + int fpop, opcode, a; | 29 | + int rd, rn, rm, rot, size, opr_sz; |
30 | + TCGv_ptr fpst; | ||
31 | + bool q; | ||
48 | + | 32 | + |
49 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) { | 33 | + q = extract32(insn, 6, 1); |
50 | + unallocated_encoding(s); | 34 | + VFP_DREG_D(rd, insn); |
51 | + return; | 35 | + VFP_DREG_N(rn, insn); |
36 | + VFP_DREG_M(rm, insn); | ||
37 | + if ((rd | rn) & q) { | ||
38 | + return 1; | ||
52 | + } | 39 | + } |
53 | + | 40 | + |
54 | + if (!fp_access_check(s)) { | 41 | + if ((insn & 0xff000f10) == 0xfe000800) { |
55 | + return; | 42 | + /* VCMLA (indexed) -- 1111 1110 S.RR .... .... 1000 ...0 .... */ |
43 | + rot = extract32(insn, 20, 2); | ||
44 | + size = extract32(insn, 23, 1); | ||
45 | + if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA) | ||
46 | + || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) { | ||
47 | + return 1; | ||
48 | + } | ||
49 | + } else { | ||
50 | + return 1; | ||
56 | + } | 51 | + } |
57 | + | 52 | + |
58 | + opcode = extract32(insn, 12, 4); | 53 | + if (s->fp_excp_el) { |
59 | + a = extract32(insn, 23, 1); | 54 | + gen_exception_insn(s, 4, EXCP_UDEF, |
60 | + fpop = deposit32(opcode, 5, 1, a); | 55 | + syn_fp_access_trap(1, 0xe, false), s->fp_excp_el); |
61 | + | 56 | + return 0; |
62 | + switch (fpop) { | 57 | + } |
63 | + default: | 58 | + if (!s->vfp_enabled) { |
64 | + fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop); | 59 | + return 1; |
65 | + g_assert_not_reached(); | ||
66 | + } | 60 | + } |
67 | + | 61 | + |
62 | + opr_sz = (1 + q) * 8; | ||
63 | + fpst = get_fpstatus_ptr(1); | ||
64 | + tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd), | ||
65 | + vfp_reg_offset(1, rn), | ||
66 | + vfp_reg_offset(1, rm), fpst, | ||
67 | + opr_sz, opr_sz, rot, | ||
68 | + size ? gen_helper_gvec_fcmlas_idx | ||
69 | + : gen_helper_gvec_fcmlah_idx); | ||
70 | + tcg_temp_free_ptr(fpst); | ||
71 | + return 0; | ||
68 | +} | 72 | +} |
69 | + | 73 | + |
70 | /* AdvSIMD scalar x indexed element | 74 | static int disas_coproc_insn(DisasContext *s, uint32_t insn) |
71 | * 31 30 29 28 24 23 22 21 20 19 16 15 12 11 10 9 5 4 0 | 75 | { |
72 | * +-----+---+-----------+------+---+---+------+-----+---+---+------+------+ | 76 | int cpnum, is64, crn, crm, opc1, opc2, isread, rt, rt2; |
73 | @@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = { | 77 | @@ -XXX,XX +XXX,XX @@ static void disas_arm_insn(DisasContext *s, unsigned int insn) |
74 | { 0xce800000, 0xffe00000, disas_crypto_xar }, | 78 | goto illegal_op; |
75 | { 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 }, | 79 | } |
76 | { 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 }, | 80 | return; |
77 | + { 0x0e780800, 0x8f7e0c00, disas_simd_two_reg_misc_fp16 }, | 81 | + } else if ((insn & 0x0f000a00) == 0x0e000800 |
78 | { 0x00000000, 0x00000000, NULL } | 82 | + && arm_dc_feature(s, ARM_FEATURE_V8)) { |
79 | }; | 83 | + if (disas_neon_insn_2reg_scalar_ext(s, insn)) { |
80 | 84 | + goto illegal_op; | |
85 | + } | ||
86 | + return; | ||
87 | } else if ((insn & 0x0fe00000) == 0x0c400000) { | ||
88 | /* Coprocessor double register transfer. */ | ||
89 | ARCH(5TE); | ||
81 | -- | 90 | -- |
82 | 2.16.2 | 91 | 2.16.2 |
83 | 92 | ||
84 | 93 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | As the rounding mode is now split between FP16 and the rest of | 3 | Happily, the bits are in the same places compared to a32. |
4 | floating point we need to be explicit when tweaking it. Instead of | ||
5 | passing the CPU env we now pass the appropriate fpst pointer directly. | ||
6 | 4 | ||
7 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 6 | Message-id: 20180228193125.20577-16-richard.henderson@linaro.org |
9 | Message-id: 20180227143852.11175-6-alex.bennee@linaro.org | 7 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 9 | --- |
12 | target/arm/helper.h | 2 +- | 10 | target/arm/translate.c | 14 +++++++++++++- |
13 | target/arm/helper.c | 4 ++-- | 11 | 1 file changed, 13 insertions(+), 1 deletion(-) |
14 | target/arm/translate-a64.c | 26 +++++++++++++------------- | ||
15 | target/arm/translate.c | 12 ++++++------ | ||
16 | 4 files changed, 22 insertions(+), 22 deletions(-) | ||
17 | 12 | ||
18 | diff --git a/target/arm/helper.h b/target/arm/helper.h | ||
19 | index XXXXXXX..XXXXXXX 100644 | ||
20 | --- a/target/arm/helper.h | ||
21 | +++ b/target/arm/helper.h | ||
22 | @@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_uhtod, f64, i64, i32, ptr) | ||
23 | DEF_HELPER_3(vfp_ultod, f64, i64, i32, ptr) | ||
24 | DEF_HELPER_3(vfp_uqtod, f64, i64, i32, ptr) | ||
25 | |||
26 | -DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, env) | ||
27 | +DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, ptr) | ||
28 | DEF_HELPER_FLAGS_2(set_neon_rmode, TCG_CALL_NO_RWG, i32, i32, env) | ||
29 | |||
30 | DEF_HELPER_2(vfp_fcvt_f16_to_f32, f32, i32, env) | ||
31 | diff --git a/target/arm/helper.c b/target/arm/helper.c | ||
32 | index XXXXXXX..XXXXXXX 100644 | ||
33 | --- a/target/arm/helper.c | ||
34 | +++ b/target/arm/helper.c | ||
35 | @@ -XXX,XX +XXX,XX @@ VFP_CONV_FIX_A64(uq, s, 32, 64, uint64) | ||
36 | /* Set the current fp rounding mode and return the old one. | ||
37 | * The argument is a softfloat float_round_ value. | ||
38 | */ | ||
39 | -uint32_t HELPER(set_rmode)(uint32_t rmode, CPUARMState *env) | ||
40 | +uint32_t HELPER(set_rmode)(uint32_t rmode, void *fpstp) | ||
41 | { | ||
42 | - float_status *fp_status = &env->vfp.fp_status; | ||
43 | + float_status *fp_status = fpstp; | ||
44 | |||
45 | uint32_t prev_rmode = get_float_rounding_mode(fp_status); | ||
46 | set_float_rounding_mode(rmode, fp_status); | ||
47 | diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c | ||
48 | index XXXXXXX..XXXXXXX 100644 | ||
49 | --- a/target/arm/translate-a64.c | ||
50 | +++ b/target/arm/translate-a64.c | ||
51 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn) | ||
52 | { | ||
53 | TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7)); | ||
54 | |||
55 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
56 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
57 | gen_helper_rints(tcg_res, tcg_op, fpst); | ||
58 | |||
59 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
60 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
61 | tcg_temp_free_i32(tcg_rmode); | ||
62 | break; | ||
63 | } | ||
64 | @@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_double(DisasContext *s, int opcode, int rd, int rn) | ||
65 | { | ||
66 | TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7)); | ||
67 | |||
68 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
69 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
70 | gen_helper_rintd(tcg_res, tcg_op, fpst); | ||
71 | |||
72 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
73 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
74 | tcg_temp_free_i32(tcg_rmode); | ||
75 | break; | ||
76 | } | ||
77 | @@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode, | ||
78 | |||
79 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
80 | |||
81 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
82 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
83 | |||
84 | if (is_double) { | ||
85 | TCGv_i64 tcg_double = read_fp_dreg(s, rn); | ||
86 | @@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode, | ||
87 | tcg_temp_free_i32(tcg_single); | ||
88 | } | ||
89 | |||
90 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
91 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
92 | tcg_temp_free_i32(tcg_rmode); | ||
93 | |||
94 | if (!sf) { | ||
95 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar, | ||
96 | assert(!(is_scalar && is_q)); | ||
97 | |||
98 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(FPROUNDING_ZERO)); | ||
99 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
100 | tcg_fpstatus = get_fpstatus_ptr(false); | ||
101 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
102 | tcg_shift = tcg_const_i32(fracbits); | ||
103 | |||
104 | if (is_double) { | ||
105 | @@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar, | ||
106 | |||
107 | tcg_temp_free_ptr(tcg_fpstatus); | ||
108 | tcg_temp_free_i32(tcg_shift); | ||
109 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
110 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
111 | tcg_temp_free_i32(tcg_rmode); | ||
112 | } | ||
113 | |||
114 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn) | ||
115 | |||
116 | if (is_fcvt) { | ||
117 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
118 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
119 | tcg_fpstatus = get_fpstatus_ptr(false); | ||
120 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
121 | } else { | ||
122 | tcg_rmode = NULL; | ||
123 | tcg_fpstatus = NULL; | ||
124 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn) | ||
125 | } | ||
126 | |||
127 | if (is_fcvt) { | ||
128 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
129 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
130 | tcg_temp_free_i32(tcg_rmode); | ||
131 | tcg_temp_free_ptr(tcg_fpstatus); | ||
132 | } | ||
133 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn) | ||
134 | return; | ||
135 | } | ||
136 | |||
137 | - if (need_fpstatus) { | ||
138 | + if (need_fpstatus || need_rmode) { | ||
139 | tcg_fpstatus = get_fpstatus_ptr(false); | ||
140 | } else { | ||
141 | tcg_fpstatus = NULL; | ||
142 | } | ||
143 | if (need_rmode) { | ||
144 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode)); | ||
145 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
146 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
147 | } else { | ||
148 | tcg_rmode = NULL; | ||
149 | } | ||
150 | @@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn) | ||
151 | clear_vec_high(s, is_q, rd); | ||
152 | |||
153 | if (need_rmode) { | ||
154 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
155 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus); | ||
156 | tcg_temp_free_i32(tcg_rmode); | ||
157 | } | ||
158 | if (need_fpstatus) { | ||
159 | diff --git a/target/arm/translate.c b/target/arm/translate.c | 13 | diff --git a/target/arm/translate.c b/target/arm/translate.c |
160 | index XXXXXXX..XXXXXXX 100644 | 14 | index XXXXXXX..XXXXXXX 100644 |
161 | --- a/target/arm/translate.c | 15 | --- a/target/arm/translate.c |
162 | +++ b/target/arm/translate.c | 16 | +++ b/target/arm/translate.c |
163 | @@ -XXX,XX +XXX,XX @@ static int handle_vrint(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp, | 17 | @@ -XXX,XX +XXX,XX @@ static void disas_thumb2_insn(DisasContext *s, uint32_t insn) |
164 | TCGv_i32 tcg_rmode; | 18 | default_exception_el(s)); |
165 | 19 | break; | |
166 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding)); | 20 | } |
167 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | 21 | - if (((insn >> 24) & 3) == 3) { |
168 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | 22 | + if ((insn & 0xfe000a00) == 0xfc000800 |
169 | 23 | + && arm_dc_feature(s, ARM_FEATURE_V8)) { | |
170 | if (dp) { | 24 | + /* The Thumb2 and ARM encodings are identical. */ |
171 | TCGv_i64 tcg_op; | 25 | + if (disas_neon_insn_3same_ext(s, insn)) { |
172 | @@ -XXX,XX +XXX,XX @@ static int handle_vrint(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp, | 26 | + goto illegal_op; |
173 | tcg_temp_free_i32(tcg_res); | 27 | + } |
174 | } | 28 | + } else if ((insn & 0xff000a00) == 0xfe000800 |
175 | 29 | + && arm_dc_feature(s, ARM_FEATURE_V8)) { | |
176 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | 30 | + /* The Thumb2 and ARM encodings are identical. */ |
177 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | 31 | + if (disas_neon_insn_2reg_scalar_ext(s, insn)) { |
178 | tcg_temp_free_i32(tcg_rmode); | 32 | + goto illegal_op; |
179 | 33 | + } | |
180 | tcg_temp_free_ptr(fpst); | 34 | + } else if (((insn >> 24) & 3) == 3) { |
181 | @@ -XXX,XX +XXX,XX @@ static int handle_vcvt(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp, | 35 | /* Translate into the equivalent ARM encoding. */ |
182 | tcg_shift = tcg_const_i32(0); | 36 | insn = (insn & 0xe2ffffff) | ((insn & (1 << 28)) >> 4) | (1 << 28); |
183 | 37 | if (disas_neon_data_insn(s, insn)) { | |
184 | tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding)); | ||
185 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
186 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
187 | |||
188 | if (dp) { | ||
189 | TCGv_i64 tcg_double, tcg_res; | ||
190 | @@ -XXX,XX +XXX,XX @@ static int handle_vcvt(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp, | ||
191 | tcg_temp_free_i32(tcg_single); | ||
192 | } | ||
193 | |||
194 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
195 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
196 | tcg_temp_free_i32(tcg_rmode); | ||
197 | |||
198 | tcg_temp_free_i32(tcg_shift); | ||
199 | @@ -XXX,XX +XXX,XX @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn) | ||
200 | TCGv_ptr fpst = get_fpstatus_ptr(0); | ||
201 | TCGv_i32 tcg_rmode; | ||
202 | tcg_rmode = tcg_const_i32(float_round_to_zero); | ||
203 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
204 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
205 | if (dp) { | ||
206 | gen_helper_rintd(cpu_F0d, cpu_F0d, fpst); | ||
207 | } else { | ||
208 | gen_helper_rints(cpu_F0s, cpu_F0s, fpst); | ||
209 | } | ||
210 | - gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env); | ||
211 | + gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst); | ||
212 | tcg_temp_free_i32(tcg_rmode); | ||
213 | tcg_temp_free_ptr(fpst); | ||
214 | break; | ||
215 | -- | 38 | -- |
216 | 2.16.2 | 39 | 2.16.2 |
217 | 40 | ||
218 | 41 | diff view generated by jsdifflib |
1 | From: Alex Bennée <alex.bennee@linaro.org> | 1 | From: Richard Henderson <richard.henderson@linaro.org> |
---|---|---|---|
2 | 2 | ||
3 | This allows us to explicitly pass float16 to helpers rather than | 3 | Enable it for the "any" CPU used by *-linux-user. |
4 | assuming uint32_t and dealing with the result. Of course they will be | ||
5 | passed in i32 sized registers by default. | ||
6 | 4 | ||
7 | Signed-off-by: Alex Bennée <alex.bennee@linaro.org> | 5 | Signed-off-by: Richard Henderson <richard.henderson@linaro.org> |
8 | Reviewed-by: Richard Henderson <richard.henderson@linaro.org> | 6 | Reviewed-by: Peter Maydell <peter.maydell@linaro.org> |
9 | Message-id: 20180227143852.11175-2-alex.bennee@linaro.org | 7 | Message-id: 20180228193125.20577-17-richard.henderson@linaro.org |
10 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> | 8 | Signed-off-by: Peter Maydell <peter.maydell@linaro.org> |
11 | --- | 9 | --- |
12 | include/exec/helper-head.h | 3 +++ | 10 | target/arm/cpu.c | 1 + |
13 | 1 file changed, 3 insertions(+) | 11 | target/arm/cpu64.c | 1 + |
12 | 2 files changed, 2 insertions(+) | ||
14 | 13 | ||
15 | diff --git a/include/exec/helper-head.h b/include/exec/helper-head.h | 14 | diff --git a/target/arm/cpu.c b/target/arm/cpu.c |
16 | index XXXXXXX..XXXXXXX 100644 | 15 | index XXXXXXX..XXXXXXX 100644 |
17 | --- a/include/exec/helper-head.h | 16 | --- a/target/arm/cpu.c |
18 | +++ b/include/exec/helper-head.h | 17 | +++ b/target/arm/cpu.c |
19 | @@ -XXX,XX +XXX,XX @@ | 18 | @@ -XXX,XX +XXX,XX @@ static void arm_any_initfn(Object *obj) |
20 | #define dh_alias_int i32 | 19 | set_feature(&cpu->env, ARM_FEATURE_V8_PMULL); |
21 | #define dh_alias_i64 i64 | 20 | set_feature(&cpu->env, ARM_FEATURE_CRC); |
22 | #define dh_alias_s64 i64 | 21 | set_feature(&cpu->env, ARM_FEATURE_V8_RDM); |
23 | +#define dh_alias_f16 i32 | 22 | + set_feature(&cpu->env, ARM_FEATURE_V8_FCMA); |
24 | #define dh_alias_f32 i32 | 23 | cpu->midr = 0xffffffff; |
25 | #define dh_alias_f64 i64 | 24 | } |
26 | #define dh_alias_ptr ptr | 25 | #endif |
27 | @@ -XXX,XX +XXX,XX @@ | 26 | diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c |
28 | #define dh_ctype_int int | 27 | index XXXXXXX..XXXXXXX 100644 |
29 | #define dh_ctype_i64 uint64_t | 28 | --- a/target/arm/cpu64.c |
30 | #define dh_ctype_s64 int64_t | 29 | +++ b/target/arm/cpu64.c |
31 | +#define dh_ctype_f16 float16 | 30 | @@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj) |
32 | #define dh_ctype_f32 float32 | 31 | set_feature(&cpu->env, ARM_FEATURE_CRC); |
33 | #define dh_ctype_f64 float64 | 32 | set_feature(&cpu->env, ARM_FEATURE_V8_RDM); |
34 | #define dh_ctype_ptr void * | 33 | set_feature(&cpu->env, ARM_FEATURE_V8_FP16); |
35 | @@ -XXX,XX +XXX,XX @@ | 34 | + set_feature(&cpu->env, ARM_FEATURE_V8_FCMA); |
36 | #define dh_is_signed_s32 1 | 35 | cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */ |
37 | #define dh_is_signed_i64 0 | 36 | cpu->dcz_blocksize = 7; /* 512 bytes */ |
38 | #define dh_is_signed_s64 1 | 37 | } |
39 | +#define dh_is_signed_f16 0 | ||
40 | #define dh_is_signed_f32 0 | ||
41 | #define dh_is_signed_f64 0 | ||
42 | #define dh_is_signed_tl 0 | ||
43 | -- | 38 | -- |
44 | 2.16.2 | 39 | 2.16.2 |
45 | 40 | ||
46 | 41 | diff view generated by jsdifflib |