1
Arm queue -- I have more stuff pending but I prefer to push
1
Second pull request of the week; mostly RTH's support for some
2
this first lot out and keep the pull below 50 patches.
2
new-in-v8.1/v8.3 instructions, and my v8M board model.
3
Most of this is Alex's FP16 support work.
4
3
4
thanks
5
-- PMM
5
-- PMM
6
6
7
The following changes since commit 427cbc7e4136a061628cb4315cc8182ea36d772f:
7
8
8
The following changes since commit 6697439794f72b3501ee16bb95d16854f9981421:
9
Merge remote-tracking branch 'remotes/mst/tags/for_upstream' into staging (2018-03-01 18:46:41 +0000)
9
10
Merge remote-tracking branch 'remotes/kraxel/tags/usb-20180227-pull-request' into staging (2018-02-27 17:50:46 +0000)
11
10
12
are available in the Git repository at:
11
are available in the Git repository at:
13
12
14
git://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20180301
13
git://git.linaro.org/people/pmaydell/qemu-arm.git tags/pull-target-arm-20180302
15
14
16
for you to fetch changes up to c22e580c2ad1cccef582e1490e732f254d4ac064:
15
for you to fetch changes up to e66a67bf28e1b4fce2e3d72a2610dbd48d9d3078:
17
16
18
MAINTAINERS: Update my email address (2018-03-01 11:13:59 +0000)
17
target/arm: Enable ARM_FEATURE_V8_FCMA (2018-03-02 11:03:45 +0000)
19
18
20
----------------------------------------------------------------
19
----------------------------------------------------------------
21
target-arm queue:
20
target-arm queue:
22
* update MAINTAINERS for Alistair's new email address
21
* implement FCMA and RDM v8.1 and v8.3 instructions
23
* add Arm v8.2 FP16 arithmetic extension for linux-user
22
* enable Cortex-M33 v8M core, and provide new mps2-an505 board model
24
* implement display connector emulation for vexpress board
23
that uses it
25
* xilinx_spips: Enable only two slaves when reading/writing with stripe
24
* decodetree: Propagate return value from translate subroutines
26
* xilinx_spips: Use 8 dummy cycles with the QIOR/QIOR4 commands
25
* xlnx-zynqmp: Implement the RTC device
27
* hw: register: Run post_write hook on reset
28
26
29
----------------------------------------------------------------
27
----------------------------------------------------------------
30
Alex Bennée (31):
28
Alistair Francis (3):
31
include/exec/helper-head.h: support f16 in helper calls
29
xlnx-zynqmp-rtc: Initial commit
32
target/arm/cpu64: introduce ARM_V8_FP16 feature bit
30
xlnx-zynqmp-rtc: Add basic time support
33
target/arm/cpu.h: update comment for half-precision values
31
xlnx-zynqmp: Connect the RTC device
34
target/arm/cpu.h: add additional float_status flags
35
target/arm/helper: pass explicit fpst to set_rmode
36
arm/translate-a64: implement half-precision F(MIN|MAX)(V|NMV)
37
arm/translate-a64: handle_3same_64 comment fix
38
arm/translate-a64: initial decode for simd_three_reg_same_fp16
39
arm/translate-a64: add FP16 FADD/FABD/FSUB/FMUL/FDIV to simd_three_reg_same_fp16
40
arm/translate-a64: add FP16 F[A]C[EQ/GE/GT] to simd_three_reg_same_fp16
41
arm/translate-a64: add FP16 FMULA/X/S to simd_three_reg_same_fp16
42
arm/translate-a64: add FP16 FR[ECP/SQRT]S to simd_three_reg_same_fp16
43
arm/translate-a64: add FP16 pairwise ops simd_three_reg_same_fp16
44
arm/translate-a64: add FP16 FMULX/MLS/FMLA to simd_indexed
45
arm/translate-a64: add FP16 x2 ops for simd_indexed
46
arm/translate-a64: initial decode for simd_two_reg_misc_fp16
47
arm/translate-a64: add FP16 FPRINTx to simd_two_reg_misc_fp16
48
arm/translate-a64: add FCVTxx to simd_two_reg_misc_fp16
49
arm/translate-a64: add FP16 FCMxx (zero) to simd_two_reg_misc_fp16
50
arm/translate-a64: add FP16 SCVTF/UCVFT to simd_two_reg_misc_fp16
51
arm/translate-a64: add FP16 FNEG/FABS to simd_two_reg_misc_fp16
52
arm/helper.c: re-factor recpe and add recepe_f16
53
arm/translate-a64: add FP16 FRECPE
54
arm/translate-a64: add FP16 FRCPX to simd_two_reg_misc_fp16
55
arm/translate-a64: add FP16 FSQRT to simd_two_reg_misc_fp16
56
arm/helper.c: re-factor rsqrte and add rsqrte_f16
57
arm/translate-a64: add FP16 FRSQRTE to simd_two_reg_misc_fp16
58
arm/translate-a64: add FP16 FMOV to simd_mod_imm
59
arm/translate-a64: add all FP16 ops in simd_scalar_pairwise
60
arm/translate-a64: implement simd_scalar_three_reg_same_fp16
61
arm/translate-a64: add all single op FP16 to handle_fp_1src_half
62
32
63
Alistair Francis (2):
33
Peter Maydell (19):
64
hw: register: Run post_write hook on reset
34
loader: Add new load_ramdisk_as()
65
MAINTAINERS: Update my email address
35
hw/arm/boot: Honour CPU's address space for image loads
36
hw/arm/armv7m: Honour CPU's address space for image loads
37
target/arm: Define an IDAU interface
38
armv7m: Forward idau property to CPU object
39
target/arm: Define init-svtor property for the reset secure VTOR value
40
armv7m: Forward init-svtor property to CPU object
41
target/arm: Add Cortex-M33
42
hw/misc/unimp: Move struct to header file
43
include/hw/or-irq.h: Add missing include guard
44
qdev: Add new qdev_init_gpio_in_named_with_opaque()
45
hw/core/split-irq: Device that splits IRQ lines
46
hw/misc/mps2-fpgaio: FPGA control block for MPS2 AN505
47
hw/misc/tz-ppc: Model TrustZone peripheral protection controller
48
hw/misc/iotkit-secctl: Arm IoT Kit security controller initial skeleton
49
hw/misc/iotkit-secctl: Add handling for PPCs
50
hw/misc/iotkit-secctl: Add remaining simple registers
51
hw/arm/iotkit: Model Arm IOT Kit
52
mps2-an505: New board model: MPS2 with AN505 Cortex-M33 FPGA image
66
53
67
Corey Minyard (2):
54
Richard Henderson (17):
68
i2c: Fix some brace style issues
55
decodetree: Propagate return value from translate subroutines
69
i2c: Move the bus class to i2c.h
56
target/arm: Add ARM_FEATURE_V8_RDM
57
target/arm: Refactor disas_simd_indexed decode
58
target/arm: Refactor disas_simd_indexed size checks
59
target/arm: Decode aa64 armv8.1 scalar three same extra
60
target/arm: Decode aa64 armv8.1 three same extra
61
target/arm: Decode aa64 armv8.1 scalar/vector x indexed element
62
target/arm: Decode aa32 armv8.1 three same
63
target/arm: Decode aa32 armv8.1 two reg and a scalar
64
target/arm: Enable ARM_FEATURE_V8_RDM
65
target/arm: Add ARM_FEATURE_V8_FCMA
66
target/arm: Decode aa64 armv8.3 fcadd
67
target/arm: Decode aa64 armv8.3 fcmla
68
target/arm: Decode aa32 armv8.3 3-same
69
target/arm: Decode aa32 armv8.3 2-reg-index
70
target/arm: Decode t32 simd 3reg and 2reg_scalar extension
71
target/arm: Enable ARM_FEATURE_V8_FCMA
70
72
71
Francisco Iglesias (2):
73
hw/arm/Makefile.objs | 2 +
72
xilinx_spips: Enable only two slaves when reading/writing with stripe
74
hw/core/Makefile.objs | 1 +
73
xilinx_spips: Use 8 dummy cycles with the QIOR/QIOR4 commands
75
hw/misc/Makefile.objs | 4 +
76
hw/timer/Makefile.objs | 1 +
77
target/arm/Makefile.objs | 2 +-
78
include/hw/arm/armv7m.h | 5 +
79
include/hw/arm/iotkit.h | 109 ++++++
80
include/hw/arm/xlnx-zynqmp.h | 2 +
81
include/hw/core/split-irq.h | 57 +++
82
include/hw/irq.h | 4 +-
83
include/hw/loader.h | 12 +-
84
include/hw/misc/iotkit-secctl.h | 103 ++++++
85
include/hw/misc/mps2-fpgaio.h | 43 +++
86
include/hw/misc/tz-ppc.h | 101 ++++++
87
include/hw/misc/unimp.h | 10 +
88
include/hw/or-irq.h | 5 +
89
include/hw/qdev-core.h | 30 +-
90
include/hw/timer/xlnx-zynqmp-rtc.h | 86 +++++
91
target/arm/cpu.h | 8 +
92
target/arm/helper.h | 31 ++
93
target/arm/idau.h | 61 ++++
94
hw/arm/armv7m.c | 35 +-
95
hw/arm/boot.c | 119 ++++---
96
hw/arm/iotkit.c | 598 +++++++++++++++++++++++++++++++
97
hw/arm/mps2-tz.c | 503 ++++++++++++++++++++++++++
98
hw/arm/xlnx-zynqmp.c | 14 +
99
hw/core/loader.c | 8 +-
100
hw/core/qdev.c | 8 +-
101
hw/core/split-irq.c | 89 +++++
102
hw/misc/iotkit-secctl.c | 704 +++++++++++++++++++++++++++++++++++++
103
hw/misc/mps2-fpgaio.c | 176 ++++++++++
104
hw/misc/tz-ppc.c | 302 ++++++++++++++++
105
hw/misc/unimp.c | 10 -
106
hw/timer/xlnx-zynqmp-rtc.c | 272 ++++++++++++++
107
linux-user/elfload.c | 2 +
108
target/arm/cpu.c | 66 +++-
109
target/arm/cpu64.c | 2 +
110
target/arm/helper.c | 28 +-
111
target/arm/translate-a64.c | 514 +++++++++++++++++++++------
112
target/arm/translate.c | 275 +++++++++++++--
113
target/arm/vec_helper.c | 429 ++++++++++++++++++++++
114
default-configs/arm-softmmu.mak | 5 +
115
hw/misc/trace-events | 24 ++
116
hw/timer/trace-events | 3 +
117
scripts/decodetree.py | 5 +-
118
45 files changed, 4668 insertions(+), 200 deletions(-)
119
create mode 100644 include/hw/arm/iotkit.h
120
create mode 100644 include/hw/core/split-irq.h
121
create mode 100644 include/hw/misc/iotkit-secctl.h
122
create mode 100644 include/hw/misc/mps2-fpgaio.h
123
create mode 100644 include/hw/misc/tz-ppc.h
124
create mode 100644 include/hw/timer/xlnx-zynqmp-rtc.h
125
create mode 100644 target/arm/idau.h
126
create mode 100644 hw/arm/iotkit.c
127
create mode 100644 hw/arm/mps2-tz.c
128
create mode 100644 hw/core/split-irq.c
129
create mode 100644 hw/misc/iotkit-secctl.c
130
create mode 100644 hw/misc/mps2-fpgaio.c
131
create mode 100644 hw/misc/tz-ppc.c
132
create mode 100644 hw/timer/xlnx-zynqmp-rtc.c
133
create mode 100644 target/arm/vec_helper.c
74
134
75
Linus Walleij (3):
76
hw/i2c-ddc: Do not fail writes
77
hw/sii9022: Add support for Silicon Image SII9022
78
arm/vexpress: Add proper display connector emulation
79
80
Peter Maydell (2):
81
target/arm: Enable ARM_V8_FP16 feature bit for the AArch64 "any" CPU
82
linux-user: Report AArch64 FP16 support via hwcap bits
83
84
hw/display/Makefile.objs | 1 +
85
include/exec/helper-head.h | 3 +
86
include/fpu/softfloat.h | 18 +-
87
include/hw/i2c/i2c.h | 23 +-
88
include/hw/register.h | 6 +-
89
target/arm/cpu.h | 34 +-
90
target/arm/helper-a64.h | 33 +
91
target/arm/helper.h | 14 +-
92
hw/arm/vexpress.c | 6 +-
93
hw/core/register.c | 8 +
94
hw/display/sii9022.c | 191 ++++++
95
hw/i2c/core.c | 18 -
96
hw/i2c/i2c-ddc.c | 4 +-
97
hw/ssi/xilinx_spips.c | 43 +-
98
linux-user/elfload.c | 2 +
99
target/arm/cpu64.c | 1 +
100
target/arm/helper-a64.c | 269 +++++++++
101
target/arm/helper.c | 481 ++++++++-------
102
target/arm/translate-a64.c | 1266 +++++++++++++++++++++++++++++++++------
103
target/arm/translate.c | 12 +-
104
MAINTAINERS | 12 +-
105
default-configs/arm-softmmu.mak | 2 +
106
hw/display/trace-events | 5 +
107
23 files changed, 1981 insertions(+), 471 deletions(-)
108
create mode 100644 hw/display/sii9022.c
109
diff view generated by jsdifflib
1
From: Alistair Francis <alistair.francis@xilinx.com>
1
From: Alistair Francis <alistair.francis@xilinx.com>
2
2
3
I am leaving Xilinx, so to avoid having an email address that bounces
3
Initial commit of the ZynqMP RTC device.
4
update my maintainer address to point to my personal email address.
5
4
6
Signed-off-by: Alistair Francis <alistair.francis@xilinx.com>
5
Signed-off-by: Alistair Francis <alistair.francis@xilinx.com>
7
Signed-off-by: Alistair Francis <alistair@alistair23.me>
8
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
6
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
9
Message-id: 7bb690382e3370aa1c1e047a84e36603c787ec0e.1519749987.git.alistair.francis@xilinx.com
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
8
---
12
MAINTAINERS | 12 ++++++------
9
hw/timer/Makefile.objs | 1 +
13
1 file changed, 6 insertions(+), 6 deletions(-)
10
include/hw/timer/xlnx-zynqmp-rtc.h | 84 +++++++++++++++
14
11
hw/timer/xlnx-zynqmp-rtc.c | 214 +++++++++++++++++++++++++++++++++++++
15
diff --git a/MAINTAINERS b/MAINTAINERS
12
3 files changed, 299 insertions(+)
13
create mode 100644 include/hw/timer/xlnx-zynqmp-rtc.h
14
create mode 100644 hw/timer/xlnx-zynqmp-rtc.c
15
16
diff --git a/hw/timer/Makefile.objs b/hw/timer/Makefile.objs
16
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
17
--- a/MAINTAINERS
18
--- a/hw/timer/Makefile.objs
18
+++ b/MAINTAINERS
19
+++ b/hw/timer/Makefile.objs
19
@@ -XXX,XX +XXX,XX @@ F: hw/misc/arm_sysctl.c
20
@@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_IMX) += imx_epit.o
20
21
common-obj-$(CONFIG_IMX) += imx_gpt.o
21
Xilinx Zynq
22
common-obj-$(CONFIG_LM32) += lm32_timer.o
22
M: Edgar E. Iglesias <edgar.iglesias@gmail.com>
23
common-obj-$(CONFIG_MILKYMIST) += milkymist-sysctl.o
23
-M: Alistair Francis <alistair.francis@xilinx.com>
24
+common-obj-$(CONFIG_XLNX_ZYNQMP) += xlnx-zynqmp-rtc.o
24
+M: Alistair Francis <alistair@alistair23.me>
25
25
L: qemu-arm@nongnu.org
26
obj-$(CONFIG_ALTERA_TIMER) += altera_timer.o
26
S: Maintained
27
obj-$(CONFIG_EXYNOS4) += exynos4210_mct.o
27
F: hw/*/xilinx_*
28
diff --git a/include/hw/timer/xlnx-zynqmp-rtc.h b/include/hw/timer/xlnx-zynqmp-rtc.h
28
@@ -XXX,XX +XXX,XX @@ F: include/hw/misc/zynq*
29
new file mode 100644
29
X: hw/ssi/xilinx_*
30
index XXXXXXX..XXXXXXX
30
31
--- /dev/null
31
Xilinx ZynqMP
32
+++ b/include/hw/timer/xlnx-zynqmp-rtc.h
32
-M: Alistair Francis <alistair.francis@xilinx.com>
33
@@ -XXX,XX +XXX,XX @@
33
+M: Alistair Francis <alistair@alistair23.me>
34
+/*
34
M: Edgar E. Iglesias <edgar.iglesias@gmail.com>
35
+ * QEMU model of the Xilinx ZynqMP Real Time Clock (RTC).
35
L: qemu-arm@nongnu.org
36
+ *
36
S: Maintained
37
+ * Copyright (c) 2017 Xilinx Inc.
37
@@ -XXX,XX +XXX,XX @@ T: git git://github.com/bonzini/qemu.git scsi-next
38
+ *
38
39
+ * Written-by: Alistair Francis <alistair.francis@xilinx.com>
39
SSI
40
+ *
40
M: Peter Crosthwaite <crosthwaite.peter@gmail.com>
41
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
41
-M: Alistair Francis <alistair.francis@xilinx.com>
42
+ * of this software and associated documentation files (the "Software"), to deal
42
+M: Alistair Francis <alistair@alistair23.me>
43
+ * in the Software without restriction, including without limitation the rights
43
S: Maintained
44
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
44
F: hw/ssi/*
45
+ * copies of the Software, and to permit persons to whom the Software is
45
F: hw/block/m25p80.c
46
+ * furnished to do so, subject to the following conditions:
46
@@ -XXX,XX +XXX,XX @@ X: hw/ssi/xilinx_*
47
+ *
47
F: tests/m25p80-test.c
48
+ * The above copyright notice and this permission notice shall be included in
48
49
+ * all copies or substantial portions of the Software.
49
Xilinx SPI
50
+ *
50
-M: Alistair Francis <alistair.francis@xilinx.com>
51
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
51
+M: Alistair Francis <alistair@alistair23.me>
52
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
52
M: Peter Crosthwaite <crosthwaite.peter@gmail.com>
53
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
53
S: Maintained
54
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
54
F: hw/ssi/xilinx_*
55
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
55
@@ -XXX,XX +XXX,XX @@ S: Maintained
56
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
56
F: hw/net/eepro100.c
57
+ * THE SOFTWARE.
57
58
+ */
58
Generic Loader
59
+
59
-M: Alistair Francis <alistair.francis@xilinx.com>
60
+#include "hw/register.h"
60
+M: Alistair Francis <alistair@alistair23.me>
61
+
61
S: Maintained
62
+#define TYPE_XLNX_ZYNQMP_RTC "xlnx-zynmp.rtc"
62
F: hw/core/generic-loader.c
63
+
63
F: include/hw/core/generic-loader.h
64
+#define XLNX_ZYNQMP_RTC(obj) \
64
@@ -XXX,XX +XXX,XX @@ F: tests/qmp-test.c
65
+ OBJECT_CHECK(XlnxZynqMPRTC, (obj), TYPE_XLNX_ZYNQMP_RTC)
65
T: git git://repo.or.cz/qemu/armbru.git qapi-next
66
+
66
67
+REG32(SET_TIME_WRITE, 0x0)
67
Register API
68
+REG32(SET_TIME_READ, 0x4)
68
-M: Alistair Francis <alistair.francis@xilinx.com>
69
+REG32(CALIB_WRITE, 0x8)
69
+M: Alistair Francis <alistair@alistair23.me>
70
+ FIELD(CALIB_WRITE, FRACTION_EN, 20, 1)
70
S: Maintained
71
+ FIELD(CALIB_WRITE, FRACTION_DATA, 16, 4)
71
F: hw/core/register.c
72
+ FIELD(CALIB_WRITE, MAX_TICK, 0, 16)
72
F: include/hw/register.h
73
+REG32(CALIB_READ, 0xc)
74
+ FIELD(CALIB_READ, FRACTION_EN, 20, 1)
75
+ FIELD(CALIB_READ, FRACTION_DATA, 16, 4)
76
+ FIELD(CALIB_READ, MAX_TICK, 0, 16)
77
+REG32(CURRENT_TIME, 0x10)
78
+REG32(CURRENT_TICK, 0x14)
79
+ FIELD(CURRENT_TICK, VALUE, 0, 16)
80
+REG32(ALARM, 0x18)
81
+REG32(RTC_INT_STATUS, 0x20)
82
+ FIELD(RTC_INT_STATUS, ALARM, 1, 1)
83
+ FIELD(RTC_INT_STATUS, SECONDS, 0, 1)
84
+REG32(RTC_INT_MASK, 0x24)
85
+ FIELD(RTC_INT_MASK, ALARM, 1, 1)
86
+ FIELD(RTC_INT_MASK, SECONDS, 0, 1)
87
+REG32(RTC_INT_EN, 0x28)
88
+ FIELD(RTC_INT_EN, ALARM, 1, 1)
89
+ FIELD(RTC_INT_EN, SECONDS, 0, 1)
90
+REG32(RTC_INT_DIS, 0x2c)
91
+ FIELD(RTC_INT_DIS, ALARM, 1, 1)
92
+ FIELD(RTC_INT_DIS, SECONDS, 0, 1)
93
+REG32(ADDR_ERROR, 0x30)
94
+ FIELD(ADDR_ERROR, STATUS, 0, 1)
95
+REG32(ADDR_ERROR_INT_MASK, 0x34)
96
+ FIELD(ADDR_ERROR_INT_MASK, MASK, 0, 1)
97
+REG32(ADDR_ERROR_INT_EN, 0x38)
98
+ FIELD(ADDR_ERROR_INT_EN, MASK, 0, 1)
99
+REG32(ADDR_ERROR_INT_DIS, 0x3c)
100
+ FIELD(ADDR_ERROR_INT_DIS, MASK, 0, 1)
101
+REG32(CONTROL, 0x40)
102
+ FIELD(CONTROL, BATTERY_DISABLE, 31, 1)
103
+ FIELD(CONTROL, OSC_CNTRL, 24, 4)
104
+ FIELD(CONTROL, SLVERR_ENABLE, 0, 1)
105
+REG32(SAFETY_CHK, 0x50)
106
+
107
+#define XLNX_ZYNQMP_RTC_R_MAX (R_SAFETY_CHK + 1)
108
+
109
+typedef struct XlnxZynqMPRTC {
110
+ SysBusDevice parent_obj;
111
+ MemoryRegion iomem;
112
+ qemu_irq irq_rtc_int;
113
+ qemu_irq irq_addr_error_int;
114
+
115
+ uint32_t regs[XLNX_ZYNQMP_RTC_R_MAX];
116
+ RegisterInfo regs_info[XLNX_ZYNQMP_RTC_R_MAX];
117
+} XlnxZynqMPRTC;
118
diff --git a/hw/timer/xlnx-zynqmp-rtc.c b/hw/timer/xlnx-zynqmp-rtc.c
119
new file mode 100644
120
index XXXXXXX..XXXXXXX
121
--- /dev/null
122
+++ b/hw/timer/xlnx-zynqmp-rtc.c
123
@@ -XXX,XX +XXX,XX @@
124
+/*
125
+ * QEMU model of the Xilinx ZynqMP Real Time Clock (RTC).
126
+ *
127
+ * Copyright (c) 2017 Xilinx Inc.
128
+ *
129
+ * Written-by: Alistair Francis <alistair.francis@xilinx.com>
130
+ *
131
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
132
+ * of this software and associated documentation files (the "Software"), to deal
133
+ * in the Software without restriction, including without limitation the rights
134
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
135
+ * copies of the Software, and to permit persons to whom the Software is
136
+ * furnished to do so, subject to the following conditions:
137
+ *
138
+ * The above copyright notice and this permission notice shall be included in
139
+ * all copies or substantial portions of the Software.
140
+ *
141
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
142
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
143
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
144
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
145
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
146
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
147
+ * THE SOFTWARE.
148
+ */
149
+
150
+#include "qemu/osdep.h"
151
+#include "hw/sysbus.h"
152
+#include "hw/register.h"
153
+#include "qemu/bitops.h"
154
+#include "qemu/log.h"
155
+#include "hw/timer/xlnx-zynqmp-rtc.h"
156
+
157
+#ifndef XLNX_ZYNQMP_RTC_ERR_DEBUG
158
+#define XLNX_ZYNQMP_RTC_ERR_DEBUG 0
159
+#endif
160
+
161
+static void rtc_int_update_irq(XlnxZynqMPRTC *s)
162
+{
163
+ bool pending = s->regs[R_RTC_INT_STATUS] & ~s->regs[R_RTC_INT_MASK];
164
+ qemu_set_irq(s->irq_rtc_int, pending);
165
+}
166
+
167
+static void addr_error_int_update_irq(XlnxZynqMPRTC *s)
168
+{
169
+ bool pending = s->regs[R_ADDR_ERROR] & ~s->regs[R_ADDR_ERROR_INT_MASK];
170
+ qemu_set_irq(s->irq_addr_error_int, pending);
171
+}
172
+
173
+static void rtc_int_status_postw(RegisterInfo *reg, uint64_t val64)
174
+{
175
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
176
+ rtc_int_update_irq(s);
177
+}
178
+
179
+static uint64_t rtc_int_en_prew(RegisterInfo *reg, uint64_t val64)
180
+{
181
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
182
+
183
+ s->regs[R_RTC_INT_MASK] &= (uint32_t) ~val64;
184
+ rtc_int_update_irq(s);
185
+ return 0;
186
+}
187
+
188
+static uint64_t rtc_int_dis_prew(RegisterInfo *reg, uint64_t val64)
189
+{
190
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
191
+
192
+ s->regs[R_RTC_INT_MASK] |= (uint32_t) val64;
193
+ rtc_int_update_irq(s);
194
+ return 0;
195
+}
196
+
197
+static void addr_error_postw(RegisterInfo *reg, uint64_t val64)
198
+{
199
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
200
+ addr_error_int_update_irq(s);
201
+}
202
+
203
+static uint64_t addr_error_int_en_prew(RegisterInfo *reg, uint64_t val64)
204
+{
205
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
206
+
207
+ s->regs[R_ADDR_ERROR_INT_MASK] &= (uint32_t) ~val64;
208
+ addr_error_int_update_irq(s);
209
+ return 0;
210
+}
211
+
212
+static uint64_t addr_error_int_dis_prew(RegisterInfo *reg, uint64_t val64)
213
+{
214
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
215
+
216
+ s->regs[R_ADDR_ERROR_INT_MASK] |= (uint32_t) val64;
217
+ addr_error_int_update_irq(s);
218
+ return 0;
219
+}
220
+
221
+static const RegisterAccessInfo rtc_regs_info[] = {
222
+ { .name = "SET_TIME_WRITE", .addr = A_SET_TIME_WRITE,
223
+ },{ .name = "SET_TIME_READ", .addr = A_SET_TIME_READ,
224
+ .ro = 0xffffffff,
225
+ },{ .name = "CALIB_WRITE", .addr = A_CALIB_WRITE,
226
+ },{ .name = "CALIB_READ", .addr = A_CALIB_READ,
227
+ .ro = 0x1fffff,
228
+ },{ .name = "CURRENT_TIME", .addr = A_CURRENT_TIME,
229
+ .ro = 0xffffffff,
230
+ },{ .name = "CURRENT_TICK", .addr = A_CURRENT_TICK,
231
+ .ro = 0xffff,
232
+ },{ .name = "ALARM", .addr = A_ALARM,
233
+ },{ .name = "RTC_INT_STATUS", .addr = A_RTC_INT_STATUS,
234
+ .w1c = 0x3,
235
+ .post_write = rtc_int_status_postw,
236
+ },{ .name = "RTC_INT_MASK", .addr = A_RTC_INT_MASK,
237
+ .reset = 0x3,
238
+ .ro = 0x3,
239
+ },{ .name = "RTC_INT_EN", .addr = A_RTC_INT_EN,
240
+ .pre_write = rtc_int_en_prew,
241
+ },{ .name = "RTC_INT_DIS", .addr = A_RTC_INT_DIS,
242
+ .pre_write = rtc_int_dis_prew,
243
+ },{ .name = "ADDR_ERROR", .addr = A_ADDR_ERROR,
244
+ .w1c = 0x1,
245
+ .post_write = addr_error_postw,
246
+ },{ .name = "ADDR_ERROR_INT_MASK", .addr = A_ADDR_ERROR_INT_MASK,
247
+ .reset = 0x1,
248
+ .ro = 0x1,
249
+ },{ .name = "ADDR_ERROR_INT_EN", .addr = A_ADDR_ERROR_INT_EN,
250
+ .pre_write = addr_error_int_en_prew,
251
+ },{ .name = "ADDR_ERROR_INT_DIS", .addr = A_ADDR_ERROR_INT_DIS,
252
+ .pre_write = addr_error_int_dis_prew,
253
+ },{ .name = "CONTROL", .addr = A_CONTROL,
254
+ .reset = 0x1000000,
255
+ .rsvd = 0x70fffffe,
256
+ },{ .name = "SAFETY_CHK", .addr = A_SAFETY_CHK,
257
+ }
258
+};
259
+
260
+static void rtc_reset(DeviceState *dev)
261
+{
262
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(dev);
263
+ unsigned int i;
264
+
265
+ for (i = 0; i < ARRAY_SIZE(s->regs_info); ++i) {
266
+ register_reset(&s->regs_info[i]);
267
+ }
268
+
269
+ rtc_int_update_irq(s);
270
+ addr_error_int_update_irq(s);
271
+}
272
+
273
+static const MemoryRegionOps rtc_ops = {
274
+ .read = register_read_memory,
275
+ .write = register_write_memory,
276
+ .endianness = DEVICE_LITTLE_ENDIAN,
277
+ .valid = {
278
+ .min_access_size = 4,
279
+ .max_access_size = 4,
280
+ },
281
+};
282
+
283
+static void rtc_init(Object *obj)
284
+{
285
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(obj);
286
+ SysBusDevice *sbd = SYS_BUS_DEVICE(obj);
287
+ RegisterInfoArray *reg_array;
288
+
289
+ memory_region_init(&s->iomem, obj, TYPE_XLNX_ZYNQMP_RTC,
290
+ XLNX_ZYNQMP_RTC_R_MAX * 4);
291
+ reg_array =
292
+ register_init_block32(DEVICE(obj), rtc_regs_info,
293
+ ARRAY_SIZE(rtc_regs_info),
294
+ s->regs_info, s->regs,
295
+ &rtc_ops,
296
+ XLNX_ZYNQMP_RTC_ERR_DEBUG,
297
+ XLNX_ZYNQMP_RTC_R_MAX * 4);
298
+ memory_region_add_subregion(&s->iomem,
299
+ 0x0,
300
+ &reg_array->mem);
301
+ sysbus_init_mmio(sbd, &s->iomem);
302
+ sysbus_init_irq(sbd, &s->irq_rtc_int);
303
+ sysbus_init_irq(sbd, &s->irq_addr_error_int);
304
+}
305
+
306
+static const VMStateDescription vmstate_rtc = {
307
+ .name = TYPE_XLNX_ZYNQMP_RTC,
308
+ .version_id = 1,
309
+ .minimum_version_id = 1,
310
+ .fields = (VMStateField[]) {
311
+ VMSTATE_UINT32_ARRAY(regs, XlnxZynqMPRTC, XLNX_ZYNQMP_RTC_R_MAX),
312
+ VMSTATE_END_OF_LIST(),
313
+ }
314
+};
315
+
316
+static void rtc_class_init(ObjectClass *klass, void *data)
317
+{
318
+ DeviceClass *dc = DEVICE_CLASS(klass);
319
+
320
+ dc->reset = rtc_reset;
321
+ dc->vmsd = &vmstate_rtc;
322
+}
323
+
324
+static const TypeInfo rtc_info = {
325
+ .name = TYPE_XLNX_ZYNQMP_RTC,
326
+ .parent = TYPE_SYS_BUS_DEVICE,
327
+ .instance_size = sizeof(XlnxZynqMPRTC),
328
+ .class_init = rtc_class_init,
329
+ .instance_init = rtc_init,
330
+};
331
+
332
+static void rtc_register_types(void)
333
+{
334
+ type_register_static(&rtc_info);
335
+}
336
+
337
+type_init(rtc_register_types)
73
--
338
--
74
2.16.2
339
2.16.2
75
340
76
341
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Alistair Francis <alistair.francis@xilinx.com>
2
2
3
These use the generic float16_compare functionality which in turn uses
3
Allow the guest to determine the time set from the QEMU command line.
4
the common float_compare code from the softfloat re-factor.
5
4
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
This includes adding a trace event to debug the new time.
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
8
Message-id: 20180227143852.11175-11-alex.bennee@linaro.org
7
Signed-off-by: Alistair Francis <alistair.francis@xilinx.com>
8
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
9
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
11
---
11
target/arm/helper-a64.h | 5 +++++
12
include/hw/timer/xlnx-zynqmp-rtc.h | 2 ++
12
target/arm/helper-a64.c | 49 ++++++++++++++++++++++++++++++++++++++++++++++
13
hw/timer/xlnx-zynqmp-rtc.c | 58 ++++++++++++++++++++++++++++++++++++++
13
target/arm/translate-a64.c | 15 ++++++++++++++
14
hw/timer/trace-events | 3 ++
14
3 files changed, 69 insertions(+)
15
3 files changed, 63 insertions(+)
15
16
16
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
17
diff --git a/include/hw/timer/xlnx-zynqmp-rtc.h b/include/hw/timer/xlnx-zynqmp-rtc.h
17
index XXXXXXX..XXXXXXX 100644
18
index XXXXXXX..XXXXXXX 100644
18
--- a/target/arm/helper-a64.h
19
--- a/include/hw/timer/xlnx-zynqmp-rtc.h
19
+++ b/target/arm/helper-a64.h
20
+++ b/include/hw/timer/xlnx-zynqmp-rtc.h
20
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_addh, f16, f16, f16, ptr)
21
@@ -XXX,XX +XXX,XX @@ typedef struct XlnxZynqMPRTC {
21
DEF_HELPER_3(advsimd_subh, f16, f16, f16, ptr)
22
qemu_irq irq_rtc_int;
22
DEF_HELPER_3(advsimd_mulh, f16, f16, f16, ptr)
23
qemu_irq irq_addr_error_int;
23
DEF_HELPER_3(advsimd_divh, f16, f16, f16, ptr)
24
24
+DEF_HELPER_3(advsimd_ceq_f16, i32, f16, f16, ptr)
25
+ uint32_t tick_offset;
25
+DEF_HELPER_3(advsimd_cge_f16, i32, f16, f16, ptr)
26
+
26
+DEF_HELPER_3(advsimd_cgt_f16, i32, f16, f16, ptr)
27
uint32_t regs[XLNX_ZYNQMP_RTC_R_MAX];
27
+DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr)
28
RegisterInfo regs_info[XLNX_ZYNQMP_RTC_R_MAX];
28
+DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr)
29
} XlnxZynqMPRTC;
29
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
30
diff --git a/hw/timer/xlnx-zynqmp-rtc.c b/hw/timer/xlnx-zynqmp-rtc.c
30
index XXXXXXX..XXXXXXX 100644
31
index XXXXXXX..XXXXXXX 100644
31
--- a/target/arm/helper-a64.c
32
--- a/hw/timer/xlnx-zynqmp-rtc.c
32
+++ b/target/arm/helper-a64.c
33
+++ b/hw/timer/xlnx-zynqmp-rtc.c
33
@@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(min)
34
@@ -XXX,XX +XXX,XX @@
34
ADVSIMD_HALFOP(max)
35
#include "hw/register.h"
35
ADVSIMD_HALFOP(minnum)
36
#include "qemu/bitops.h"
36
ADVSIMD_HALFOP(maxnum)
37
#include "qemu/log.h"
37
+
38
+#include "hw/ptimer.h"
38
+/*
39
+#include "qemu/cutils.h"
39
+ * Floating point comparisons produce an integer result. Softfloat
40
+#include "sysemu/sysemu.h"
40
+ * routines return float_relation types which we convert to the 0/-1
41
+#include "trace.h"
41
+ * Neon requires.
42
#include "hw/timer/xlnx-zynqmp-rtc.h"
42
+ */
43
43
+
44
#ifndef XLNX_ZYNQMP_RTC_ERR_DEBUG
44
+#define ADVSIMD_CMPRES(test) (test) ? 0xffff : 0
45
@@ -XXX,XX +XXX,XX @@ static void addr_error_int_update_irq(XlnxZynqMPRTC *s)
45
+
46
qemu_set_irq(s->irq_addr_error_int, pending);
46
+uint32_t HELPER(advsimd_ceq_f16)(float16 a, float16 b, void *fpstp)
47
}
48
49
+static uint32_t rtc_get_count(XlnxZynqMPRTC *s)
47
+{
50
+{
48
+ float_status *fpst = fpstp;
51
+ int64_t now = qemu_clock_get_ns(rtc_clock);
49
+ int compare = float16_compare_quiet(a, b, fpst);
52
+ return s->tick_offset + now / NANOSECONDS_PER_SECOND;
50
+ return ADVSIMD_CMPRES(compare == float_relation_equal);
51
+}
53
+}
52
+
54
+
53
+uint32_t HELPER(advsimd_cge_f16)(float16 a, float16 b, void *fpstp)
55
+static uint64_t current_time_postr(RegisterInfo *reg, uint64_t val64)
54
+{
56
+{
55
+ float_status *fpst = fpstp;
57
+ XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
56
+ int compare = float16_compare(a, b, fpst);
58
+
57
+ return ADVSIMD_CMPRES(compare == float_relation_greater ||
59
+ return rtc_get_count(s);
58
+ compare == float_relation_equal);
59
+}
60
+}
60
+
61
+
61
+uint32_t HELPER(advsimd_cgt_f16)(float16 a, float16 b, void *fpstp)
62
static void rtc_int_status_postw(RegisterInfo *reg, uint64_t val64)
62
+{
63
{
63
+ float_status *fpst = fpstp;
64
XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(reg->opaque);
64
+ int compare = float16_compare(a, b, fpst);
65
@@ -XXX,XX +XXX,XX @@ static uint64_t addr_error_int_dis_prew(RegisterInfo *reg, uint64_t val64)
65
+ return ADVSIMD_CMPRES(compare == float_relation_greater);
66
67
static const RegisterAccessInfo rtc_regs_info[] = {
68
{ .name = "SET_TIME_WRITE", .addr = A_SET_TIME_WRITE,
69
+ .unimp = MAKE_64BIT_MASK(0, 32),
70
},{ .name = "SET_TIME_READ", .addr = A_SET_TIME_READ,
71
.ro = 0xffffffff,
72
+ .post_read = current_time_postr,
73
},{ .name = "CALIB_WRITE", .addr = A_CALIB_WRITE,
74
+ .unimp = MAKE_64BIT_MASK(0, 32),
75
},{ .name = "CALIB_READ", .addr = A_CALIB_READ,
76
.ro = 0x1fffff,
77
},{ .name = "CURRENT_TIME", .addr = A_CURRENT_TIME,
78
.ro = 0xffffffff,
79
+ .post_read = current_time_postr,
80
},{ .name = "CURRENT_TICK", .addr = A_CURRENT_TICK,
81
.ro = 0xffff,
82
},{ .name = "ALARM", .addr = A_ALARM,
83
@@ -XXX,XX +XXX,XX @@ static void rtc_init(Object *obj)
84
XlnxZynqMPRTC *s = XLNX_ZYNQMP_RTC(obj);
85
SysBusDevice *sbd = SYS_BUS_DEVICE(obj);
86
RegisterInfoArray *reg_array;
87
+ struct tm current_tm;
88
89
memory_region_init(&s->iomem, obj, TYPE_XLNX_ZYNQMP_RTC,
90
XLNX_ZYNQMP_RTC_R_MAX * 4);
91
@@ -XXX,XX +XXX,XX @@ static void rtc_init(Object *obj)
92
sysbus_init_mmio(sbd, &s->iomem);
93
sysbus_init_irq(sbd, &s->irq_rtc_int);
94
sysbus_init_irq(sbd, &s->irq_addr_error_int);
95
+
96
+ qemu_get_timedate(&current_tm, 0);
97
+ s->tick_offset = mktimegm(&current_tm) -
98
+ qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND;
99
+
100
+ trace_xlnx_zynqmp_rtc_gettime(current_tm.tm_year, current_tm.tm_mon,
101
+ current_tm.tm_mday, current_tm.tm_hour,
102
+ current_tm.tm_min, current_tm.tm_sec);
66
+}
103
+}
67
+
104
+
68
+uint32_t HELPER(advsimd_acge_f16)(float16 a, float16 b, void *fpstp)
105
+static int rtc_pre_save(void *opaque)
69
+{
106
+{
70
+ float_status *fpst = fpstp;
107
+ XlnxZynqMPRTC *s = opaque;
71
+ float16 f0 = float16_abs(a);
108
+ int64_t now = qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND;
72
+ float16 f1 = float16_abs(b);
109
+
73
+ int compare = float16_compare(f0, f1, fpst);
110
+ /* Add the time at migration */
74
+ return ADVSIMD_CMPRES(compare == float_relation_greater ||
111
+ s->tick_offset = s->tick_offset + now;
75
+ compare == float_relation_equal);
112
+
113
+ return 0;
76
+}
114
+}
77
+
115
+
78
+uint32_t HELPER(advsimd_acgt_f16)(float16 a, float16 b, void *fpstp)
116
+static int rtc_post_load(void *opaque, int version_id)
79
+{
117
+{
80
+ float_status *fpst = fpstp;
118
+ XlnxZynqMPRTC *s = opaque;
81
+ float16 f0 = float16_abs(a);
119
+ int64_t now = qemu_clock_get_ns(rtc_clock) / NANOSECONDS_PER_SECOND;
82
+ float16 f1 = float16_abs(b);
120
+
83
+ int compare = float16_compare(f0, f1, fpst);
121
+ /* Subtract the time after migration. This combined with the pre_save
84
+ return ADVSIMD_CMPRES(compare == float_relation_greater);
122
+ * action results in us having subtracted the time that the guest was
85
+}
123
+ * stopped to the offset.
86
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
124
+ */
125
+ s->tick_offset = s->tick_offset - now;
126
+
127
+ return 0;
128
}
129
130
static const VMStateDescription vmstate_rtc = {
131
.name = TYPE_XLNX_ZYNQMP_RTC,
132
.version_id = 1,
133
.minimum_version_id = 1,
134
+ .pre_save = rtc_pre_save,
135
+ .post_load = rtc_post_load,
136
.fields = (VMStateField[]) {
137
VMSTATE_UINT32_ARRAY(regs, XlnxZynqMPRTC, XLNX_ZYNQMP_RTC_R_MAX),
138
+ VMSTATE_UINT32(tick_offset, XlnxZynqMPRTC),
139
VMSTATE_END_OF_LIST(),
140
}
141
};
142
diff --git a/hw/timer/trace-events b/hw/timer/trace-events
87
index XXXXXXX..XXXXXXX 100644
143
index XXXXXXX..XXXXXXX 100644
88
--- a/target/arm/translate-a64.c
144
--- a/hw/timer/trace-events
89
+++ b/target/arm/translate-a64.c
145
+++ b/hw/timer/trace-events
90
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
146
@@ -XXX,XX +XXX,XX @@ systick_write(uint64_t addr, uint32_t value, unsigned size) "systick write addr
91
case 0x2: /* FADD */
147
cmsdk_apb_timer_read(uint64_t offset, uint64_t data, unsigned size) "CMSDK APB timer read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u"
92
gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
148
cmsdk_apb_timer_write(uint64_t offset, uint64_t data, unsigned size) "CMSDK APB timer write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u"
93
break;
149
cmsdk_apb_timer_reset(void) "CMSDK APB timer: reset"
94
+ case 0x4: /* FCMEQ */
150
+
95
+ gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst);
151
+# hw/timer/xlnx-zynqmp-rtc.c
96
+ break;
152
+xlnx_zynqmp_rtc_gettime(int year, int month, int day, int hour, int min, int sec) "Get time from host: %d-%d-%d %2d:%02d:%02d"
97
case 0x6: /* FMAX */
98
gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
99
break;
100
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
101
case 0x13: /* FMUL */
102
gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst);
103
break;
104
+ case 0x14: /* FCMGE */
105
+ gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
106
+ break;
107
+ case 0x15: /* FACGE */
108
+ gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
109
+ break;
110
case 0x17: /* FDIV */
111
gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst);
112
break;
113
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
114
gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
115
tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff);
116
break;
117
+ case 0x1c: /* FCMGT */
118
+ gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
119
+ break;
120
+ case 0x1d: /* FACGT */
121
+ gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
122
+ break;
123
default:
124
fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n",
125
__func__, insn, fpopcode, s->pc);
126
--
153
--
127
2.16.2
154
2.16.2
128
155
129
156
diff view generated by jsdifflib
1
From: Alistair Francis <alistair.francis@xilinx.com>
1
From: Alistair Francis <alistair.francis@xilinx.com>
2
2
3
Ensure that the post write hook is called during reset. This allows us
4
to rely on the post write functions instead of having to call them from
5
the reset() function.
6
7
Signed-off-by: Alistair Francis <alistair.francis@xilinx.com>
3
Signed-off-by: Alistair Francis <alistair.francis@xilinx.com>
4
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
8
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
5
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
9
Message-id: d131e24b911653a945e46ca2d8f90f572469e1dd.1517856214.git.alistair.francis@xilinx.com
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
7
---
12
include/hw/register.h | 6 +++---
8
include/hw/arm/xlnx-zynqmp.h | 2 ++
13
hw/core/register.c | 8 ++++++++
9
hw/arm/xlnx-zynqmp.c | 14 ++++++++++++++
14
2 files changed, 11 insertions(+), 3 deletions(-)
10
2 files changed, 16 insertions(+)
15
11
16
diff --git a/include/hw/register.h b/include/hw/register.h
12
diff --git a/include/hw/arm/xlnx-zynqmp.h b/include/hw/arm/xlnx-zynqmp.h
17
index XXXXXXX..XXXXXXX 100644
13
index XXXXXXX..XXXXXXX 100644
18
--- a/include/hw/register.h
14
--- a/include/hw/arm/xlnx-zynqmp.h
19
+++ b/include/hw/register.h
15
+++ b/include/hw/arm/xlnx-zynqmp.h
20
@@ -XXX,XX +XXX,XX @@ typedef struct RegisterInfoArray RegisterInfoArray;
16
@@ -XXX,XX +XXX,XX @@
21
* immediately before the actual write. The returned value is what is written,
17
#include "hw/dma/xlnx_dpdma.h"
22
* giving the handler a chance to modify the written value.
18
#include "hw/display/xlnx_dp.h"
23
* @post_write: Post write callback. Passed the written value. Most write side
19
#include "hw/intc/xlnx-zynqmp-ipi.h"
24
- * effects should be implemented here.
20
+#include "hw/timer/xlnx-zynqmp-rtc.h"
25
+ * effects should be implemented here. This is called during device reset.
21
26
*
22
#define TYPE_XLNX_ZYNQMP "xlnx,zynqmp"
27
* @post_read: Post read callback. Passes the value that is about to be returned
23
#define XLNX_ZYNQMP(obj) OBJECT_CHECK(XlnxZynqMPState, (obj), \
28
* for a read. The return value from this function is what is ultimately read,
24
@@ -XXX,XX +XXX,XX @@ typedef struct XlnxZynqMPState {
29
@@ -XXX,XX +XXX,XX @@ uint64_t register_read(RegisterInfo *reg, uint64_t re, const char* prefix,
25
XlnxDPState dp;
30
bool debug);
26
XlnxDPDMAState dpdma;
31
27
XlnxZynqMPIPI ipi;
32
/**
28
+ XlnxZynqMPRTC rtc;
33
- * reset a register
29
34
- * @reg: register to reset
30
char *boot_cpu;
35
+ * Resets a register. This will also call the post_write hook if it exists.
31
ARMCPU *boot_cpu_ptr;
36
+ * @reg: The register to reset.
32
diff --git a/hw/arm/xlnx-zynqmp.c b/hw/arm/xlnx-zynqmp.c
37
*/
38
39
void register_reset(RegisterInfo *reg);
40
diff --git a/hw/core/register.c b/hw/core/register.c
41
index XXXXXXX..XXXXXXX 100644
33
index XXXXXXX..XXXXXXX 100644
42
--- a/hw/core/register.c
34
--- a/hw/arm/xlnx-zynqmp.c
43
+++ b/hw/core/register.c
35
+++ b/hw/arm/xlnx-zynqmp.c
44
@@ -XXX,XX +XXX,XX @@ uint64_t register_read(RegisterInfo *reg, uint64_t re, const char* prefix,
36
@@ -XXX,XX +XXX,XX @@
45
37
#define IPI_ADDR 0xFF300000
46
void register_reset(RegisterInfo *reg)
38
#define IPI_IRQ 64
47
{
39
48
+ const RegisterAccessInfo *ac;
40
+#define RTC_ADDR 0xffa60000
41
+#define RTC_IRQ 26
49
+
42
+
50
g_assert(reg);
43
#define SDHCI_CAPABILITIES 0x280737ec6481 /* Datasheet: UG1085 (v1.7) */
51
44
52
if (!reg->data || !reg->access) {
45
static const uint64_t gem_addr[XLNX_ZYNQMP_NUM_GEMS] = {
53
return;
46
@@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_init(Object *obj)
47
48
object_initialize(&s->ipi, sizeof(s->ipi), TYPE_XLNX_ZYNQMP_IPI);
49
qdev_set_parent_bus(DEVICE(&s->ipi), sysbus_get_default());
50
+
51
+ object_initialize(&s->rtc, sizeof(s->rtc), TYPE_XLNX_ZYNQMP_RTC);
52
+ qdev_set_parent_bus(DEVICE(&s->rtc), sysbus_get_default());
53
}
54
55
static void xlnx_zynqmp_realize(DeviceState *dev, Error **errp)
56
@@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_realize(DeviceState *dev, Error **errp)
54
}
57
}
55
58
sysbus_mmio_map(SYS_BUS_DEVICE(&s->ipi), 0, IPI_ADDR);
56
+ ac = reg->access;
59
sysbus_connect_irq(SYS_BUS_DEVICE(&s->ipi), 0, gic_spi[IPI_IRQ]);
57
+
60
+
58
register_write_val(reg, reg->access->reset);
61
+ object_property_set_bool(OBJECT(&s->rtc), true, "realized", &err);
59
+
62
+ if (err) {
60
+ if (ac->post_write) {
63
+ error_propagate(errp, err);
61
+ ac->post_write(reg, reg->access->reset);
64
+ return;
62
+ }
65
+ }
66
+ sysbus_mmio_map(SYS_BUS_DEVICE(&s->rtc), 0, RTC_ADDR);
67
+ sysbus_connect_irq(SYS_BUS_DEVICE(&s->rtc), 0, gic_spi[RTC_IRQ]);
63
}
68
}
64
69
65
void register_init(RegisterInfo *reg)
70
static Property xlnx_zynqmp_props[] = {
66
--
71
--
67
2.16.2
72
2.16.2
68
73
69
74
diff view generated by jsdifflib
Deleted patch
1
From: Francisco Iglesias <frasse.iglesias@gmail.com>
2
1
3
Assert only the lower cs on bus 0 and upper cs on bus 1 when both buses and
4
chip selects are enabled (e.g reading/writing with stripe).
5
6
Signed-off-by: Francisco Iglesias <frasse.iglesias@gmail.com>
7
Reviewed-by: Alistair Francis <alistair.francis@xilinx.com>
8
Tested-by: Alistair Francis <alistair.francis@xilinx.com>
9
Message-id: 20180223232233.31482-2-frasse.iglesias@gmail.com
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
12
hw/ssi/xilinx_spips.c | 41 +++++++++++++++++++++++++++++++++++++----
13
1 file changed, 37 insertions(+), 4 deletions(-)
14
15
diff --git a/hw/ssi/xilinx_spips.c b/hw/ssi/xilinx_spips.c
16
index XXXXXXX..XXXXXXX 100644
17
--- a/hw/ssi/xilinx_spips.c
18
+++ b/hw/ssi/xilinx_spips.c
19
@@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs(XilinxSPIPS *s, int field)
20
{
21
int i;
22
23
- for (i = 0; i < s->num_cs; i++) {
24
+ for (i = 0; i < s->num_cs * s->num_busses; i++) {
25
bool old_state = s->cs_lines_state[i];
26
bool new_state = field & (1 << i);
27
28
@@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs(XilinxSPIPS *s, int field)
29
}
30
qemu_set_irq(s->cs_lines[i], !new_state);
31
}
32
- if (!(field & ((1 << s->num_cs) - 1))) {
33
+ if (!(field & ((1 << (s->num_cs * s->num_busses)) - 1))) {
34
s->snoop_state = SNOOP_CHECKING;
35
s->cmd_dummies = 0;
36
s->link_state = 1;
37
@@ -XXX,XX +XXX,XX @@ static void xlnx_zynqmp_qspips_update_cs_lines(XlnxZynqMPQSPIPS *s)
38
{
39
if (s->regs[R_GQSPI_GF_SNAPSHOT]) {
40
int field = ARRAY_FIELD_EX32(s->regs, GQSPI_GF_SNAPSHOT, CHIP_SELECT);
41
- xilinx_spips_update_cs(XILINX_SPIPS(s), field);
42
+ bool upper_cs_sel = field & (1 << 1);
43
+ bool lower_cs_sel = field & 1;
44
+ bool bus0_enabled;
45
+ bool bus1_enabled;
46
+ uint8_t buses;
47
+ int cs = 0;
48
+
49
+ buses = ARRAY_FIELD_EX32(s->regs, GQSPI_GF_SNAPSHOT, DATA_BUS_SELECT);
50
+ bus0_enabled = buses & 1;
51
+ bus1_enabled = buses & (1 << 1);
52
+
53
+ if (bus0_enabled && bus1_enabled) {
54
+ if (lower_cs_sel) {
55
+ cs |= 1;
56
+ }
57
+ if (upper_cs_sel) {
58
+ cs |= 1 << 3;
59
+ }
60
+ } else if (bus0_enabled) {
61
+ if (lower_cs_sel) {
62
+ cs |= 1;
63
+ }
64
+ if (upper_cs_sel) {
65
+ cs |= 1 << 1;
66
+ }
67
+ } else if (bus1_enabled) {
68
+ if (lower_cs_sel) {
69
+ cs |= 1 << 2;
70
+ }
71
+ if (upper_cs_sel) {
72
+ cs |= 1 << 3;
73
+ }
74
+ }
75
+ xilinx_spips_update_cs(XILINX_SPIPS(s), cs);
76
}
77
}
78
79
@@ -XXX,XX +XXX,XX @@ static void xilinx_spips_update_cs_lines(XilinxSPIPS *s)
80
if (num_effective_busses(s) == 2) {
81
/* Single bit chip-select for qspi */
82
field &= 0x1;
83
- field |= field << 1;
84
+ field |= field << 3;
85
/* Dual stack U-Page */
86
} else if (s->regs[R_LQSPI_CFG] & LQSPI_CFG_TWO_MEM &&
87
s->regs[R_LQSPI_STS] & LQSPI_CFG_U_PAGE) {
88
--
89
2.16.2
90
91
diff view generated by jsdifflib
Deleted patch
1
From: Francisco Iglesias <frasse.iglesias@gmail.com>
2
1
3
Use 8 dummy cycles (4 dummy bytes) with the QIOR/QIOR4 commands in legacy mode
4
for matching what is expected by Micron (Numonyx) flashes (the default target
5
flash type of the QSPI).
6
7
Signed-off-by: Francisco Iglesias <frasse.iglesias@gmail.com>
8
Tested-by: Alistair Francis <alistair.francis@xilinx.com>
9
Reviewed-by: Alistair Francis <alistair.francis@xilinx.com>
10
Message-id: 20180223232233.31482-3-frasse.iglesias@gmail.com
11
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
12
---
13
hw/ssi/xilinx_spips.c | 2 +-
14
1 file changed, 1 insertion(+), 1 deletion(-)
15
16
diff --git a/hw/ssi/xilinx_spips.c b/hw/ssi/xilinx_spips.c
17
index XXXXXXX..XXXXXXX 100644
18
--- a/hw/ssi/xilinx_spips.c
19
+++ b/hw/ssi/xilinx_spips.c
20
@@ -XXX,XX +XXX,XX @@ static int xilinx_spips_num_dummies(XilinxQSPIPS *qs, uint8_t command)
21
return 2;
22
case QIOR:
23
case QIOR_4:
24
- return 5;
25
+ return 4;
26
default:
27
return -1;
28
}
29
--
30
2.16.2
31
32
diff view generated by jsdifflib
Deleted patch
1
From: Corey Minyard <cminyard@mvista.com>
2
1
3
Signed-off-by: Corey Minyard <cminyard@mvista.com>
4
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
5
Signed-off-by: Linus Walleij <linus.walleij@linaro.org>
6
Message-id: 20180227104903.21353-2-linus.walleij@linaro.org
7
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
---
9
include/hw/i2c/i2c.h | 6 ++----
10
hw/i2c/core.c | 3 +--
11
2 files changed, 3 insertions(+), 6 deletions(-)
12
13
diff --git a/include/hw/i2c/i2c.h b/include/hw/i2c/i2c.h
14
index XXXXXXX..XXXXXXX 100644
15
--- a/include/hw/i2c/i2c.h
16
+++ b/include/hw/i2c/i2c.h
17
@@ -XXX,XX +XXX,XX @@ typedef struct I2CSlave I2CSlave;
18
#define I2C_SLAVE_GET_CLASS(obj) \
19
OBJECT_GET_CLASS(I2CSlaveClass, (obj), TYPE_I2C_SLAVE)
20
21
-typedef struct I2CSlaveClass
22
-{
23
+typedef struct I2CSlaveClass {
24
DeviceClass parent_class;
25
26
/* Callbacks provided by the device. */
27
@@ -XXX,XX +XXX,XX @@ typedef struct I2CSlaveClass
28
int (*event)(I2CSlave *s, enum i2c_event event);
29
} I2CSlaveClass;
30
31
-struct I2CSlave
32
-{
33
+struct I2CSlave {
34
DeviceState qdev;
35
36
/* Remaining fields for internal use by the I2C code. */
37
diff --git a/hw/i2c/core.c b/hw/i2c/core.c
38
index XXXXXXX..XXXXXXX 100644
39
--- a/hw/i2c/core.c
40
+++ b/hw/i2c/core.c
41
@@ -XXX,XX +XXX,XX @@ struct I2CNode {
42
43
#define I2C_BROADCAST 0x00
44
45
-struct I2CBus
46
-{
47
+struct I2CBus {
48
BusState qbus;
49
QLIST_HEAD(, I2CNode) current_devs;
50
uint8_t saved_address;
51
--
52
2.16.2
53
54
diff view generated by jsdifflib
1
From: Linus Walleij <linus.walleij@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
The tx function of the DDC I2C slave emulation was returning 1
3
Allow the translate subroutines to return false for invalid insns.
4
on all writes resulting in NACK in the I2C bus. Changing it to
5
0 makes the DDC I2C work fine with bit-banged I2C such as the
6
versatile I2C.
7
4
8
I guess it was not affecting whatever I2C controller this was
5
At present we can of course invoke an invalid insn exception from within
9
used with until now, but with the Versatile I2C it surely
6
the translate subroutine, but in the short term this consolidates code.
10
does not work.
7
In the long term it would allow the decodetree language to support
8
overlapping patterns for ISA extensions.
11
9
10
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
11
Message-id: 20180227232618.2908-1-richard.henderson@linaro.org
12
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
12
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
13
Signed-off-by: Linus Walleij <linus.walleij@linaro.org>
14
Message-id: 20180227104903.21353-4-linus.walleij@linaro.org
15
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
16
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
13
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
17
---
14
---
18
hw/i2c/i2c-ddc.c | 4 ++--
15
scripts/decodetree.py | 5 ++---
19
1 file changed, 2 insertions(+), 2 deletions(-)
16
1 file changed, 2 insertions(+), 3 deletions(-)
20
17
21
diff --git a/hw/i2c/i2c-ddc.c b/hw/i2c/i2c-ddc.c
18
diff --git a/scripts/decodetree.py b/scripts/decodetree.py
22
index XXXXXXX..XXXXXXX 100644
19
index XXXXXXX..XXXXXXX 100755
23
--- a/hw/i2c/i2c-ddc.c
20
--- a/scripts/decodetree.py
24
+++ b/hw/i2c/i2c-ddc.c
21
+++ b/scripts/decodetree.py
25
@@ -XXX,XX +XXX,XX @@ static int i2c_ddc_tx(I2CSlave *i2c, uint8_t data)
22
@@ -XXX,XX +XXX,XX @@ class Pattern(General):
26
s->reg = data;
23
global translate_prefix
27
s->firstbyte = false;
24
output('typedef ', self.base.base.struct_name(),
28
DPRINTF("[EDID] Written new pointer: %u\n", data);
25
' arg_', self.name, ';\n')
29
- return 1;
26
- output(translate_scope, 'void ', translate_prefix, '_', self.name,
30
+ return 0;
27
+ output(translate_scope, 'bool ', translate_prefix, '_', self.name,
31
}
28
'(DisasContext *ctx, arg_', self.name,
32
29
' *a, ', insntype, ' insn);\n')
33
/* Ignore all writes */
30
34
s->reg++;
31
@@ -XXX,XX +XXX,XX @@ class Pattern(General):
35
- return 1;
32
output(ind, self.base.extract_name(), '(&u.f_', arg, ', insn);\n')
36
+ return 0;
33
for n, f in self.fields.items():
37
}
34
output(ind, 'u.f_', arg, '.', n, ' = ', f.str_extract(), ';\n')
38
35
- output(ind, translate_prefix, '_', self.name,
39
static void i2c_ddc_init(Object *obj)
36
+ output(ind, 'return ', translate_prefix, '_', self.name,
37
'(ctx, &u.f_', arg, ', insn);\n')
38
- output(ind, 'return true;\n')
39
# end Pattern
40
41
40
--
42
--
41
2.16.2
43
2.16.2
42
44
43
45
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Add a function load_ramdisk_as() which behaves like the existing
2
load_ramdisk() but allows the caller to specify the AddressSpace
3
to use. This matches the pattern we have already for various
4
other loader functions.
2
5
3
A bunch of the vectorised bitwise operations just operate on larger
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
chunks at a time. We can do the same for the new half-precision
7
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
5
operations by introducing some TWOHALFOP helpers which work on each
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
half of a pair of half-precision operations at once.
9
Message-id: 20180220180325.29818-2-peter.maydell@linaro.org
10
---
11
include/hw/loader.h | 12 +++++++++++-
12
hw/core/loader.c | 8 +++++++-
13
2 files changed, 18 insertions(+), 2 deletions(-)
7
14
8
Hopefully all this hoop jumping will get simpler once we have
15
diff --git a/include/hw/loader.h b/include/hw/loader.h
9
generically vectorised helpers here.
10
11
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
12
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
13
Message-id: 20180227143852.11175-16-alex.bennee@linaro.org
14
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
15
---
16
target/arm/helper-a64.h | 10 ++++++++++
17
target/arm/helper-a64.c | 46 +++++++++++++++++++++++++++++++++++++++++++++-
18
target/arm/translate-a64.c | 26 +++++++++++++++++++++-----
19
3 files changed, 76 insertions(+), 6 deletions(-)
20
21
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
22
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
23
--- a/target/arm/helper-a64.h
17
--- a/include/hw/loader.h
24
+++ b/target/arm/helper-a64.h
18
+++ b/include/hw/loader.h
25
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr)
19
@@ -XXX,XX +XXX,XX @@ int load_uimage(const char *filename, hwaddr *ep,
26
DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr)
20
void *translate_opaque);
27
DEF_HELPER_3(advsimd_mulxh, f16, f16, f16, ptr)
21
28
DEF_HELPER_4(advsimd_muladdh, f16, f16, f16, f16, ptr)
22
/**
29
+DEF_HELPER_3(advsimd_add2h, i32, i32, i32, ptr)
23
- * load_ramdisk:
30
+DEF_HELPER_3(advsimd_sub2h, i32, i32, i32, ptr)
24
+ * load_ramdisk_as:
31
+DEF_HELPER_3(advsimd_mul2h, i32, i32, i32, ptr)
25
* @filename: Path to the ramdisk image
32
+DEF_HELPER_3(advsimd_div2h, i32, i32, i32, ptr)
26
* @addr: Memory address to load the ramdisk to
33
+DEF_HELPER_3(advsimd_max2h, i32, i32, i32, ptr)
27
* @max_sz: Maximum allowed ramdisk size (for non-u-boot ramdisks)
34
+DEF_HELPER_3(advsimd_min2h, i32, i32, i32, ptr)
28
+ * @as: The AddressSpace to load the ELF to. The value of address_space_memory
35
+DEF_HELPER_3(advsimd_maxnum2h, i32, i32, i32, ptr)
29
+ * is used if nothing is supplied here.
36
+DEF_HELPER_3(advsimd_minnum2h, i32, i32, i32, ptr)
30
*
37
+DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr)
31
* Load a ramdisk image with U-Boot header to the specified memory
38
+DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr)
32
* address.
39
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
33
*
34
* Returns the size of the loaded image on success, -1 otherwise.
35
*/
36
+int load_ramdisk_as(const char *filename, hwaddr addr, uint64_t max_sz,
37
+ AddressSpace *as);
38
+
39
+/**
40
+ * load_ramdisk:
41
+ * Same as load_ramdisk_as(), but doesn't allow the caller to specify
42
+ * an AddressSpace.
43
+ */
44
int load_ramdisk(const char *filename, hwaddr addr, uint64_t max_sz);
45
46
ssize_t gunzip(void *dst, size_t dstlen, uint8_t *src, size_t srclen);
47
diff --git a/hw/core/loader.c b/hw/core/loader.c
40
index XXXXXXX..XXXXXXX 100644
48
index XXXXXXX..XXXXXXX 100644
41
--- a/target/arm/helper-a64.c
49
--- a/hw/core/loader.c
42
+++ b/target/arm/helper-a64.c
50
+++ b/hw/core/loader.c
43
@@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(max)
51
@@ -XXX,XX +XXX,XX @@ int load_uimage_as(const char *filename, hwaddr *ep, hwaddr *loadaddr,
44
ADVSIMD_HALFOP(minnum)
52
45
ADVSIMD_HALFOP(maxnum)
53
/* Load a ramdisk. */
46
54
int load_ramdisk(const char *filename, hwaddr addr, uint64_t max_sz)
47
+#define ADVSIMD_TWOHALFOP(name) \
55
+{
48
+uint32_t ADVSIMD_HELPER(name, 2h)(uint32_t two_a, uint32_t two_b, void *fpstp) \
56
+ return load_ramdisk_as(filename, addr, max_sz, NULL);
49
+{ \
50
+ float16 a1, a2, b1, b2; \
51
+ uint32_t r1, r2; \
52
+ float_status *fpst = fpstp; \
53
+ a1 = extract32(two_a, 0, 16); \
54
+ a2 = extract32(two_a, 16, 16); \
55
+ b1 = extract32(two_b, 0, 16); \
56
+ b2 = extract32(two_b, 16, 16); \
57
+ r1 = float16_ ## name(a1, b1, fpst); \
58
+ r2 = float16_ ## name(a2, b2, fpst); \
59
+ return deposit32(r1, 16, 16, r2); \
60
+}
57
+}
61
+
58
+
62
+ADVSIMD_TWOHALFOP(add)
59
+int load_ramdisk_as(const char *filename, hwaddr addr, uint64_t max_sz,
63
+ADVSIMD_TWOHALFOP(sub)
60
+ AddressSpace *as)
64
+ADVSIMD_TWOHALFOP(mul)
65
+ADVSIMD_TWOHALFOP(div)
66
+ADVSIMD_TWOHALFOP(min)
67
+ADVSIMD_TWOHALFOP(max)
68
+ADVSIMD_TWOHALFOP(minnum)
69
+ADVSIMD_TWOHALFOP(maxnum)
70
+
71
/* Data processing - scalar floating-point and advanced SIMD */
72
-float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp)
73
+static float16 float16_mulx(float16 a, float16 b, void *fpstp)
74
{
61
{
75
float_status *fpst = fpstp;
62
return load_uboot_image(filename, NULL, &addr, NULL, IH_TYPE_RAMDISK,
76
63
- NULL, NULL, NULL);
77
@@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp)
64
+ NULL, NULL, as);
78
return float16_mul(a, b, fpst);
79
}
65
}
80
66
81
+ADVSIMD_HALFOP(mulx)
67
/* Load a gzip-compressed kernel to a dynamically allocated buffer. */
82
+ADVSIMD_TWOHALFOP(mulx)
83
+
84
/* fused multiply-accumulate */
85
float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp)
86
{
87
@@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp)
88
return float16_muladd(a, b, c, 0, fpst);
89
}
90
91
+uint32_t HELPER(advsimd_muladd2h)(uint32_t two_a, uint32_t two_b,
92
+ uint32_t two_c, void *fpstp)
93
+{
94
+ float_status *fpst = fpstp;
95
+ float16 a1, a2, b1, b2, c1, c2;
96
+ uint32_t r1, r2;
97
+ a1 = extract32(two_a, 0, 16);
98
+ a2 = extract32(two_a, 16, 16);
99
+ b1 = extract32(two_b, 0, 16);
100
+ b2 = extract32(two_b, 16, 16);
101
+ c1 = extract32(two_c, 0, 16);
102
+ c2 = extract32(two_c, 16, 16);
103
+ r1 = float16_muladd(a1, b1, c1, 0, fpst);
104
+ r2 = float16_muladd(a2, b2, c2, 0, fpst);
105
+ return deposit32(r1, 16, 16, r2);
106
+}
107
+
108
/*
109
* Floating point comparisons produce an integer result. Softfloat
110
* routines return float_relation types which we convert to the 0/-1
111
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
112
index XXXXXXX..XXXXXXX 100644
113
--- a/target/arm/translate-a64.c
114
+++ b/target/arm/translate-a64.c
115
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
116
* multiply-add */
117
tcg_gen_xori_i32(tcg_op, tcg_op, 0x80008000);
118
}
119
- gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx,
120
- tcg_res, fpst);
121
+ if (is_scalar) {
122
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx,
123
+ tcg_res, fpst);
124
+ } else {
125
+ gen_helper_advsimd_muladd2h(tcg_res, tcg_op, tcg_idx,
126
+ tcg_res, fpst);
127
+ }
128
break;
129
case 2:
130
if (opcode == 0x5) {
131
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
132
switch (size) {
133
case 1:
134
if (u) {
135
- gen_helper_advsimd_mulxh(tcg_res, tcg_op, tcg_idx,
136
- fpst);
137
+ if (is_scalar) {
138
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op,
139
+ tcg_idx, fpst);
140
+ } else {
141
+ gen_helper_advsimd_mulx2h(tcg_res, tcg_op,
142
+ tcg_idx, fpst);
143
+ }
144
} else {
145
- g_assert_not_reached();
146
+ if (is_scalar) {
147
+ gen_helper_advsimd_mulh(tcg_res, tcg_op,
148
+ tcg_idx, fpst);
149
+ } else {
150
+ gen_helper_advsimd_mul2h(tcg_res, tcg_op,
151
+ tcg_idx, fpst);
152
+ }
153
}
154
break;
155
case 2:
156
--
68
--
157
2.16.2
69
2.16.2
158
70
159
71
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Instead of loading kernels, device trees, and the like to
2
the system address space, use the CPU's address space. This
3
is important if we're trying to load the file to memory or
4
via an alias memory region that is provided by an SoC
5
object and thus not mapped into the system address space.
2
6
3
Much like recpe the ARM ARM has simplified the pseudo code for the
7
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
calculation which is done on a fixed point 9 bit integer maths. So
8
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
5
while adding f16 we can also clean this up to be a little less heavy
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
on the floating point and just return the fractional part and leave
10
Message-id: 20180220180325.29818-3-peter.maydell@linaro.org
7
the calle's to do the final packing of the result.
11
---
12
hw/arm/boot.c | 119 +++++++++++++++++++++++++++++++++++++---------------------
13
1 file changed, 76 insertions(+), 43 deletions(-)
8
14
9
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
15
diff --git a/hw/arm/boot.c b/hw/arm/boot.c
10
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
11
Message-id: 20180227143852.11175-27-alex.bennee@linaro.org
12
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
13
---
14
target/arm/helper.h | 1 +
15
target/arm/helper.c | 221 ++++++++++++++++++++++++----------------------------
16
2 files changed, 104 insertions(+), 118 deletions(-)
17
18
diff --git a/target/arm/helper.h b/target/arm/helper.h
19
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/helper.h
17
--- a/hw/arm/boot.c
21
+++ b/target/arm/helper.h
18
+++ b/hw/arm/boot.c
22
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(rsqrts_f32, f32, f32, f32, env)
19
@@ -XXX,XX +XXX,XX @@
23
DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr)
20
#define ARM64_TEXT_OFFSET_OFFSET 8
24
DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr)
21
#define ARM64_MAGIC_OFFSET 56
25
DEF_HELPER_FLAGS_2(recpe_f64, TCG_CALL_NO_RWG, f64, f64, ptr)
22
26
+DEF_HELPER_FLAGS_2(rsqrte_f16, TCG_CALL_NO_RWG, f16, f16, ptr)
23
+static AddressSpace *arm_boot_address_space(ARMCPU *cpu,
27
DEF_HELPER_FLAGS_2(rsqrte_f32, TCG_CALL_NO_RWG, f32, f32, ptr)
24
+ const struct arm_boot_info *info)
28
DEF_HELPER_FLAGS_2(rsqrte_f64, TCG_CALL_NO_RWG, f64, f64, ptr)
25
+{
29
DEF_HELPER_2(recpe_u32, i32, i32, ptr)
26
+ /* Return the address space to use for bootloader reads and writes.
30
diff --git a/target/arm/helper.c b/target/arm/helper.c
27
+ * We prefer the secure address space if the CPU has it and we're
31
index XXXXXXX..XXXXXXX 100644
28
+ * going to boot the guest into it.
32
--- a/target/arm/helper.c
29
+ */
33
+++ b/target/arm/helper.c
30
+ int asidx;
34
@@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp)
31
+ CPUState *cs = CPU(cpu);
35
/* The algorithm that must be used to calculate the estimate
36
* is specified by the ARM ARM.
37
*/
38
-static float64 recip_sqrt_estimate(float64 a, float_status *real_fp_status)
39
+
32
+
40
+static int do_recip_sqrt_estimate(int a)
33
+ if (arm_feature(&cpu->env, ARM_FEATURE_EL3) && info->secure_boot) {
41
{
34
+ asidx = ARMASIdx_S;
42
- /* These calculations mustn't set any fp exception flags,
35
+ } else {
43
- * so we use a local copy of the fp_status.
36
+ asidx = ARMASIdx_NS;
44
- */
45
- float_status dummy_status = *real_fp_status;
46
- float_status *s = &dummy_status;
47
- float64 q;
48
- int64_t q_int;
49
+ int b, estimate;
50
51
- if (float64_lt(a, float64_half, s)) {
52
- /* range 0.25 <= a < 0.5 */
53
-
54
- /* a in units of 1/512 rounded down */
55
- /* q0 = (int)(a * 512.0); */
56
- q = float64_mul(float64_512, a, s);
57
- q_int = float64_to_int64_round_to_zero(q, s);
58
-
59
- /* reciprocal root r */
60
- /* r = 1.0 / sqrt(((double)q0 + 0.5) / 512.0); */
61
- q = int64_to_float64(q_int, s);
62
- q = float64_add(q, float64_half, s);
63
- q = float64_div(q, float64_512, s);
64
- q = float64_sqrt(q, s);
65
- q = float64_div(float64_one, q, s);
66
+ assert(128 <= a && a < 512);
67
+ if (a < 256) {
68
+ a = a * 2 + 1;
69
} else {
70
- /* range 0.5 <= a < 1.0 */
71
-
72
- /* a in units of 1/256 rounded down */
73
- /* q1 = (int)(a * 256.0); */
74
- q = float64_mul(float64_256, a, s);
75
- int64_t q_int = float64_to_int64_round_to_zero(q, s);
76
-
77
- /* reciprocal root r */
78
- /* r = 1.0 /sqrt(((double)q1 + 0.5) / 256); */
79
- q = int64_to_float64(q_int, s);
80
- q = float64_add(q, float64_half, s);
81
- q = float64_div(q, float64_256, s);
82
- q = float64_sqrt(q, s);
83
- q = float64_div(float64_one, q, s);
84
+ a = (a >> 1) << 1;
85
+ a = (a + 1) * 2;
86
}
87
- /* r in units of 1/256 rounded to nearest */
88
- /* s = (int)(256.0 * r + 0.5); */
89
+ b = 512;
90
+ while (a * (b + 1) * (b + 1) < (1 << 28)) {
91
+ b += 1;
92
+ }
93
+ estimate = (b + 1) / 2;
94
+ assert(256 <= estimate && estimate < 512);
95
96
- q = float64_mul(q, float64_256,s );
97
- q = float64_add(q, float64_half, s);
98
- q_int = float64_to_int64_round_to_zero(q, s);
99
+ return estimate;
100
+}
101
102
- /* return (double)s / 256.0;*/
103
- return float64_div(int64_to_float64(q_int, s), float64_256, s);
104
+
105
+static uint64_t recip_sqrt_estimate(int *exp , int exp_off, uint64_t frac)
106
+{
107
+ int estimate;
108
+ uint32_t scaled;
109
+
110
+ if (*exp == 0) {
111
+ while (extract64(frac, 51, 1) == 0) {
112
+ frac = frac << 1;
113
+ *exp -= 1;
114
+ }
115
+ frac = extract64(frac, 0, 51) << 1;
116
+ }
37
+ }
117
+
38
+
118
+ if (*exp & 1) {
39
+ return cpu_get_address_space(cs, asidx);
119
+ /* scaled = UInt('01':fraction<51:45>) */
120
+ scaled = deposit32(1 << 7, 0, 7, extract64(frac, 45, 7));
121
+ } else {
122
+ /* scaled = UInt('1':fraction<51:44>) */
123
+ scaled = deposit32(1 << 8, 0, 8, extract64(frac, 44, 8));
124
+ }
125
+ estimate = do_recip_sqrt_estimate(scaled);
126
+
127
+ *exp = (exp_off - *exp) / 2;
128
+ return extract64(estimate, 0, 8) << 44;
129
+}
40
+}
130
+
41
+
131
+float16 HELPER(rsqrte_f16)(float16 input, void *fpstp)
42
typedef enum {
132
+{
43
FIXUP_NONE = 0, /* do nothing */
133
+ float_status *s = fpstp;
44
FIXUP_TERMINATOR, /* end of insns */
134
+ float16 f16 = float16_squash_input_denormal(input, s);
45
@@ -XXX,XX +XXX,XX @@ static const ARMInsnFixup smpboot[] = {
135
+ uint16_t val = float16_val(f16);
46
};
136
+ bool f16_sign = float16_is_neg(f16);
47
137
+ int f16_exp = extract32(val, 10, 5);
48
static void write_bootloader(const char *name, hwaddr addr,
138
+ uint16_t f16_frac = extract32(val, 0, 10);
49
- const ARMInsnFixup *insns, uint32_t *fixupcontext)
139
+ uint64_t f64_frac;
50
+ const ARMInsnFixup *insns, uint32_t *fixupcontext,
51
+ AddressSpace *as)
52
{
53
/* Fix up the specified bootloader fragment and write it into
54
* guest memory using rom_add_blob_fixed(). fixupcontext is
55
@@ -XXX,XX +XXX,XX @@ static void write_bootloader(const char *name, hwaddr addr,
56
code[i] = tswap32(insn);
57
}
58
59
- rom_add_blob_fixed(name, code, len * sizeof(uint32_t), addr);
60
+ rom_add_blob_fixed_as(name, code, len * sizeof(uint32_t), addr, as);
61
62
g_free(code);
63
}
64
@@ -XXX,XX +XXX,XX @@ static void default_write_secondary(ARMCPU *cpu,
65
const struct arm_boot_info *info)
66
{
67
uint32_t fixupcontext[FIXUP_MAX];
68
+ AddressSpace *as = arm_boot_address_space(cpu, info);
69
70
fixupcontext[FIXUP_GIC_CPU_IF] = info->gic_cpu_if_addr;
71
fixupcontext[FIXUP_BOOTREG] = info->smp_bootreg_addr;
72
@@ -XXX,XX +XXX,XX @@ static void default_write_secondary(ARMCPU *cpu,
73
}
74
75
write_bootloader("smpboot", info->smp_loader_start,
76
- smpboot, fixupcontext);
77
+ smpboot, fixupcontext, as);
78
}
79
80
void arm_write_secure_board_setup_dummy_smc(ARMCPU *cpu,
81
const struct arm_boot_info *info,
82
hwaddr mvbar_addr)
83
{
84
+ AddressSpace *as = arm_boot_address_space(cpu, info);
85
int n;
86
uint32_t mvbar_blob[] = {
87
/* mvbar_addr: secure monitor vectors
88
@@ -XXX,XX +XXX,XX @@ void arm_write_secure_board_setup_dummy_smc(ARMCPU *cpu,
89
for (n = 0; n < ARRAY_SIZE(mvbar_blob); n++) {
90
mvbar_blob[n] = tswap32(mvbar_blob[n]);
91
}
92
- rom_add_blob_fixed("board-setup-mvbar", mvbar_blob, sizeof(mvbar_blob),
93
- mvbar_addr);
94
+ rom_add_blob_fixed_as("board-setup-mvbar", mvbar_blob, sizeof(mvbar_blob),
95
+ mvbar_addr, as);
96
97
for (n = 0; n < ARRAY_SIZE(board_setup_blob); n++) {
98
board_setup_blob[n] = tswap32(board_setup_blob[n]);
99
}
100
- rom_add_blob_fixed("board-setup", board_setup_blob,
101
- sizeof(board_setup_blob), info->board_setup_addr);
102
+ rom_add_blob_fixed_as("board-setup", board_setup_blob,
103
+ sizeof(board_setup_blob), info->board_setup_addr, as);
104
}
105
106
static void default_reset_secondary(ARMCPU *cpu,
107
const struct arm_boot_info *info)
108
{
109
+ AddressSpace *as = arm_boot_address_space(cpu, info);
110
CPUState *cs = CPU(cpu);
111
112
- address_space_stl_notdirty(&address_space_memory, info->smp_bootreg_addr,
113
+ address_space_stl_notdirty(as, info->smp_bootreg_addr,
114
0, MEMTXATTRS_UNSPECIFIED, NULL);
115
cpu_set_pc(cs, info->smp_loader_start);
116
}
117
@@ -XXX,XX +XXX,XX @@ static inline bool have_dtb(const struct arm_boot_info *info)
118
}
119
120
#define WRITE_WORD(p, value) do { \
121
- address_space_stl_notdirty(&address_space_memory, p, value, \
122
+ address_space_stl_notdirty(as, p, value, \
123
MEMTXATTRS_UNSPECIFIED, NULL); \
124
p += 4; \
125
} while (0)
126
127
-static void set_kernel_args(const struct arm_boot_info *info)
128
+static void set_kernel_args(const struct arm_boot_info *info, AddressSpace *as)
129
{
130
int initrd_size = info->initrd_size;
131
hwaddr base = info->loader_start;
132
@@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info)
133
int cmdline_size;
134
135
cmdline_size = strlen(info->kernel_cmdline);
136
- cpu_physical_memory_write(p + 8, info->kernel_cmdline,
137
- cmdline_size + 1);
138
+ address_space_write(as, p + 8, MEMTXATTRS_UNSPECIFIED,
139
+ (const uint8_t *)info->kernel_cmdline,
140
+ cmdline_size + 1);
141
cmdline_size = (cmdline_size >> 2) + 1;
142
WRITE_WORD(p, cmdline_size + 2);
143
WRITE_WORD(p, 0x54410009);
144
@@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info)
145
atag_board_len = (info->atag_board(info, atag_board_buf) + 3) & ~3;
146
WRITE_WORD(p, (atag_board_len + 8) >> 2);
147
WRITE_WORD(p, 0x414f4d50);
148
- cpu_physical_memory_write(p, atag_board_buf, atag_board_len);
149
+ address_space_write(as, p, MEMTXATTRS_UNSPECIFIED,
150
+ atag_board_buf, atag_board_len);
151
p += atag_board_len;
152
}
153
/* ATAG_END */
154
@@ -XXX,XX +XXX,XX @@ static void set_kernel_args(const struct arm_boot_info *info)
155
WRITE_WORD(p, 0);
156
}
157
158
-static void set_kernel_args_old(const struct arm_boot_info *info)
159
+static void set_kernel_args_old(const struct arm_boot_info *info,
160
+ AddressSpace *as)
161
{
162
hwaddr p;
163
const char *s;
164
@@ -XXX,XX +XXX,XX @@ static void set_kernel_args_old(const struct arm_boot_info *info)
165
}
166
s = info->kernel_cmdline;
167
if (s) {
168
- cpu_physical_memory_write(p, s, strlen(s) + 1);
169
+ address_space_write(as, p, MEMTXATTRS_UNSPECIFIED,
170
+ (const uint8_t *)s, strlen(s) + 1);
171
} else {
172
WRITE_WORD(p, 0);
173
}
174
@@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt)
175
* @addr: the address to load the image at
176
* @binfo: struct describing the boot environment
177
* @addr_limit: upper limit of the available memory area at @addr
178
+ * @as: address space to load image to
179
*
180
* Load a device tree supplied by the machine or by the user with the
181
* '-dtb' command line option, and put it at offset @addr in target
182
@@ -XXX,XX +XXX,XX @@ static void fdt_add_psci_node(void *fdt)
183
* Note: Must not be called unless have_dtb(binfo) is true.
184
*/
185
static int load_dtb(hwaddr addr, const struct arm_boot_info *binfo,
186
- hwaddr addr_limit)
187
+ hwaddr addr_limit, AddressSpace *as)
188
{
189
void *fdt = NULL;
190
int size, rc;
191
@@ -XXX,XX +XXX,XX @@ static int load_dtb(hwaddr addr, const struct arm_boot_info *binfo,
192
/* Put the DTB into the memory map as a ROM image: this will ensure
193
* the DTB is copied again upon reset, even if addr points into RAM.
194
*/
195
- rom_add_blob_fixed("dtb", fdt, size, addr);
196
+ rom_add_blob_fixed_as("dtb", fdt, size, addr, as);
197
198
g_free(fdt);
199
200
@@ -XXX,XX +XXX,XX @@ static void do_cpu_reset(void *opaque)
201
}
202
203
if (cs == first_cpu) {
204
+ AddressSpace *as = arm_boot_address_space(cpu, info);
140
+
205
+
141
+ if (float16_is_any_nan(f16)) {
206
cpu_set_pc(cs, info->loader_start);
142
+ float16 nan = f16;
207
143
+ if (float16_is_signaling_nan(f16, s)) {
208
if (!have_dtb(info)) {
144
+ float_raise(float_flag_invalid, s);
209
if (old_param) {
145
+ nan = float16_maybe_silence_nan(f16, s);
210
- set_kernel_args_old(info);
146
+ }
211
+ set_kernel_args_old(info, as);
147
+ if (s->default_nan_mode) {
212
} else {
148
+ nan = float16_default_nan(s);
213
- set_kernel_args(info);
149
+ }
214
+ set_kernel_args(info, as);
150
+ return nan;
215
}
151
+ } else if (float16_is_zero(f16)) {
216
}
152
+ float_raise(float_flag_divbyzero, s);
217
} else {
153
+ return float16_set_sign(float16_infinity, f16_sign);
218
@@ -XXX,XX +XXX,XX @@ static int do_arm_linux_init(Object *obj, void *opaque)
154
+ } else if (f16_sign) {
219
155
+ float_raise(float_flag_invalid, s);
220
static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry,
156
+ return float16_default_nan(s);
221
uint64_t *lowaddr, uint64_t *highaddr,
157
+ } else if (float16_is_infinity(f16)) {
222
- int elf_machine)
158
+ return float16_zero;
223
+ int elf_machine, AddressSpace *as)
159
+ }
224
{
160
+
225
bool elf_is64;
161
+ /* Scale and normalize to a double-precision value between 0.25 and 1.0,
226
union {
162
+ * preserving the parity of the exponent. */
227
@@ -XXX,XX +XXX,XX @@ static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry,
163
+
228
}
164
+ f64_frac = ((uint64_t) f16_frac) << (52 - 10);
229
}
165
+
230
166
+ f64_frac = recip_sqrt_estimate(&f16_exp, 44, f64_frac);
231
- ret = load_elf(info->kernel_filename, NULL, NULL,
167
+
232
- pentry, lowaddr, highaddr, big_endian, elf_machine,
168
+ /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(2) */
233
- 1, data_swab);
169
+ val = deposit32(0, 15, 1, f16_sign);
234
+ ret = load_elf_as(info->kernel_filename, NULL, NULL,
170
+ val = deposit32(val, 10, 5, f16_exp);
235
+ pentry, lowaddr, highaddr, big_endian, elf_machine,
171
+ val = deposit32(val, 2, 8, extract64(f64_frac, 52 - 8, 8));
236
+ 1, data_swab, as);
172
+ return make_float16(val);
237
if (ret <= 0) {
173
}
238
/* The header loaded but the image didn't */
174
239
exit(1);
175
float32 HELPER(rsqrte_f32)(float32 input, void *fpstp)
240
@@ -XXX,XX +XXX,XX @@ static uint64_t arm_load_elf(struct arm_boot_info *info, uint64_t *pentry,
176
@@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrte_f32)(float32 input, void *fpstp)
241
}
177
float_status *s = fpstp;
242
178
float32 f32 = float32_squash_input_denormal(input, s);
243
static uint64_t load_aarch64_image(const char *filename, hwaddr mem_base,
179
uint32_t val = float32_val(f32);
244
- hwaddr *entry)
180
- uint32_t f32_sbit = 0x80000000 & val;
245
+ hwaddr *entry, AddressSpace *as)
181
- int32_t f32_exp = extract32(val, 23, 8);
246
{
182
+ uint32_t f32_sign = float32_is_neg(f32);
247
hwaddr kernel_load_offset = KERNEL64_LOAD_ADDR;
183
+ int f32_exp = extract32(val, 23, 8);
248
uint8_t *buffer;
184
uint32_t f32_frac = extract32(val, 0, 23);
249
@@ -XXX,XX +XXX,XX @@ static uint64_t load_aarch64_image(const char *filename, hwaddr mem_base,
185
uint64_t f64_frac;
250
}
186
- uint64_t val64;
251
187
- int result_exp;
252
*entry = mem_base + kernel_load_offset;
188
- float64 f64;
253
- rom_add_blob_fixed(filename, buffer, size, *entry);
189
254
+ rom_add_blob_fixed_as(filename, buffer, size, *entry, as);
190
if (float32_is_any_nan(f32)) {
255
191
float32 nan = f32;
256
g_free(buffer);
192
@@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrte_f32)(float32 input, void *fpstp)
257
193
* preserving the parity of the exponent. */
258
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
194
259
ARMCPU *cpu = n->cpu;
195
f64_frac = ((uint64_t) f32_frac) << 29;
260
struct arm_boot_info *info =
196
- if (f32_exp == 0) {
261
container_of(n, struct arm_boot_info, load_kernel_notifier);
197
- while (extract64(f64_frac, 51, 1) == 0) {
262
+ AddressSpace *as = arm_boot_address_space(cpu, info);
198
- f64_frac = f64_frac << 1;
263
199
- f32_exp = f32_exp-1;
264
/* The board code is not supposed to set secure_board_setup unless
200
- }
265
* running its code in secure mode is actually possible, and KVM
201
- f64_frac = extract64(f64_frac, 0, 51) << 1;
266
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
202
- }
267
* the kernel is supposed to be loaded by the bootloader), copy the
203
268
* DTB to the base of RAM for the bootloader to pick up.
204
- if (extract64(f32_exp, 0, 1) == 0) {
269
*/
205
- f64 = make_float64(((uint64_t) f32_sbit) << 32
270
- if (load_dtb(info->loader_start, info, 0) < 0) {
206
- | (0x3feULL << 52)
271
+ if (load_dtb(info->loader_start, info, 0, as) < 0) {
207
- | f64_frac);
272
exit(1);
208
- } else {
273
}
209
- f64 = make_float64(((uint64_t) f32_sbit) << 32
274
}
210
- | (0x3fdULL << 52)
275
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
211
- | f64_frac);
276
212
- }
277
/* Assume that raw images are linux kernels, and ELF images are not. */
213
+ f64_frac = recip_sqrt_estimate(&f32_exp, 380, f64_frac);
278
kernel_size = arm_load_elf(info, &elf_entry, &elf_low_addr,
214
279
- &elf_high_addr, elf_machine);
215
- result_exp = (380 - f32_exp) / 2;
280
+ &elf_high_addr, elf_machine, as);
216
-
281
if (kernel_size > 0 && have_dtb(info)) {
217
- f64 = recip_sqrt_estimate(f64, s);
282
/* If there is still some room left at the base of RAM, try and put
218
-
283
* the DTB there like we do for images loaded with -bios or -pflash.
219
- val64 = float64_val(f64);
284
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
220
-
285
if (elf_low_addr < info->loader_start) {
221
- val = ((result_exp & 0xff) << 23)
286
elf_low_addr = 0;
222
- | ((val64 >> 29) & 0x7fffff);
287
}
223
+ /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(15) */
288
- if (load_dtb(info->loader_start, info, elf_low_addr) < 0) {
224
+ val = deposit32(0, 31, 1, f32_sign);
289
+ if (load_dtb(info->loader_start, info, elf_low_addr, as) < 0) {
225
+ val = deposit32(val, 23, 8, f32_exp);
290
exit(1);
226
+ val = deposit32(val, 15, 8, extract64(f64_frac, 52 - 8, 8));
291
}
227
return make_float32(val);
292
}
228
}
293
}
229
294
entry = elf_entry;
230
@@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp)
295
if (kernel_size < 0) {
231
float_status *s = fpstp;
296
- kernel_size = load_uimage(info->kernel_filename, &entry, NULL,
232
float64 f64 = float64_squash_input_denormal(input, s);
297
- &is_linux, NULL, NULL);
233
uint64_t val = float64_val(f64);
298
+ kernel_size = load_uimage_as(info->kernel_filename, &entry, NULL,
234
- uint64_t f64_sbit = 0x8000000000000000ULL & val;
299
+ &is_linux, NULL, NULL, as);
235
- int64_t f64_exp = extract64(val, 52, 11);
300
}
236
+ bool f64_sign = float64_is_neg(f64);
301
if (arm_feature(&cpu->env, ARM_FEATURE_AARCH64) && kernel_size < 0) {
237
+ int f64_exp = extract64(val, 52, 11);
302
kernel_size = load_aarch64_image(info->kernel_filename,
238
uint64_t f64_frac = extract64(val, 0, 52);
303
- info->loader_start, &entry);
239
- int64_t result_exp;
304
+ info->loader_start, &entry, as);
240
- uint64_t result_frac;
305
is_linux = 1;
241
306
} else if (kernel_size < 0) {
242
if (float64_is_any_nan(f64)) {
307
/* 32-bit ARM */
243
float64 nan = f64;
308
entry = info->loader_start + KERNEL_LOAD_ADDR;
244
@@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp)
309
- kernel_size = load_image_targphys(info->kernel_filename, entry,
245
return float64_zero;
310
- info->ram_size - KERNEL_LOAD_ADDR);
246
}
311
+ kernel_size = load_image_targphys_as(info->kernel_filename, entry,
247
312
+ info->ram_size - KERNEL_LOAD_ADDR,
248
- /* Scale and normalize to a double-precision value between 0.25 and 1.0,
313
+ as);
249
- * preserving the parity of the exponent. */
314
is_linux = 1;
250
+ f64_frac = recip_sqrt_estimate(&f64_exp, 3068, f64_frac);
315
}
251
316
if (kernel_size < 0) {
252
- if (f64_exp == 0) {
317
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
253
- while (extract64(f64_frac, 51, 1) == 0) {
318
uint32_t fixupcontext[FIXUP_MAX];
254
- f64_frac = f64_frac << 1;
319
255
- f64_exp = f64_exp - 1;
320
if (info->initrd_filename) {
256
- }
321
- initrd_size = load_ramdisk(info->initrd_filename,
257
- f64_frac = extract64(f64_frac, 0, 51) << 1;
322
- info->initrd_start,
258
- }
323
- info->ram_size -
259
-
324
- info->initrd_start);
260
- if (extract64(f64_exp, 0, 1) == 0) {
325
+ initrd_size = load_ramdisk_as(info->initrd_filename,
261
- f64 = make_float64(f64_sbit
326
+ info->initrd_start,
262
- | (0x3feULL << 52)
327
+ info->ram_size - info->initrd_start,
263
- | f64_frac);
328
+ as);
264
- } else {
329
if (initrd_size < 0) {
265
- f64 = make_float64(f64_sbit
330
- initrd_size = load_image_targphys(info->initrd_filename,
266
- | (0x3fdULL << 52)
331
- info->initrd_start,
267
- | f64_frac);
332
- info->ram_size -
268
- }
333
- info->initrd_start);
269
-
334
+ initrd_size = load_image_targphys_as(info->initrd_filename,
270
- result_exp = (3068 - f64_exp) / 2;
335
+ info->initrd_start,
271
-
336
+ info->ram_size -
272
- f64 = recip_sqrt_estimate(f64, s);
337
+ info->initrd_start,
273
-
338
+ as);
274
- result_frac = extract64(float64_val(f64), 0, 52);
339
}
275
-
340
if (initrd_size < 0) {
276
- return make_float64(f64_sbit |
341
error_report("could not load initrd '%s'",
277
- ((result_exp & 0x7ff) << 52) |
342
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
278
- result_frac);
343
279
+ /* result = sign : result_exp<4:0> : estimate<7:0> : Zeros(44) */
344
/* Place the DTB after the initrd in memory with alignment. */
280
+ val = deposit64(0, 61, 1, f64_sign);
345
dtb_start = QEMU_ALIGN_UP(info->initrd_start + initrd_size, align);
281
+ val = deposit64(val, 52, 11, f64_exp);
346
- if (load_dtb(dtb_start, info, 0) < 0) {
282
+ val = deposit64(val, 44, 8, extract64(f64_frac, 52 - 8, 8));
347
+ if (load_dtb(dtb_start, info, 0, as) < 0) {
283
+ return make_float64(val);
348
exit(1);
284
}
349
}
285
350
fixupcontext[FIXUP_ARGPTR] = dtb_start;
286
uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp)
351
@@ -XXX,XX +XXX,XX @@ static void arm_load_kernel_notify(Notifier *notifier, void *data)
287
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp)
352
fixupcontext[FIXUP_ENTRYPOINT] = entry;
288
353
289
uint32_t HELPER(rsqrte_u32)(uint32_t a, void *fpstp)
354
write_bootloader("bootloader", info->loader_start,
290
{
355
- primary_loader, fixupcontext);
291
- float_status *fpst = fpstp;
356
+ primary_loader, fixupcontext, as);
292
- float64 f64;
357
293
+ int estimate;
358
if (info->nb_cpus > 1) {
294
359
info->write_secondary_boot(cpu, info);
295
if ((a & 0xc0000000) == 0) {
296
return 0xffffffff;
297
}
298
299
- if (a & 0x80000000) {
300
- f64 = make_float64((0x3feULL << 52)
301
- | ((uint64_t)(a & 0x7fffffff) << 21));
302
- } else { /* bits 31-30 == '01' */
303
- f64 = make_float64((0x3fdULL << 52)
304
- | ((uint64_t)(a & 0x3fffffff) << 22));
305
- }
306
+ estimate = do_recip_sqrt_estimate(extract32(a, 23, 9));
307
308
- f64 = recip_sqrt_estimate(f64, fpst);
309
-
310
- return 0x80000000 | ((float64_val(f64) >> 21) & 0x7fffffff);
311
+ return deposit32(0, 23, 9, estimate);
312
}
313
314
/* VFPv4 fused multiply-accumulate */
315
--
360
--
316
2.16.2
361
2.16.2
317
362
318
363
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Instead of loading guest images to the system address space, use the
2
CPU's address space. This is important if we're trying to load the
3
file to memory or via an alias memory region that is provided by an
4
SoC object and thus not mapped into the system address space.
2
5
3
I re-use the existing handle_2misc_fcmp_zero handler and tweak it
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
slightly to deal with the half-precision case.
7
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Message-id: 20180220180325.29818-4-peter.maydell@linaro.org
10
---
11
hw/arm/armv7m.c | 17 ++++++++++++++---
12
1 file changed, 14 insertions(+), 3 deletions(-)
5
13
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
14
diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-20-alex.bennee@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
11
target/arm/translate-a64.c | 80 +++++++++++++++++++++++++++++++++-------------
12
1 file changed, 57 insertions(+), 23 deletions(-)
13
14
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/translate-a64.c
16
--- a/hw/arm/armv7m.c
17
+++ b/target/arm/translate-a64.c
17
+++ b/hw/arm/armv7m.c
18
@@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode,
18
@@ -XXX,XX +XXX,XX @@ void armv7m_load_kernel(ARMCPU *cpu, const char *kernel_filename, int mem_size)
19
bool is_scalar, bool is_u, bool is_q,
19
uint64_t entry;
20
int size, int rn, int rd)
20
uint64_t lowaddr;
21
{
21
int big_endian;
22
- bool is_double = (size == 3);
22
+ AddressSpace *as;
23
+ bool is_double = (size == MO_64);
23
+ int asidx;
24
TCGv_ptr fpst;
24
+ CPUState *cs = CPU(cpu);
25
25
26
if (!fp_access_check(s)) {
26
#ifdef TARGET_WORDS_BIGENDIAN
27
return;
27
big_endian = 1;
28
@@ -XXX,XX +XXX,XX @@ void armv7m_load_kernel(ARMCPU *cpu, const char *kernel_filename, int mem_size)
29
exit(1);
28
}
30
}
29
31
30
- fpst = get_fpstatus_ptr(false);
32
+ if (arm_feature(&cpu->env, ARM_FEATURE_EL3)) {
31
+ fpst = get_fpstatus_ptr(size == MO_16);
33
+ asidx = ARMASIdx_S;
32
34
+ } else {
33
if (is_double) {
35
+ asidx = ARMASIdx_NS;
34
TCGv_i64 tcg_op = tcg_temp_new_i64();
36
+ }
35
@@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode,
37
+ as = cpu_get_address_space(cs, asidx);
36
bool swap = false;
38
+
37
int pass, maxpasses;
39
if (kernel_filename) {
38
40
- image_size = load_elf(kernel_filename, NULL, NULL, &entry, &lowaddr,
39
- switch (opcode) {
41
- NULL, big_endian, EM_ARM, 1, 0);
40
- case 0x2e: /* FCMLT (zero) */
42
+ image_size = load_elf_as(kernel_filename, NULL, NULL, &entry, &lowaddr,
41
- swap = true;
43
+ NULL, big_endian, EM_ARM, 1, 0, as);
42
- /* fall through */
44
if (image_size < 0) {
43
- case 0x2c: /* FCMGT (zero) */
45
- image_size = load_image_targphys(kernel_filename, 0, mem_size);
44
- genfn = gen_helper_neon_cgt_f32;
46
+ image_size = load_image_targphys_as(kernel_filename, 0,
45
- break;
47
+ mem_size, as);
46
- case 0x2d: /* FCMEQ (zero) */
48
lowaddr = 0;
47
- genfn = gen_helper_neon_ceq_f32;
48
- break;
49
- case 0x6d: /* FCMLE (zero) */
50
- swap = true;
51
- /* fall through */
52
- case 0x6c: /* FCMGE (zero) */
53
- genfn = gen_helper_neon_cge_f32;
54
- break;
55
- default:
56
- g_assert_not_reached();
57
+ if (size == MO_16) {
58
+ switch (opcode) {
59
+ case 0x2e: /* FCMLT (zero) */
60
+ swap = true;
61
+ /* fall through */
62
+ case 0x2c: /* FCMGT (zero) */
63
+ genfn = gen_helper_advsimd_cgt_f16;
64
+ break;
65
+ case 0x2d: /* FCMEQ (zero) */
66
+ genfn = gen_helper_advsimd_ceq_f16;
67
+ break;
68
+ case 0x6d: /* FCMLE (zero) */
69
+ swap = true;
70
+ /* fall through */
71
+ case 0x6c: /* FCMGE (zero) */
72
+ genfn = gen_helper_advsimd_cge_f16;
73
+ break;
74
+ default:
75
+ g_assert_not_reached();
76
+ }
77
+ } else {
78
+ switch (opcode) {
79
+ case 0x2e: /* FCMLT (zero) */
80
+ swap = true;
81
+ /* fall through */
82
+ case 0x2c: /* FCMGT (zero) */
83
+ genfn = gen_helper_neon_cgt_f32;
84
+ break;
85
+ case 0x2d: /* FCMEQ (zero) */
86
+ genfn = gen_helper_neon_ceq_f32;
87
+ break;
88
+ case 0x6d: /* FCMLE (zero) */
89
+ swap = true;
90
+ /* fall through */
91
+ case 0x6c: /* FCMGE (zero) */
92
+ genfn = gen_helper_neon_cge_f32;
93
+ break;
94
+ default:
95
+ g_assert_not_reached();
96
+ }
97
}
49
}
98
50
if (image_size < 0) {
99
if (is_scalar) {
100
maxpasses = 1;
101
} else {
102
- maxpasses = is_q ? 4 : 2;
103
+ int vector_size = 8 << is_q;
104
+ maxpasses = vector_size >> size;
105
}
106
107
for (pass = 0; pass < maxpasses; pass++) {
108
- read_vec_element_i32(s, tcg_op, rn, pass, MO_32);
109
+ read_vec_element_i32(s, tcg_op, rn, pass, size);
110
if (swap) {
111
genfn(tcg_res, tcg_zero, tcg_op, fpst);
112
} else {
113
@@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode,
114
if (is_scalar) {
115
write_fp_sreg(s, rd, tcg_res);
116
} else {
117
- write_vec_element_i32(s, tcg_res, rd, pass, MO_32);
118
+ write_vec_element_i32(s, tcg_res, rd, pass, size);
119
}
120
}
121
tcg_temp_free_i32(tcg_res);
122
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
123
fpop = deposit32(opcode, 5, 1, a);
124
fpop = deposit32(fpop, 6, 1, u);
125
126
+ rd = extract32(insn, 0, 5);
127
+ rn = extract32(insn, 5, 5);
128
+
129
switch (fpop) {
130
+ break;
131
+ case 0x2c: /* FCMGT (zero) */
132
+ case 0x2d: /* FCMEQ (zero) */
133
+ case 0x2e: /* FCMLT (zero) */
134
+ case 0x6c: /* FCMGE (zero) */
135
+ case 0x6d: /* FCMLE (zero) */
136
+ handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd);
137
+ return;
138
case 0x18: /* FRINTN */
139
need_rmode = true;
140
only_in_vector = true;
141
--
51
--
142
2.16.2
52
2.16.2
143
53
144
54
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
In v8M, the Implementation Defined Attribution Unit (IDAU) is
2
2
a small piece of hardware typically implemented in the SoC
3
Half-precision flush to zero behaviour is controlled by a separate
3
which provides board or SoC specific security attribution
4
FZ16 bit in the FPCR. To handle this we pass a pointer to
4
information for each address that the CPU performs MPU/SAU
5
fp_status_fp16 when working on half-precision operations. The value of
5
checks on. For QEMU, we model this with a QOM interface which
6
the presented FPCR is calculated from an amalgam of the two when read.
6
is implemented by the board or SoC object and connected to
7
7
the CPU using a link property.
8
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
8
9
This commit defines the new interface class, adds the link
10
property to the CPU object, and makes the SAU checking
11
code call the IDAU interface if one is present.
12
13
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
14
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
10
Message-id: 20180227143852.11175-5-alex.bennee@linaro.org
15
Message-id: 20180220180325.29818-5-peter.maydell@linaro.org
11
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
12
---
16
---
13
target/arm/cpu.h | 32 ++++++++++++++++++++++------
17
target/arm/cpu.h | 3 +++
14
target/arm/helper.c | 26 ++++++++++++++++++-----
18
target/arm/idau.h | 61 +++++++++++++++++++++++++++++++++++++++++++++++++++++
15
target/arm/translate-a64.c | 53 +++++++++++++++++++++++++---------------------
19
target/arm/cpu.c | 15 +++++++++++++
16
3 files changed, 75 insertions(+), 36 deletions(-)
20
target/arm/helper.c | 28 +++++++++++++++++++++---
21
4 files changed, 104 insertions(+), 3 deletions(-)
22
create mode 100644 target/arm/idau.h
17
23
18
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
24
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
19
index XXXXXXX..XXXXXXX 100644
25
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/cpu.h
26
--- a/target/arm/cpu.h
21
+++ b/target/arm/cpu.h
27
+++ b/target/arm/cpu.h
22
@@ -XXX,XX +XXX,XX @@ typedef struct CPUARMState {
28
@@ -XXX,XX +XXX,XX @@ struct ARMCPU {
23
/* scratch space when Tn are not sufficient. */
29
/* MemoryRegion to use for secure physical accesses */
24
uint32_t scratch[8];
30
MemoryRegion *secure_memory;
25
31
26
- /* fp_status is the "normal" fp status. standard_fp_status retains
32
+ /* For v8M, pointer to the IDAU interface provided by board/SoC */
27
- * values corresponding to the ARM "Standard FPSCR Value", ie
33
+ Object *idau;
28
- * default-NaN, flush-to-zero, round-to-nearest and is used by
34
+
29
- * any operations (generally Neon) which the architecture defines
35
/* 'compatible' string for this CPU for Linux device trees */
30
- * as controlled by the standard FPSCR value rather than the FPSCR.
36
const char *dtb_compatible;
31
+ /* There are a number of distinct float control structures:
37
32
+ *
38
diff --git a/target/arm/idau.h b/target/arm/idau.h
33
+ * fp_status: is the "normal" fp status.
39
new file mode 100644
34
+ * fp_status_fp16: used for half-precision calculations
40
index XXXXXXX..XXXXXXX
35
+ * standard_fp_status : the ARM "Standard FPSCR Value"
41
--- /dev/null
36
+ *
42
+++ b/target/arm/idau.h
37
+ * Half-precision operations are governed by a separate
43
@@ -XXX,XX +XXX,XX @@
38
+ * flush-to-zero control bit in FPSCR:FZ16. We pass a separate
44
+/*
39
+ * status structure to control this.
45
+ * QEMU ARM CPU -- interface for the Arm v8M IDAU
40
+ *
46
+ *
41
+ * The "Standard FPSCR", ie default-NaN, flush-to-zero,
47
+ * Copyright (c) 2018 Linaro Ltd
42
+ * round-to-nearest and is used by any operations (generally
48
+ *
43
+ * Neon) which the architecture defines as controlled by the
49
+ * This program is free software; you can redistribute it and/or
44
+ * standard FPSCR value rather than the FPSCR.
50
+ * modify it under the terms of the GNU General Public License
45
*
51
+ * as published by the Free Software Foundation; either version 2
46
* To avoid having to transfer exception bits around, we simply
52
+ * of the License, or (at your option) any later version.
47
* say that the FPSCR cumulative exception flags are the logical
53
+ *
48
- * OR of the flags in the two fp statuses. This relies on the
54
+ * This program is distributed in the hope that it will be useful,
49
+ * OR of the flags in the three fp statuses. This relies on the
55
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
50
* only thing which needs to read the exception flags being
56
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
51
* an explicit FPSCR read.
57
+ * GNU General Public License for more details.
52
*/
58
+ *
53
float_status fp_status;
59
+ * You should have received a copy of the GNU General Public License
54
+ float_status fp_status_f16;
60
+ * along with this program; if not, see
55
float_status standard_fp_status;
61
+ * <http://www.gnu.org/licenses/gpl-2.0.html>
56
62
+ *
57
/* ZCR_EL[1-3] */
63
+ * In the v8M architecture, the IDAU is a small piece of hardware
58
@@ -XXX,XX +XXX,XX @@ static inline void xpsr_write(CPUARMState *env, uint32_t val, uint32_t mask)
64
+ * typically implemented in the SoC which provides board or SoC
59
uint32_t vfp_get_fpscr(CPUARMState *env);
65
+ * specific security attribution information for each address that
60
void vfp_set_fpscr(CPUARMState *env, uint32_t val);
66
+ * the CPU performs MPU/SAU checks on. For QEMU, we model this with a
61
67
+ * QOM interface which is implemented by the board or SoC object and
62
-/* For A64 the FPSCR is split into two logically distinct registers,
68
+ * connected to the CPU using a link property.
63
+/* FPCR, Floating Point Control Register
69
+ */
64
+ * FPSR, Floating Poiht Status Register
70
+
65
+ *
71
+#ifndef TARGET_ARM_IDAU_H
66
+ * For A64 the FPSCR is split into two logically distinct registers,
72
+#define TARGET_ARM_IDAU_H
67
* FPCR and FPSR. However since they still use non-overlapping bits
73
+
68
* we store the underlying state in fpscr and just mask on read/write.
74
+#include "qom/object.h"
75
+
76
+#define TYPE_IDAU_INTERFACE "idau-interface"
77
+#define IDAU_INTERFACE(obj) \
78
+ INTERFACE_CHECK(IDAUInterface, (obj), TYPE_IDAU_INTERFACE)
79
+#define IDAU_INTERFACE_CLASS(class) \
80
+ OBJECT_CLASS_CHECK(IDAUInterfaceClass, (class), TYPE_IDAU_INTERFACE)
81
+#define IDAU_INTERFACE_GET_CLASS(obj) \
82
+ OBJECT_GET_CLASS(IDAUInterfaceClass, (obj), TYPE_IDAU_INTERFACE)
83
+
84
+typedef struct IDAUInterface {
85
+ Object parent;
86
+} IDAUInterface;
87
+
88
+#define IREGION_NOTVALID -1
89
+
90
+typedef struct IDAUInterfaceClass {
91
+ InterfaceClass parent;
92
+
93
+ /* Check the specified address and return the IDAU security information
94
+ * for it by filling in iregion, exempt, ns and nsc:
95
+ * iregion: IDAU region number, or IREGION_NOTVALID if not valid
96
+ * exempt: true if address is exempt from security attribution
97
+ * ns: true if the address is NonSecure
98
+ * nsc: true if the address is NonSecure-callable
99
+ */
100
+ void (*check)(IDAUInterface *ii, uint32_t address, int *iregion,
101
+ bool *exempt, bool *ns, bool *nsc);
102
+} IDAUInterfaceClass;
103
+
104
+#endif
105
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
106
index XXXXXXX..XXXXXXX 100644
107
--- a/target/arm/cpu.c
108
+++ b/target/arm/cpu.c
109
@@ -XXX,XX +XXX,XX @@
69
*/
110
*/
70
#define FPSR_MASK 0xf800009f
111
71
#define FPCR_MASK 0x07f79f00
112
#include "qemu/osdep.h"
72
+
113
+#include "target/arm/idau.h"
73
+#define FPCR_FZ16 (1 << 19) /* ARMv8.2+, FP16 flush-to-zero */
114
#include "qemu/error-report.h"
74
+#define FPCR_FZ (1 << 24) /* Flush-to-zero enable bit */
115
#include "qapi/error.h"
75
+#define FPCR_DN (1 << 25) /* Default NaN enable bit */
116
#include "cpu.h"
76
+
117
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_post_init(Object *obj)
77
static inline uint32_t vfp_get_fpsr(CPUARMState *env)
118
}
119
}
120
121
+ if (arm_feature(&cpu->env, ARM_FEATURE_M_SECURITY)) {
122
+ object_property_add_link(obj, "idau", TYPE_IDAU_INTERFACE, &cpu->idau,
123
+ qdev_prop_allow_set_link_before_realize,
124
+ OBJ_PROP_LINK_UNREF_ON_RELEASE,
125
+ &error_abort);
126
+ }
127
+
128
qdev_property_add_static(DEVICE(obj), &arm_cpu_cfgend_property,
129
&error_abort);
130
}
131
@@ -XXX,XX +XXX,XX @@ static const TypeInfo arm_cpu_type_info = {
132
.class_init = arm_cpu_class_init,
133
};
134
135
+static const TypeInfo idau_interface_type_info = {
136
+ .name = TYPE_IDAU_INTERFACE,
137
+ .parent = TYPE_INTERFACE,
138
+ .class_size = sizeof(IDAUInterfaceClass),
139
+};
140
+
141
static void arm_cpu_register_types(void)
78
{
142
{
79
return vfp_get_fpscr(env) & FPSR_MASK;
143
const ARMCPUInfo *info = arm_cpus;
144
145
type_register_static(&arm_cpu_type_info);
146
+ type_register_static(&idau_interface_type_info);
147
148
while (info->name) {
149
cpu_register(info);
80
diff --git a/target/arm/helper.c b/target/arm/helper.c
150
diff --git a/target/arm/helper.c b/target/arm/helper.c
81
index XXXXXXX..XXXXXXX 100644
151
index XXXXXXX..XXXXXXX 100644
82
--- a/target/arm/helper.c
152
--- a/target/arm/helper.c
83
+++ b/target/arm/helper.c
153
+++ b/target/arm/helper.c
84
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(vfp_get_fpscr)(CPUARMState *env)
154
@@ -XXX,XX +XXX,XX @@
85
| (env->vfp.vec_stride << 20);
155
#include "qemu/osdep.h"
86
i = get_float_exception_flags(&env->vfp.fp_status);
156
+#include "target/arm/idau.h"
87
i |= get_float_exception_flags(&env->vfp.standard_fp_status);
157
#include "trace.h"
88
+ i |= get_float_exception_flags(&env->vfp.fp_status_f16);
158
#include "cpu.h"
89
fpscr |= vfp_exceptbits_from_host(i);
159
#include "internals.h"
90
return fpscr;
160
@@ -XXX,XX +XXX,XX @@ static void v8m_security_lookup(CPUARMState *env, uint32_t address,
161
*/
162
ARMCPU *cpu = arm_env_get_cpu(env);
163
int r;
164
+ bool idau_exempt = false, idau_ns = true, idau_nsc = true;
165
+ int idau_region = IREGION_NOTVALID;
166
167
- /* TODO: implement IDAU */
168
+ if (cpu->idau) {
169
+ IDAUInterfaceClass *iic = IDAU_INTERFACE_GET_CLASS(cpu->idau);
170
+ IDAUInterface *ii = IDAU_INTERFACE(cpu->idau);
171
+
172
+ iic->check(ii, address, &idau_region, &idau_exempt, &idau_ns,
173
+ &idau_nsc);
174
+ }
175
176
if (access_type == MMU_INST_FETCH && extract32(address, 28, 4) == 0xf) {
177
/* 0xf0000000..0xffffffff is always S for insn fetches */
178
return;
179
}
180
181
- if (v8m_is_sau_exempt(env, address, access_type)) {
182
+ if (idau_exempt || v8m_is_sau_exempt(env, address, access_type)) {
183
sattrs->ns = !regime_is_secure(env, mmu_idx);
184
return;
185
}
186
187
+ if (idau_region != IREGION_NOTVALID) {
188
+ sattrs->irvalid = true;
189
+ sattrs->iregion = idau_region;
190
+ }
191
+
192
switch (env->sau.ctrl & 3) {
193
case 0: /* SAU.ENABLE == 0, SAU.ALLNS == 0 */
194
break;
195
@@ -XXX,XX +XXX,XX @@ static void v8m_security_lookup(CPUARMState *env, uint32_t address,
196
}
197
}
198
199
- /* TODO when we support the IDAU then it may override the result here */
200
+ /* The IDAU will override the SAU lookup results if it specifies
201
+ * higher security than the SAU does.
202
+ */
203
+ if (!idau_ns) {
204
+ if (sattrs->ns || (!idau_nsc && sattrs->nsc)) {
205
+ sattrs->ns = false;
206
+ sattrs->nsc = idau_nsc;
207
+ }
208
+ }
209
break;
210
}
91
}
211
}
92
@@ -XXX,XX +XXX,XX @@ void HELPER(vfp_set_fpscr)(CPUARMState *env, uint32_t val)
93
break;
94
}
95
set_float_rounding_mode(i, &env->vfp.fp_status);
96
+ set_float_rounding_mode(i, &env->vfp.fp_status_f16);
97
}
98
- if (changed & (1 << 24)) {
99
- set_flush_to_zero((val & (1 << 24)) != 0, &env->vfp.fp_status);
100
- set_flush_inputs_to_zero((val & (1 << 24)) != 0, &env->vfp.fp_status);
101
+ if (changed & FPCR_FZ16) {
102
+ bool ftz_enabled = val & FPCR_FZ16;
103
+ set_flush_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
104
+ set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status_f16);
105
+ }
106
+ if (changed & FPCR_FZ) {
107
+ bool ftz_enabled = val & FPCR_FZ;
108
+ set_flush_to_zero(ftz_enabled, &env->vfp.fp_status);
109
+ set_flush_inputs_to_zero(ftz_enabled, &env->vfp.fp_status);
110
+ }
111
+ if (changed & FPCR_DN) {
112
+ bool dnan_enabled = val & FPCR_DN;
113
+ set_default_nan_mode(dnan_enabled, &env->vfp.fp_status);
114
+ set_default_nan_mode(dnan_enabled, &env->vfp.fp_status_f16);
115
}
116
- if (changed & (1 << 25))
117
- set_default_nan_mode((val & (1 << 25)) != 0, &env->vfp.fp_status);
118
119
+ /* The exception flags are ORed together when we read fpscr so we
120
+ * only need to preserve the current state in one of our
121
+ * float_status values.
122
+ */
123
i = vfp_exceptbits_to_host(val);
124
set_float_exception_flags(i, &env->vfp.fp_status);
125
+ set_float_exception_flags(0, &env->vfp.fp_status_f16);
126
set_float_exception_flags(0, &env->vfp.standard_fp_status);
127
}
128
129
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
130
index XXXXXXX..XXXXXXX 100644
131
--- a/target/arm/translate-a64.c
132
+++ b/target/arm/translate-a64.c
133
@@ -XXX,XX +XXX,XX @@ static void write_fp_sreg(DisasContext *s, int reg, TCGv_i32 v)
134
tcg_temp_free_i64(tmp);
135
}
136
137
-static TCGv_ptr get_fpstatus_ptr(void)
138
+static TCGv_ptr get_fpstatus_ptr(bool is_f16)
139
{
140
TCGv_ptr statusptr = tcg_temp_new_ptr();
141
int offset;
142
143
- /* In A64 all instructions (both FP and Neon) use the FPCR;
144
- * there is no equivalent of the A32 Neon "standard FPSCR value"
145
- * and all operations use vfp.fp_status.
146
+ /* In A64 all instructions (both FP and Neon) use the FPCR; there
147
+ * is no equivalent of the A32 Neon "standard FPSCR value".
148
+ * However half-precision operations operate under a different
149
+ * FZ16 flag and use vfp.fp_status_f16 instead of vfp.fp_status.
150
*/
151
- offset = offsetof(CPUARMState, vfp.fp_status);
152
+ if (is_f16) {
153
+ offset = offsetof(CPUARMState, vfp.fp_status_f16);
154
+ } else {
155
+ offset = offsetof(CPUARMState, vfp.fp_status);
156
+ }
157
tcg_gen_addi_ptr(statusptr, cpu_env, offset);
158
return statusptr;
159
}
160
@@ -XXX,XX +XXX,XX @@ static void handle_fp_compare(DisasContext *s, bool is_double,
161
bool cmp_with_zero, bool signal_all_nans)
162
{
163
TCGv_i64 tcg_flags = tcg_temp_new_i64();
164
- TCGv_ptr fpst = get_fpstatus_ptr();
165
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
166
167
if (is_double) {
168
TCGv_i64 tcg_vn, tcg_vm;
169
@@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn)
170
TCGv_i32 tcg_op;
171
TCGv_i32 tcg_res;
172
173
- fpst = get_fpstatus_ptr();
174
+ fpst = get_fpstatus_ptr(false);
175
tcg_op = read_fp_sreg(s, rn);
176
tcg_res = tcg_temp_new_i32();
177
178
@@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_double(DisasContext *s, int opcode, int rd, int rn)
179
return;
180
}
181
182
- fpst = get_fpstatus_ptr();
183
+ fpst = get_fpstatus_ptr(false);
184
tcg_op = read_fp_dreg(s, rn);
185
tcg_res = tcg_temp_new_i64();
186
187
@@ -XXX,XX +XXX,XX @@ static void handle_fp_2src_single(DisasContext *s, int opcode,
188
TCGv_ptr fpst;
189
190
tcg_res = tcg_temp_new_i32();
191
- fpst = get_fpstatus_ptr();
192
+ fpst = get_fpstatus_ptr(false);
193
tcg_op1 = read_fp_sreg(s, rn);
194
tcg_op2 = read_fp_sreg(s, rm);
195
196
@@ -XXX,XX +XXX,XX @@ static void handle_fp_2src_double(DisasContext *s, int opcode,
197
TCGv_ptr fpst;
198
199
tcg_res = tcg_temp_new_i64();
200
- fpst = get_fpstatus_ptr();
201
+ fpst = get_fpstatus_ptr(false);
202
tcg_op1 = read_fp_dreg(s, rn);
203
tcg_op2 = read_fp_dreg(s, rm);
204
205
@@ -XXX,XX +XXX,XX @@ static void handle_fp_3src_single(DisasContext *s, bool o0, bool o1,
206
{
207
TCGv_i32 tcg_op1, tcg_op2, tcg_op3;
208
TCGv_i32 tcg_res = tcg_temp_new_i32();
209
- TCGv_ptr fpst = get_fpstatus_ptr();
210
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
211
212
tcg_op1 = read_fp_sreg(s, rn);
213
tcg_op2 = read_fp_sreg(s, rm);
214
@@ -XXX,XX +XXX,XX @@ static void handle_fp_3src_double(DisasContext *s, bool o0, bool o1,
215
{
216
TCGv_i64 tcg_op1, tcg_op2, tcg_op3;
217
TCGv_i64 tcg_res = tcg_temp_new_i64();
218
- TCGv_ptr fpst = get_fpstatus_ptr();
219
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
220
221
tcg_op1 = read_fp_dreg(s, rn);
222
tcg_op2 = read_fp_dreg(s, rm);
223
@@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode,
224
TCGv_ptr tcg_fpstatus;
225
TCGv_i32 tcg_shift;
226
227
- tcg_fpstatus = get_fpstatus_ptr();
228
+ tcg_fpstatus = get_fpstatus_ptr(false);
229
230
tcg_shift = tcg_const_i32(64 - scale);
231
232
@@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn)
233
TCGv_i32 tcg_elt1 = tcg_temp_new_i32();
234
TCGv_i32 tcg_elt2 = tcg_temp_new_i32();
235
TCGv_i32 tcg_elt3 = tcg_temp_new_i32();
236
- TCGv_ptr fpst = get_fpstatus_ptr();
237
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
238
239
assert(esize == 32);
240
assert(elements == 4);
241
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn)
242
}
243
244
size = extract32(size, 0, 1) ? 3 : 2;
245
- fpst = get_fpstatus_ptr();
246
+ fpst = get_fpstatus_ptr(false);
247
break;
248
default:
249
unallocated_encoding(s);
250
@@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn,
251
int fracbits, int size)
252
{
253
bool is_double = size == 3 ? true : false;
254
- TCGv_ptr tcg_fpst = get_fpstatus_ptr();
255
+ TCGv_ptr tcg_fpst = get_fpstatus_ptr(false);
256
TCGv_i32 tcg_shift = tcg_const_i32(fracbits);
257
TCGv_i64 tcg_int = tcg_temp_new_i64();
258
TCGMemOp mop = size | (is_signed ? MO_SIGN : 0);
259
@@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
260
261
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(FPROUNDING_ZERO));
262
gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
263
- tcg_fpstatus = get_fpstatus_ptr();
264
+ tcg_fpstatus = get_fpstatus_ptr(false);
265
tcg_shift = tcg_const_i32(fracbits);
266
267
if (is_double) {
268
@@ -XXX,XX +XXX,XX @@ static void handle_3same_float(DisasContext *s, int size, int elements,
269
int fpopcode, int rd, int rn, int rm)
270
{
271
int pass;
272
- TCGv_ptr fpst = get_fpstatus_ptr();
273
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
274
275
for (pass = 0; pass < elements; pass++) {
276
if (size) {
277
@@ -XXX,XX +XXX,XX @@ static void handle_2misc_fcmp_zero(DisasContext *s, int opcode,
278
return;
279
}
280
281
- fpst = get_fpstatus_ptr();
282
+ fpst = get_fpstatus_ptr(false);
283
284
if (is_double) {
285
TCGv_i64 tcg_op = tcg_temp_new_i64();
286
@@ -XXX,XX +XXX,XX @@ static void handle_2misc_reciprocal(DisasContext *s, int opcode,
287
int size, int rn, int rd)
288
{
289
bool is_double = (size == 3);
290
- TCGv_ptr fpst = get_fpstatus_ptr();
291
+ TCGv_ptr fpst = get_fpstatus_ptr(false);
292
293
if (is_double) {
294
TCGv_i64 tcg_op = tcg_temp_new_i64();
295
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn)
296
if (is_fcvt) {
297
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode));
298
gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
299
- tcg_fpstatus = get_fpstatus_ptr();
300
+ tcg_fpstatus = get_fpstatus_ptr(false);
301
} else {
302
tcg_rmode = NULL;
303
tcg_fpstatus = NULL;
304
@@ -XXX,XX +XXX,XX @@ static void handle_simd_3same_pair(DisasContext *s, int is_q, int u, int opcode,
305
306
/* Floating point operations need fpst */
307
if (opcode >= 0x58) {
308
- fpst = get_fpstatus_ptr();
309
+ fpst = get_fpstatus_ptr(false);
310
} else {
311
fpst = NULL;
312
}
313
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn)
314
}
315
316
if (need_fpstatus) {
317
- tcg_fpstatus = get_fpstatus_ptr();
318
+ tcg_fpstatus = get_fpstatus_ptr(false);
319
} else {
320
tcg_fpstatus = NULL;
321
}
322
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
323
}
324
325
if (is_fp) {
326
- fpst = get_fpstatus_ptr();
327
+ fpst = get_fpstatus_ptr(false);
328
} else {
329
fpst = NULL;
330
}
331
--
212
--
332
2.16.2
213
2.16.2
333
214
334
215
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Create an "idau" property on the armv7m container object which
2
we can forward to the CPU object. Annoyingly, we can't use
3
object_property_add_alias() because the CPU object we want to
4
forward to doesn't exist until the armv7m container is realized.
2
5
3
We do implement all the opcodes.
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180220180325.29818-6-peter.maydell@linaro.org
9
---
10
include/hw/arm/armv7m.h | 3 +++
11
hw/arm/armv7m.c | 9 +++++++++
12
2 files changed, 12 insertions(+)
4
13
5
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
14
diff --git a/include/hw/arm/armv7m.h b/include/hw/arm/armv7m.h
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180227143852.11175-8-alex.bennee@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
10
target/arm/translate-a64.c | 3 +--
11
1 file changed, 1 insertion(+), 2 deletions(-)
12
13
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
14
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/translate-a64.c
16
--- a/include/hw/arm/armv7m.h
16
+++ b/target/arm/translate-a64.c
17
+++ b/include/hw/arm/armv7m.h
17
@@ -XXX,XX +XXX,XX @@ static void handle_3same_64(DisasContext *s, int opcode, bool u,
18
@@ -XXX,XX +XXX,XX @@
18
/* Handle 64x64->64 opcodes which are shared between the scalar
19
19
* and vector 3-same groups. We cover every opcode where size == 3
20
#include "hw/sysbus.h"
20
* is valid in either the three-reg-same (integer, not pairwise)
21
#include "hw/intc/armv7m_nvic.h"
21
- * or scalar-three-reg-same groups. (Some opcodes are not yet
22
+#include "target/arm/idau.h"
22
- * implemented.)
23
23
+ * or scalar-three-reg-same groups.
24
#define TYPE_BITBAND "ARM,bitband-memory"
24
*/
25
#define BITBAND(obj) OBJECT_CHECK(BitBandState, (obj), TYPE_BITBAND)
25
TCGCond cond;
26
@@ -XXX,XX +XXX,XX @@ typedef struct {
27
* + Property "memory": MemoryRegion defining the physical address space
28
* that CPU accesses see. (The NVIC, bitbanding and other CPU-internal
29
* devices will be automatically layered on top of this view.)
30
+ * + Property "idau": IDAU interface (forwarded to CPU object)
31
*/
32
typedef struct ARMv7MState {
33
/*< private >*/
34
@@ -XXX,XX +XXX,XX @@ typedef struct ARMv7MState {
35
char *cpu_type;
36
/* MemoryRegion the board provides to us (with its devices, RAM, etc) */
37
MemoryRegion *board_memory;
38
+ Object *idau;
39
} ARMv7MState;
40
41
#endif
42
diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c
43
index XXXXXXX..XXXXXXX 100644
44
--- a/hw/arm/armv7m.c
45
+++ b/hw/arm/armv7m.c
46
@@ -XXX,XX +XXX,XX @@
47
#include "sysemu/qtest.h"
48
#include "qemu/error-report.h"
49
#include "exec/address-spaces.h"
50
+#include "target/arm/idau.h"
51
52
/* Bitbanded IO. Each word corresponds to a single bit. */
53
54
@@ -XXX,XX +XXX,XX @@ static void armv7m_realize(DeviceState *dev, Error **errp)
55
56
object_property_set_link(OBJECT(s->cpu), OBJECT(&s->container), "memory",
57
&error_abort);
58
+ if (object_property_find(OBJECT(s->cpu), "idau", NULL)) {
59
+ object_property_set_link(OBJECT(s->cpu), s->idau, "idau", &err);
60
+ if (err != NULL) {
61
+ error_propagate(errp, err);
62
+ return;
63
+ }
64
+ }
65
object_property_set_bool(OBJECT(s->cpu), true, "realized", &err);
66
if (err != NULL) {
67
error_propagate(errp, err);
68
@@ -XXX,XX +XXX,XX @@ static Property armv7m_properties[] = {
69
DEFINE_PROP_STRING("cpu-type", ARMv7MState, cpu_type),
70
DEFINE_PROP_LINK("memory", ARMv7MState, board_memory, TYPE_MEMORY_REGION,
71
MemoryRegion *),
72
+ DEFINE_PROP_LINK("idau", ARMv7MState, idau, TYPE_IDAU_INTERFACE, Object *),
73
DEFINE_PROP_END_OF_LIST(),
74
};
26
75
27
--
76
--
28
2.16.2
77
2.16.2
29
78
30
79
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
The Cortex-M33 allows the system to specify the reset value of the
2
secure Vector Table Offset Register (VTOR) by asserting config
3
signals. In particular, guest images for the MPS2 AN505 board rely
4
on the MPS2's initial VTOR being correct for that board.
5
Implement a QEMU property so board and SoC code can set the reset
6
value to the correct value.
2
7
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
Message-id: 20180227143852.11175-4-alex.bennee@linaro.org
10
Message-id: 20180220180325.29818-7-peter.maydell@linaro.org
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
---
11
---
8
target/arm/cpu.h | 1 +
12
target/arm/cpu.h | 3 +++
9
1 file changed, 1 insertion(+)
13
target/arm/cpu.c | 18 ++++++++++++++----
14
2 files changed, 17 insertions(+), 4 deletions(-)
10
15
11
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
16
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
12
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
13
--- a/target/arm/cpu.h
18
--- a/target/arm/cpu.h
14
+++ b/target/arm/cpu.h
19
+++ b/target/arm/cpu.h
15
@@ -XXX,XX +XXX,XX @@ typedef struct {
20
@@ -XXX,XX +XXX,XX @@ struct ARMCPU {
16
* Qn = regs[n].d[1]:regs[n].d[0]
21
*/
17
* Dn = regs[n].d[0]
22
uint32_t psci_conduit;
18
* Sn = regs[n].d[0] bits 31..0
23
19
+ * Hn = regs[n].d[0] bits 15..0
24
+ /* For v8M, initial value of the Secure VTOR */
20
*
25
+ uint32_t init_svtor;
21
* This corresponds to the architecturally defined mapping between
26
+
22
* the two execution states, and means we do not need to explicitly
27
/* [QEMU_]KVM_ARM_TARGET_* constant for this CPU, or
28
* QEMU_KVM_ARM_TARGET_NONE if the kernel doesn't support this CPU type.
29
*/
30
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
31
index XXXXXXX..XXXXXXX 100644
32
--- a/target/arm/cpu.c
33
+++ b/target/arm/cpu.c
34
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s)
35
uint32_t initial_msp; /* Loaded from 0x0 */
36
uint32_t initial_pc; /* Loaded from 0x4 */
37
uint8_t *rom;
38
+ uint32_t vecbase;
39
40
if (arm_feature(env, ARM_FEATURE_M_SECURITY)) {
41
env->v7m.secure = true;
42
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s)
43
/* Unlike A/R profile, M profile defines the reset LR value */
44
env->regs[14] = 0xffffffff;
45
46
- /* Load the initial SP and PC from the vector table at address 0 */
47
- rom = rom_ptr(0);
48
+ env->v7m.vecbase[M_REG_S] = cpu->init_svtor & 0xffffff80;
49
+
50
+ /* Load the initial SP and PC from offset 0 and 4 in the vector table */
51
+ vecbase = env->v7m.vecbase[env->v7m.secure];
52
+ rom = rom_ptr(vecbase);
53
if (rom) {
54
/* Address zero is covered by ROM which hasn't yet been
55
* copied into physical memory.
56
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_reset(CPUState *s)
57
* it got copied into memory. In the latter case, rom_ptr
58
* will return a NULL pointer and we should use ldl_phys instead.
59
*/
60
- initial_msp = ldl_phys(s->as, 0);
61
- initial_pc = ldl_phys(s->as, 4);
62
+ initial_msp = ldl_phys(s->as, vecbase);
63
+ initial_pc = ldl_phys(s->as, vecbase + 4);
64
}
65
66
env->regs[13] = initial_msp & 0xFFFFFFFC;
67
@@ -XXX,XX +XXX,XX @@ static Property arm_cpu_pmsav7_dregion_property =
68
pmsav7_dregion,
69
qdev_prop_uint32, uint32_t);
70
71
+/* M profile: initial value of the Secure VTOR */
72
+static Property arm_cpu_initsvtor_property =
73
+ DEFINE_PROP_UINT32("init-svtor", ARMCPU, init_svtor, 0);
74
+
75
static void arm_cpu_post_init(Object *obj)
76
{
77
ARMCPU *cpu = ARM_CPU(obj);
78
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_post_init(Object *obj)
79
qdev_prop_allow_set_link_before_realize,
80
OBJ_PROP_LINK_UNREF_ON_RELEASE,
81
&error_abort);
82
+ qdev_property_add_static(DEVICE(obj), &arm_cpu_initsvtor_property,
83
+ &error_abort);
84
}
85
86
qdev_property_add_static(DEVICE(obj), &arm_cpu_cfgend_property,
23
--
87
--
24
2.16.2
88
2.16.2
25
89
26
90
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Create an "init-svtor" property on the armv7m container
2
object which we can forward to the CPU object.
2
3
3
I only needed to do a little light re-factoring to support the
4
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
half-precision helpers.
5
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
Message-id: 20180220180325.29818-8-peter.maydell@linaro.org
7
---
8
include/hw/arm/armv7m.h | 2 ++
9
hw/arm/armv7m.c | 9 +++++++++
10
2 files changed, 11 insertions(+)
5
11
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
12
diff --git a/include/hw/arm/armv7m.h b/include/hw/arm/armv7m.h
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-30-alex.bennee@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
11
target/arm/translate-a64.c | 80 +++++++++++++++++++++++++++++++---------------
12
1 file changed, 54 insertions(+), 26 deletions(-)
13
14
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
index XXXXXXX..XXXXXXX 100644
13
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/translate-a64.c
14
--- a/include/hw/arm/armv7m.h
17
+++ b/target/arm/translate-a64.c
15
+++ b/include/hw/arm/armv7m.h
18
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn)
16
@@ -XXX,XX +XXX,XX @@ typedef struct {
19
case 0xf: /* FMAXP */
17
* that CPU accesses see. (The NVIC, bitbanding and other CPU-internal
20
case 0x2c: /* FMINNMP */
18
* devices will be automatically layered on top of this view.)
21
case 0x2f: /* FMINP */
19
* + Property "idau": IDAU interface (forwarded to CPU object)
22
- /* FP op, size[0] is 32 or 64 bit */
20
+ * + Property "init-svtor": secure VTOR reset value (forwarded to CPU object)
23
+ /* FP op, size[0] is 32 or 64 bit*/
21
*/
24
if (!u) {
22
typedef struct ARMv7MState {
25
- unallocated_encoding(s);
23
/*< private >*/
26
- return;
24
@@ -XXX,XX +XXX,XX @@ typedef struct ARMv7MState {
27
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
25
/* MemoryRegion the board provides to us (with its devices, RAM, etc) */
28
+ unallocated_encoding(s);
26
MemoryRegion *board_memory;
29
+ return;
27
Object *idau;
30
+ } else {
28
+ uint32_t init_svtor;
31
+ size = MO_16;
29
} ARMv7MState;
32
+ }
30
33
+ } else {
31
#endif
34
+ size = extract32(size, 0, 1) ? MO_64 : MO_32;
32
diff --git a/hw/arm/armv7m.c b/hw/arm/armv7m.c
35
}
33
index XXXXXXX..XXXXXXX 100644
36
+
34
--- a/hw/arm/armv7m.c
37
if (!fp_access_check(s)) {
35
+++ b/hw/arm/armv7m.c
36
@@ -XXX,XX +XXX,XX @@ static void armv7m_realize(DeviceState *dev, Error **errp)
38
return;
37
return;
39
}
38
}
40
41
- size = extract32(size, 0, 1) ? 3 : 2;
42
- fpst = get_fpstatus_ptr(false);
43
+ fpst = get_fpstatus_ptr(size == MO_16);
44
break;
45
default:
46
unallocated_encoding(s);
47
return;
48
}
39
}
49
40
+ if (object_property_find(OBJECT(s->cpu), "init-svtor", NULL)) {
50
- if (size == 3) {
41
+ object_property_set_uint(OBJECT(s->cpu), s->init_svtor,
51
+ if (size == MO_64) {
42
+ "init-svtor", &err);
52
TCGv_i64 tcg_op1 = tcg_temp_new_i64();
43
+ if (err != NULL) {
53
TCGv_i64 tcg_op2 = tcg_temp_new_i64();
44
+ error_propagate(errp, err);
54
TCGv_i64 tcg_res = tcg_temp_new_i64();
45
+ return;
55
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_pairwise(DisasContext *s, uint32_t insn)
46
+ }
56
TCGv_i32 tcg_op2 = tcg_temp_new_i32();
47
+ }
57
TCGv_i32 tcg_res = tcg_temp_new_i32();
48
object_property_set_bool(OBJECT(s->cpu), true, "realized", &err);
58
49
if (err != NULL) {
59
- read_vec_element_i32(s, tcg_op1, rn, 0, MO_32);
50
error_propagate(errp, err);
60
- read_vec_element_i32(s, tcg_op2, rn, 1, MO_32);
51
@@ -XXX,XX +XXX,XX @@ static Property armv7m_properties[] = {
61
+ read_vec_element_i32(s, tcg_op1, rn, 0, size);
52
DEFINE_PROP_LINK("memory", ARMv7MState, board_memory, TYPE_MEMORY_REGION,
62
+ read_vec_element_i32(s, tcg_op2, rn, 1, size);
53
MemoryRegion *),
63
54
DEFINE_PROP_LINK("idau", ARMv7MState, idau, TYPE_IDAU_INTERFACE, Object *),
64
- switch (opcode) {
55
+ DEFINE_PROP_UINT32("init-svtor", ARMv7MState, init_svtor, 0),
65
- case 0xc: /* FMAXNMP */
56
DEFINE_PROP_END_OF_LIST(),
66
- gen_helper_vfp_maxnums(tcg_res, tcg_op1, tcg_op2, fpst);
57
};
67
- break;
58
68
- case 0xd: /* FADDP */
69
- gen_helper_vfp_adds(tcg_res, tcg_op1, tcg_op2, fpst);
70
- break;
71
- case 0xf: /* FMAXP */
72
- gen_helper_vfp_maxs(tcg_res, tcg_op1, tcg_op2, fpst);
73
- break;
74
- case 0x2c: /* FMINNMP */
75
- gen_helper_vfp_minnums(tcg_res, tcg_op1, tcg_op2, fpst);
76
- break;
77
- case 0x2f: /* FMINP */
78
- gen_helper_vfp_mins(tcg_res, tcg_op1, tcg_op2, fpst);
79
- break;
80
- default:
81
- g_assert_not_reached();
82
+ if (size == MO_16) {
83
+ switch (opcode) {
84
+ case 0xc: /* FMAXNMP */
85
+ gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst);
86
+ break;
87
+ case 0xd: /* FADDP */
88
+ gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
89
+ break;
90
+ case 0xf: /* FMAXP */
91
+ gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
92
+ break;
93
+ case 0x2c: /* FMINNMP */
94
+ gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
95
+ break;
96
+ case 0x2f: /* FMINP */
97
+ gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst);
98
+ break;
99
+ default:
100
+ g_assert_not_reached();
101
+ }
102
+ } else {
103
+ switch (opcode) {
104
+ case 0xc: /* FMAXNMP */
105
+ gen_helper_vfp_maxnums(tcg_res, tcg_op1, tcg_op2, fpst);
106
+ break;
107
+ case 0xd: /* FADDP */
108
+ gen_helper_vfp_adds(tcg_res, tcg_op1, tcg_op2, fpst);
109
+ break;
110
+ case 0xf: /* FMAXP */
111
+ gen_helper_vfp_maxs(tcg_res, tcg_op1, tcg_op2, fpst);
112
+ break;
113
+ case 0x2c: /* FMINNMP */
114
+ gen_helper_vfp_minnums(tcg_res, tcg_op1, tcg_op2, fpst);
115
+ break;
116
+ case 0x2f: /* FMINP */
117
+ gen_helper_vfp_mins(tcg_res, tcg_op1, tcg_op2, fpst);
118
+ break;
119
+ default:
120
+ g_assert_not_reached();
121
+ }
122
}
123
124
write_fp_sreg(s, rd, tcg_res);
125
--
59
--
126
2.16.2
60
2.16.2
127
61
128
62
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Add a Cortex-M33 definition. The M33 is an M profile CPU
2
which implements the ARM v8M architecture, including the
3
M profile Security Extension.
2
4
3
This includes FMOV, FABS, FNEG, FSQRT and FRINT[NPMZAXI]. We re-use
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
existing helpers to achieve this.
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180220180325.29818-9-peter.maydell@linaro.org
8
---
9
target/arm/cpu.c | 31 +++++++++++++++++++++++++++++++
10
1 file changed, 31 insertions(+)
5
11
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
12
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-32-alex.bennee@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
11
target/arm/translate-a64.c | 71 ++++++++++++++++++++++++++++++++++++++++++++++
12
1 file changed, 71 insertions(+)
13
14
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
index XXXXXXX..XXXXXXX 100644
13
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/translate-a64.c
14
--- a/target/arm/cpu.c
17
+++ b/target/arm/translate-a64.c
15
+++ b/target/arm/cpu.c
18
@@ -XXX,XX +XXX,XX @@ static void disas_fp_csel(DisasContext *s, uint32_t insn)
16
@@ -XXX,XX +XXX,XX @@ static void cortex_m4_initfn(Object *obj)
19
tcg_temp_free_i64(t_true);
17
cpu->id_isar5 = 0x00000000;
20
}
18
}
21
19
22
+/* Floating-point data-processing (1 source) - half precision */
20
+static void cortex_m33_initfn(Object *obj)
23
+static void handle_fp_1src_half(DisasContext *s, int opcode, int rd, int rn)
24
+{
21
+{
25
+ TCGv_ptr fpst = NULL;
22
+ ARMCPU *cpu = ARM_CPU(obj);
26
+ TCGv_i32 tcg_op = tcg_temp_new_i32();
27
+ TCGv_i32 tcg_res = tcg_temp_new_i32();
28
+
23
+
29
+ read_vec_element_i32(s, tcg_op, rn, 0, MO_16);
24
+ set_feature(&cpu->env, ARM_FEATURE_V8);
30
+
25
+ set_feature(&cpu->env, ARM_FEATURE_M);
31
+ switch (opcode) {
26
+ set_feature(&cpu->env, ARM_FEATURE_M_SECURITY);
32
+ case 0x0: /* FMOV */
27
+ set_feature(&cpu->env, ARM_FEATURE_THUMB_DSP);
33
+ tcg_gen_mov_i32(tcg_res, tcg_op);
28
+ cpu->midr = 0x410fd213; /* r0p3 */
34
+ break;
29
+ cpu->pmsav7_dregion = 16;
35
+ case 0x1: /* FABS */
30
+ cpu->sau_sregion = 8;
36
+ tcg_gen_andi_i32(tcg_res, tcg_op, 0x7fff);
31
+ cpu->id_pfr0 = 0x00000030;
37
+ break;
32
+ cpu->id_pfr1 = 0x00000210;
38
+ case 0x2: /* FNEG */
33
+ cpu->id_dfr0 = 0x00200000;
39
+ tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
34
+ cpu->id_afr0 = 0x00000000;
40
+ break;
35
+ cpu->id_mmfr0 = 0x00101F40;
41
+ case 0x3: /* FSQRT */
36
+ cpu->id_mmfr1 = 0x00000000;
42
+ gen_helper_sqrt_f16(tcg_res, tcg_op, cpu_env);
37
+ cpu->id_mmfr2 = 0x01000000;
43
+ break;
38
+ cpu->id_mmfr3 = 0x00000000;
44
+ case 0x8: /* FRINTN */
39
+ cpu->id_isar0 = 0x01101110;
45
+ case 0x9: /* FRINTP */
40
+ cpu->id_isar1 = 0x02212000;
46
+ case 0xa: /* FRINTM */
41
+ cpu->id_isar2 = 0x20232232;
47
+ case 0xb: /* FRINTZ */
42
+ cpu->id_isar3 = 0x01111131;
48
+ case 0xc: /* FRINTA */
43
+ cpu->id_isar4 = 0x01310132;
49
+ {
44
+ cpu->id_isar5 = 0x00000000;
50
+ TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7));
45
+ cpu->clidr = 0x00000000;
51
+ fpst = get_fpstatus_ptr(true);
46
+ cpu->ctr = 0x8000c000;
52
+
53
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
54
+ gen_helper_advsimd_rinth(tcg_res, tcg_op, fpst);
55
+
56
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
57
+ tcg_temp_free_i32(tcg_rmode);
58
+ break;
59
+ }
60
+ case 0xe: /* FRINTX */
61
+ fpst = get_fpstatus_ptr(true);
62
+ gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, fpst);
63
+ break;
64
+ case 0xf: /* FRINTI */
65
+ fpst = get_fpstatus_ptr(true);
66
+ gen_helper_advsimd_rinth(tcg_res, tcg_op, fpst);
67
+ break;
68
+ default:
69
+ abort();
70
+ }
71
+
72
+ write_fp_sreg(s, rd, tcg_res);
73
+
74
+ if (fpst) {
75
+ tcg_temp_free_ptr(fpst);
76
+ }
77
+ tcg_temp_free_i32(tcg_op);
78
+ tcg_temp_free_i32(tcg_res);
79
+}
47
+}
80
+
48
+
81
/* Floating-point data-processing (1 source) - single precision */
49
static void arm_v7m_class_init(ObjectClass *oc, void *data)
82
static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn)
83
{
50
{
84
@@ -XXX,XX +XXX,XX @@ static void disas_fp_1src(DisasContext *s, uint32_t insn)
51
CPUClass *cc = CPU_CLASS(oc);
85
52
@@ -XXX,XX +XXX,XX @@ static const ARMCPUInfo arm_cpus[] = {
86
handle_fp_1src_double(s, opcode, rd, rn);
53
.class_init = arm_v7m_class_init },
87
break;
54
{ .name = "cortex-m4", .initfn = cortex_m4_initfn,
88
+ case 3:
55
.class_init = arm_v7m_class_init },
89
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
56
+ { .name = "cortex-m33", .initfn = cortex_m33_initfn,
90
+ unallocated_encoding(s);
57
+ .class_init = arm_v7m_class_init },
91
+ return;
58
{ .name = "cortex-r5", .initfn = cortex_r5_initfn },
92
+ }
59
{ .name = "cortex-a7", .initfn = cortex_a7_initfn },
93
+
60
{ .name = "cortex-a8", .initfn = cortex_a8_initfn },
94
+ if (!fp_access_check(s)) {
95
+ return;
96
+ }
97
+
98
+ handle_fp_1src_half(s, opcode, rd, rn);
99
+ break;
100
default:
101
unallocated_encoding(s);
102
}
103
--
61
--
104
2.16.2
62
2.16.2
105
63
106
64
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Move the definition of the struct for the unimplemented-device
2
from unimp.c to unimp.h, so that users can embed the struct
3
in their own device structs if they prefer.
2
4
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
Message-id: 20180227143852.11175-28-alex.bennee@linaro.org
8
Message-id: 20180220180325.29818-10-peter.maydell@linaro.org
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
---
9
---
8
target/arm/translate-a64.c | 7 +++++++
10
include/hw/misc/unimp.h | 10 ++++++++++
9
1 file changed, 7 insertions(+)
11
hw/misc/unimp.c | 10 ----------
12
2 files changed, 10 insertions(+), 10 deletions(-)
10
13
11
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
14
diff --git a/include/hw/misc/unimp.h b/include/hw/misc/unimp.h
12
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
13
--- a/target/arm/translate-a64.c
16
--- a/include/hw/misc/unimp.h
14
+++ b/target/arm/translate-a64.c
17
+++ b/include/hw/misc/unimp.h
15
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
18
@@ -XXX,XX +XXX,XX @@
16
case 0x6f: /* FNEG */
19
17
need_fpst = false;
20
#define TYPE_UNIMPLEMENTED_DEVICE "unimplemented-device"
18
break;
21
19
+ case 0x7d: /* FRSQRTE */
22
+#define UNIMPLEMENTED_DEVICE(obj) \
20
case 0x7f: /* FSQRT (vector) */
23
+ OBJECT_CHECK(UnimplementedDeviceState, (obj), TYPE_UNIMPLEMENTED_DEVICE)
21
break;
24
+
22
default:
25
+typedef struct {
23
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
26
+ SysBusDevice parent_obj;
24
case 0x6f: /* FNEG */
27
+ MemoryRegion iomem;
25
tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
28
+ char *name;
26
break;
29
+ uint64_t size;
27
+ case 0x7d: /* FRSQRTE */
30
+} UnimplementedDeviceState;
28
+ gen_helper_rsqrte_f16(tcg_res, tcg_op, tcg_fpstatus);
31
+
29
+ break;
32
/**
30
default:
33
* create_unimplemented_device: create and map a dummy device
31
g_assert_not_reached();
34
* @name: name of the device for debug logging
32
}
35
diff --git a/hw/misc/unimp.c b/hw/misc/unimp.c
33
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
36
index XXXXXXX..XXXXXXX 100644
34
case 0x6f: /* FNEG */
37
--- a/hw/misc/unimp.c
35
tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
38
+++ b/hw/misc/unimp.c
36
break;
39
@@ -XXX,XX +XXX,XX @@
37
+ case 0x7d: /* FRSQRTE */
40
#include "qemu/log.h"
38
+ gen_helper_rsqrte_f16(tcg_res, tcg_op, tcg_fpstatus);
41
#include "qapi/error.h"
39
+ break;
42
40
case 0x7f: /* FSQRT */
43
-#define UNIMPLEMENTED_DEVICE(obj) \
41
gen_helper_sqrt_f16(tcg_res, tcg_op, tcg_fpstatus);
44
- OBJECT_CHECK(UnimplementedDeviceState, (obj), TYPE_UNIMPLEMENTED_DEVICE)
42
break;
45
-
46
-typedef struct {
47
- SysBusDevice parent_obj;
48
- MemoryRegion iomem;
49
- char *name;
50
- uint64_t size;
51
-} UnimplementedDeviceState;
52
-
53
static uint64_t unimp_read(void *opaque, hwaddr offset, unsigned size)
54
{
55
UnimplementedDeviceState *s = UNIMPLEMENTED_DEVICE(opaque);
43
--
56
--
44
2.16.2
57
2.16.2
45
58
46
59
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
The or-irq.h header file is missing the customary guard against
2
multiple inclusion, which means compilation fails if it gets
3
included twice. Fix the omission.
2
4
3
Now we have added f16 during the re-factoring we can simply call the
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
helper.
6
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180220180325.29818-11-peter.maydell@linaro.org
9
---
10
include/hw/or-irq.h | 5 +++++
11
1 file changed, 5 insertions(+)
5
12
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
13
diff --git a/include/hw/or-irq.h b/include/hw/or-irq.h
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-24-alex.bennee@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
11
target/arm/translate-a64.c | 8 ++++++++
12
1 file changed, 8 insertions(+)
13
14
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/translate-a64.c
15
--- a/include/hw/or-irq.h
17
+++ b/target/arm/translate-a64.c
16
+++ b/include/hw/or-irq.h
18
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
17
@@ -XXX,XX +XXX,XX @@
19
case 0x6d: /* FCMLE (zero) */
18
* THE SOFTWARE.
20
handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd);
19
*/
21
return;
20
22
+ case 0x3d: /* FRECPE */
21
+#ifndef HW_OR_IRQ_H
23
+ break;
22
+#define HW_OR_IRQ_H
24
case 0x18: /* FRINTN */
23
+
25
need_rmode = true;
24
#include "hw/irq.h"
26
only_in_vector = true;
25
#include "hw/sysbus.h"
27
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
26
#include "qom/object.h"
28
case 0x3b: /* FCVTZS */
27
@@ -XXX,XX +XXX,XX @@ struct OrIRQState {
29
gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus);
28
bool levels[MAX_OR_LINES];
30
break;
29
uint16_t num_lines;
31
+ case 0x3d: /* FRECPE */
30
};
32
+ gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus);
31
+
33
+ break;
32
+#endif
34
case 0x5a: /* FCVTNU */
35
case 0x5b: /* FCVTMU */
36
case 0x5c: /* FCVTAU */
37
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
38
case 0x3b: /* FCVTZS */
39
gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus);
40
break;
41
+ case 0x3d: /* FRECPE */
42
+ gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus);
43
+ break;
44
case 0x5a: /* FCVTNU */
45
case 0x5b: /* FCVTMU */
46
case 0x5c: /* FCVTAU */
47
--
33
--
48
2.16.2
34
2.16.2
49
35
50
36
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
The function qdev_init_gpio_in_named() passes the DeviceState pointer
2
as the opaque data pointor for the irq handler function. Usually
3
this is what you want, but in some cases it would be helpful to use
4
some other data pointer.
2
5
3
The fprintf is only there for debugging as the skeleton is added to,
6
Add a new function qdev_init_gpio_in_named_with_opaque() which allows
4
it will be removed once the skeleton is complete.
7
the caller to specify the data pointer they want.
5
8
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
11
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-10-alex.bennee@linaro.org
12
Message-id: 20180220180325.29818-12-peter.maydell@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
13
---
11
target/arm/helper-a64.h | 4 ++++
14
include/hw/qdev-core.h | 30 ++++++++++++++++++++++++++++--
12
target/arm/helper-a64.c | 4 ++++
15
hw/core/qdev.c | 8 +++++---
13
target/arm/translate-a64.c | 28 ++++++++++++++++++++++++++++
16
2 files changed, 33 insertions(+), 5 deletions(-)
14
3 files changed, 36 insertions(+)
15
17
16
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
18
diff --git a/include/hw/qdev-core.h b/include/hw/qdev-core.h
17
index XXXXXXX..XXXXXXX 100644
19
index XXXXXXX..XXXXXXX 100644
18
--- a/target/arm/helper-a64.h
20
--- a/include/hw/qdev-core.h
19
+++ b/target/arm/helper-a64.h
21
+++ b/include/hw/qdev-core.h
20
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(advsimd_maxh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
22
@@ -XXX,XX +XXX,XX @@ BusState *qdev_get_child_bus(DeviceState *dev, const char *name);
21
DEF_HELPER_FLAGS_3(advsimd_minh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
23
/* GPIO inputs also double as IRQ sinks. */
22
DEF_HELPER_FLAGS_3(advsimd_maxnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
24
void qdev_init_gpio_in(DeviceState *dev, qemu_irq_handler handler, int n);
23
DEF_HELPER_FLAGS_3(advsimd_minnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
25
void qdev_init_gpio_out(DeviceState *dev, qemu_irq *pins, int n);
24
+DEF_HELPER_3(advsimd_addh, f16, f16, f16, ptr)
26
-void qdev_init_gpio_in_named(DeviceState *dev, qemu_irq_handler handler,
25
+DEF_HELPER_3(advsimd_subh, f16, f16, f16, ptr)
27
- const char *name, int n);
26
+DEF_HELPER_3(advsimd_mulh, f16, f16, f16, ptr)
28
void qdev_init_gpio_out_named(DeviceState *dev, qemu_irq *pins,
27
+DEF_HELPER_3(advsimd_divh, f16, f16, f16, ptr)
29
const char *name, int n);
28
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
30
+/**
31
+ * qdev_init_gpio_in_named_with_opaque: create an array of input GPIO lines
32
+ * for the specified device
33
+ *
34
+ * @dev: Device to create input GPIOs for
35
+ * @handler: Function to call when GPIO line value is set
36
+ * @opaque: Opaque data pointer to pass to @handler
37
+ * @name: Name of the GPIO input (must be unique for this device)
38
+ * @n: Number of GPIO lines in this input set
39
+ */
40
+void qdev_init_gpio_in_named_with_opaque(DeviceState *dev,
41
+ qemu_irq_handler handler,
42
+ void *opaque,
43
+ const char *name, int n);
44
+
45
+/**
46
+ * qdev_init_gpio_in_named: create an array of input GPIO lines
47
+ * for the specified device
48
+ *
49
+ * Like qdev_init_gpio_in_named_with_opaque(), but the opaque pointer
50
+ * passed to the handler is @dev (which is the most commonly desired behaviour).
51
+ */
52
+static inline void qdev_init_gpio_in_named(DeviceState *dev,
53
+ qemu_irq_handler handler,
54
+ const char *name, int n)
55
+{
56
+ qdev_init_gpio_in_named_with_opaque(dev, handler, dev, name, n);
57
+}
58
59
void qdev_pass_gpios(DeviceState *dev, DeviceState *container,
60
const char *name);
61
diff --git a/hw/core/qdev.c b/hw/core/qdev.c
29
index XXXXXXX..XXXXXXX 100644
62
index XXXXXXX..XXXXXXX 100644
30
--- a/target/arm/helper-a64.c
63
--- a/hw/core/qdev.c
31
+++ b/target/arm/helper-a64.c
64
+++ b/hw/core/qdev.c
32
@@ -XXX,XX +XXX,XX @@ float16 ADVSIMD_HELPER(name, h)(float16 a, float16 b, void *fpstp) \
65
@@ -XXX,XX +XXX,XX @@ static NamedGPIOList *qdev_get_named_gpio_list(DeviceState *dev,
33
return float16_ ## name(a, b, fpst); \
66
return ngl;
34
}
67
}
35
68
36
+ADVSIMD_HALFOP(add)
69
-void qdev_init_gpio_in_named(DeviceState *dev, qemu_irq_handler handler,
37
+ADVSIMD_HALFOP(sub)
70
- const char *name, int n)
38
+ADVSIMD_HALFOP(mul)
71
+void qdev_init_gpio_in_named_with_opaque(DeviceState *dev,
39
+ADVSIMD_HALFOP(div)
72
+ qemu_irq_handler handler,
40
ADVSIMD_HALFOP(min)
73
+ void *opaque,
41
ADVSIMD_HALFOP(max)
74
+ const char *name, int n)
42
ADVSIMD_HALFOP(minnum)
75
{
43
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
76
int i;
44
index XXXXXXX..XXXXXXX 100644
77
NamedGPIOList *gpio_list = qdev_get_named_gpio_list(dev, name);
45
--- a/target/arm/translate-a64.c
78
46
+++ b/target/arm/translate-a64.c
79
assert(gpio_list->num_out == 0 || !name);
47
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
80
gpio_list->in = qemu_extend_irqs(gpio_list->in, gpio_list->num_in, handler,
48
read_vec_element_i32(s, tcg_op2, rm, pass, MO_16);
81
- dev, n);
49
82
+ opaque, n);
50
switch (fpopcode) {
83
51
+ case 0x0: /* FMAXNM */
84
if (!name) {
52
+ gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst);
85
name = "unnamed-gpio-in";
53
+ break;
54
+ case 0x2: /* FADD */
55
+ gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
56
+ break;
57
+ case 0x6: /* FMAX */
58
+ gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
59
+ break;
60
+ case 0x8: /* FMINNM */
61
+ gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
62
+ break;
63
+ case 0xa: /* FSUB */
64
+ gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
65
+ break;
66
+ case 0xe: /* FMIN */
67
+ gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst);
68
+ break;
69
+ case 0x13: /* FMUL */
70
+ gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst);
71
+ break;
72
+ case 0x17: /* FDIV */
73
+ gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst);
74
+ break;
75
+ case 0x1a: /* FABD */
76
+ gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
77
+ tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff);
78
+ break;
79
default:
80
fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n",
81
__func__, insn, fpopcode, s->pc);
82
--
86
--
83
2.16.2
87
2.16.2
84
88
85
89
diff view generated by jsdifflib
1
From: Corey Minyard <cminyard@mvista.com>
1
In some board or SoC models it is necessary to split a qemu_irq line
2
2
so that one input can feed multiple outputs. We currently have
3
Some devices need access to it.
3
qemu_irq_split() for this, but that has several deficiencies:
4
4
* it can only handle splitting a line into two
5
Signed-off-by: Corey Minyard <cminyard@mvista.com>
5
* it unavoidably leaks memory, so it can't be used
6
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
6
in a device that can be deleted
7
Signed-off-by: Linus Walleij <linus.walleij@linaro.org>
7
8
Message-id: 20180227104903.21353-3-linus.walleij@linaro.org
8
Implement a qdev device that encapsulates splitting of IRQs, with a
9
configurable number of outputs. (This is in some ways the inverse of
10
the TYPE_OR_IRQ device.)
11
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
12
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
13
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
14
Message-id: 20180220180325.29818-13-peter.maydell@linaro.org
10
---
15
---
11
include/hw/i2c/i2c.h | 17 +++++++++++++++++
16
hw/core/Makefile.objs | 1 +
12
hw/i2c/core.c | 17 -----------------
17
include/hw/core/split-irq.h | 57 +++++++++++++++++++++++++++++
13
2 files changed, 17 insertions(+), 17 deletions(-)
18
include/hw/irq.h | 4 +-
14
19
hw/core/split-irq.c | 89 +++++++++++++++++++++++++++++++++++++++++++++
15
diff --git a/include/hw/i2c/i2c.h b/include/hw/i2c/i2c.h
20
4 files changed, 150 insertions(+), 1 deletion(-)
21
create mode 100644 include/hw/core/split-irq.h
22
create mode 100644 hw/core/split-irq.c
23
24
diff --git a/hw/core/Makefile.objs b/hw/core/Makefile.objs
16
index XXXXXXX..XXXXXXX 100644
25
index XXXXXXX..XXXXXXX 100644
17
--- a/include/hw/i2c/i2c.h
26
--- a/hw/core/Makefile.objs
18
+++ b/include/hw/i2c/i2c.h
27
+++ b/hw/core/Makefile.objs
19
@@ -XXX,XX +XXX,XX @@ struct I2CSlave {
28
@@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_FITLOADER) += loader-fit.o
20
uint8_t address;
29
common-obj-$(CONFIG_SOFTMMU) += qdev-properties-system.o
21
};
30
common-obj-$(CONFIG_SOFTMMU) += register.o
22
31
common-obj-$(CONFIG_SOFTMMU) += or-irq.o
23
+#define TYPE_I2C_BUS "i2c-bus"
32
+common-obj-$(CONFIG_SOFTMMU) += split-irq.o
24
+#define I2C_BUS(obj) OBJECT_CHECK(I2CBus, (obj), TYPE_I2C_BUS)
33
common-obj-$(CONFIG_PLATFORM_BUS) += platform-bus.o
25
+
34
26
+typedef struct I2CNode I2CNode;
35
obj-$(CONFIG_SOFTMMU) += generic-loader.o
27
+
36
diff --git a/include/hw/core/split-irq.h b/include/hw/core/split-irq.h
28
+struct I2CNode {
37
new file mode 100644
29
+ I2CSlave *elt;
38
index XXXXXXX..XXXXXXX
30
+ QLIST_ENTRY(I2CNode) next;
39
--- /dev/null
40
+++ b/include/hw/core/split-irq.h
41
@@ -XXX,XX +XXX,XX @@
42
+/*
43
+ * IRQ splitter device.
44
+ *
45
+ * Copyright (c) 2018 Linaro Limited.
46
+ * Written by Peter Maydell
47
+ *
48
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
49
+ * of this software and associated documentation files (the "Software"), to deal
50
+ * in the Software without restriction, including without limitation the rights
51
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
52
+ * copies of the Software, and to permit persons to whom the Software is
53
+ * furnished to do so, subject to the following conditions:
54
+ *
55
+ * The above copyright notice and this permission notice shall be included in
56
+ * all copies or substantial portions of the Software.
57
+ *
58
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
59
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
60
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
61
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
62
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
63
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
64
+ * THE SOFTWARE.
65
+ */
66
+
67
+/* This is a simple device which has one GPIO input line and multiple
68
+ * GPIO output lines. Any change on the input line is forwarded to all
69
+ * of the outputs.
70
+ *
71
+ * QEMU interface:
72
+ * + one unnamed GPIO input: the input line
73
+ * + N unnamed GPIO outputs: the output lines
74
+ * + QOM property "num-lines": sets the number of output lines
75
+ */
76
+#ifndef HW_SPLIT_IRQ_H
77
+#define HW_SPLIT_IRQ_H
78
+
79
+#include "hw/irq.h"
80
+#include "hw/sysbus.h"
81
+#include "qom/object.h"
82
+
83
+#define TYPE_SPLIT_IRQ "split-irq"
84
+
85
+#define MAX_SPLIT_LINES 16
86
+
87
+typedef struct SplitIRQ SplitIRQ;
88
+
89
+#define SPLIT_IRQ(obj) OBJECT_CHECK(SplitIRQ, (obj), TYPE_SPLIT_IRQ)
90
+
91
+struct SplitIRQ {
92
+ DeviceState parent_obj;
93
+
94
+ qemu_irq out_irq[MAX_SPLIT_LINES];
95
+ uint16_t num_lines;
31
+};
96
+};
32
+
97
+
33
+struct I2CBus {
98
+#endif
34
+ BusState qbus;
99
diff --git a/include/hw/irq.h b/include/hw/irq.h
35
+ QLIST_HEAD(, I2CNode) current_devs;
100
index XXXXXXX..XXXXXXX 100644
36
+ uint8_t saved_address;
101
--- a/include/hw/irq.h
37
+ bool broadcast;
102
+++ b/include/hw/irq.h
103
@@ -XXX,XX +XXX,XX @@ void qemu_free_irq(qemu_irq irq);
104
/* Returns a new IRQ with opposite polarity. */
105
qemu_irq qemu_irq_invert(qemu_irq irq);
106
107
-/* Returns a new IRQ which feeds into both the passed IRQs */
108
+/* Returns a new IRQ which feeds into both the passed IRQs.
109
+ * It's probably better to use the TYPE_SPLIT_IRQ device instead.
110
+ */
111
qemu_irq qemu_irq_split(qemu_irq irq1, qemu_irq irq2);
112
113
/* Returns a new IRQ set which connects 1:1 to another IRQ set, which
114
diff --git a/hw/core/split-irq.c b/hw/core/split-irq.c
115
new file mode 100644
116
index XXXXXXX..XXXXXXX
117
--- /dev/null
118
+++ b/hw/core/split-irq.c
119
@@ -XXX,XX +XXX,XX @@
120
+/*
121
+ * IRQ splitter device.
122
+ *
123
+ * Copyright (c) 2018 Linaro Limited.
124
+ * Written by Peter Maydell
125
+ *
126
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
127
+ * of this software and associated documentation files (the "Software"), to deal
128
+ * in the Software without restriction, including without limitation the rights
129
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
130
+ * copies of the Software, and to permit persons to whom the Software is
131
+ * furnished to do so, subject to the following conditions:
132
+ *
133
+ * The above copyright notice and this permission notice shall be included in
134
+ * all copies or substantial portions of the Software.
135
+ *
136
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
137
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
138
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
139
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
140
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
141
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
142
+ * THE SOFTWARE.
143
+ */
144
+
145
+#include "qemu/osdep.h"
146
+#include "hw/core/split-irq.h"
147
+#include "qapi/error.h"
148
+
149
+static void split_irq_handler(void *opaque, int n, int level)
150
+{
151
+ SplitIRQ *s = SPLIT_IRQ(opaque);
152
+ int i;
153
+
154
+ for (i = 0; i < s->num_lines; i++) {
155
+ qemu_set_irq(s->out_irq[i], level);
156
+ }
157
+}
158
+
159
+static void split_irq_init(Object *obj)
160
+{
161
+ qdev_init_gpio_in(DEVICE(obj), split_irq_handler, 1);
162
+}
163
+
164
+static void split_irq_realize(DeviceState *dev, Error **errp)
165
+{
166
+ SplitIRQ *s = SPLIT_IRQ(dev);
167
+
168
+ if (s->num_lines < 1 || s->num_lines >= MAX_SPLIT_LINES) {
169
+ error_setg(errp,
170
+ "IRQ splitter number of lines %d is not between 1 and %d",
171
+ s->num_lines, MAX_SPLIT_LINES);
172
+ return;
173
+ }
174
+
175
+ qdev_init_gpio_out(dev, s->out_irq, s->num_lines);
176
+}
177
+
178
+static Property split_irq_properties[] = {
179
+ DEFINE_PROP_UINT16("num-lines", SplitIRQ, num_lines, 1),
180
+ DEFINE_PROP_END_OF_LIST(),
38
+};
181
+};
39
+
182
+
40
I2CBus *i2c_init_bus(DeviceState *parent, const char *name);
183
+static void split_irq_class_init(ObjectClass *klass, void *data)
41
void i2c_set_slave_address(I2CSlave *dev, uint8_t address);
184
+{
42
int i2c_bus_busy(I2CBus *bus);
185
+ DeviceClass *dc = DEVICE_CLASS(klass);
43
diff --git a/hw/i2c/core.c b/hw/i2c/core.c
186
+
44
index XXXXXXX..XXXXXXX 100644
187
+ /* No state to reset or migrate */
45
--- a/hw/i2c/core.c
188
+ dc->props = split_irq_properties;
46
+++ b/hw/i2c/core.c
189
+ dc->realize = split_irq_realize;
47
@@ -XXX,XX +XXX,XX @@
190
+
48
#include "qemu/osdep.h"
191
+ /* Reason: Needs to be wired up to work */
49
#include "hw/i2c/i2c.h"
192
+ dc->user_creatable = false;
50
193
+}
51
-typedef struct I2CNode I2CNode;
194
+
52
-
195
+static const TypeInfo split_irq_type_info = {
53
-struct I2CNode {
196
+ .name = TYPE_SPLIT_IRQ,
54
- I2CSlave *elt;
197
+ .parent = TYPE_DEVICE,
55
- QLIST_ENTRY(I2CNode) next;
198
+ .instance_size = sizeof(SplitIRQ),
56
-};
199
+ .instance_init = split_irq_init,
57
-
200
+ .class_init = split_irq_class_init,
58
#define I2C_BROADCAST 0x00
201
+};
59
202
+
60
-struct I2CBus {
203
+static void split_irq_register_types(void)
61
- BusState qbus;
204
+{
62
- QLIST_HEAD(, I2CNode) current_devs;
205
+ type_register_static(&split_irq_type_info);
63
- uint8_t saved_address;
206
+}
64
- bool broadcast;
207
+
65
-};
208
+type_init(split_irq_register_types)
66
-
67
static Property i2c_props[] = {
68
DEFINE_PROP_UINT8("address", struct I2CSlave, address, 0),
69
DEFINE_PROP_END_OF_LIST(),
70
};
71
72
-#define TYPE_I2C_BUS "i2c-bus"
73
-#define I2C_BUS(obj) OBJECT_CHECK(I2CBus, (obj), TYPE_I2C_BUS)
74
-
75
static const TypeInfo i2c_bus_info = {
76
.name = TYPE_I2C_BUS,
77
.parent = TYPE_BUS,
78
--
209
--
79
2.16.2
210
2.16.2
80
211
81
212
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
The MPS2 AN505 FPGA image includes a "FPGA control block"
2
2
which is a small set of registers handling LEDs, buttons
3
This includes FMAXNMP, FADDP, FMAXP, FMINNMP, FMINP.
3
and some counters.
4
4
5
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180227143852.11175-14-alex.bennee@linaro.org
7
Message-id: 20180220180325.29818-14-peter.maydell@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
8
---
10
target/arm/translate-a64.c | 208 +++++++++++++++++++++++++++++----------------
9
hw/misc/Makefile.objs | 1 +
11
1 file changed, 133 insertions(+), 75 deletions(-)
10
include/hw/misc/mps2-fpgaio.h | 43 ++++++++++
12
11
hw/misc/mps2-fpgaio.c | 176 ++++++++++++++++++++++++++++++++++++++++
13
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
12
default-configs/arm-softmmu.mak | 1 +
13
hw/misc/trace-events | 6 ++
14
5 files changed, 227 insertions(+)
15
create mode 100644 include/hw/misc/mps2-fpgaio.h
16
create mode 100644 hw/misc/mps2-fpgaio.c
17
18
diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs
14
index XXXXXXX..XXXXXXX 100644
19
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/translate-a64.c
20
--- a/hw/misc/Makefile.objs
16
+++ b/target/arm/translate-a64.c
21
+++ b/hw/misc/Makefile.objs
17
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
22
@@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_STM32F2XX_SYSCFG) += stm32f2xx_syscfg.o
18
int datasize, elements;
23
obj-$(CONFIG_MIPS_CPS) += mips_cmgcr.o
19
int pass;
24
obj-$(CONFIG_MIPS_CPS) += mips_cpc.o
20
TCGv_ptr fpst;
25
obj-$(CONFIG_MIPS_ITU) += mips_itu.o
21
+ bool pairwise = false;
26
+obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o
22
27
obj-$(CONFIG_MPS2_SCC) += mps2-scc.o
23
if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
28
24
unallocated_encoding(s);
29
obj-$(CONFIG_PVPANIC) += pvpanic.o
25
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
30
diff --git a/include/hw/misc/mps2-fpgaio.h b/include/hw/misc/mps2-fpgaio.h
26
datasize = is_q ? 128 : 64;
31
new file mode 100644
27
elements = datasize / 16;
32
index XXXXXXX..XXXXXXX
28
33
--- /dev/null
29
+ switch (fpopcode) {
34
+++ b/include/hw/misc/mps2-fpgaio.h
30
+ case 0x10: /* FMAXNMP */
35
@@ -XXX,XX +XXX,XX @@
31
+ case 0x12: /* FADDP */
36
+/*
32
+ case 0x16: /* FMAXP */
37
+ * ARM MPS2 FPGAIO emulation
33
+ case 0x18: /* FMINNMP */
38
+ *
34
+ case 0x1e: /* FMINP */
39
+ * Copyright (c) 2018 Linaro Limited
35
+ pairwise = true;
40
+ * Written by Peter Maydell
41
+ *
42
+ * This program is free software; you can redistribute it and/or modify
43
+ * it under the terms of the GNU General Public License version 2 or
44
+ * (at your option) any later version.
45
+ */
46
+
47
+/* This is a model of the FPGAIO register block in the AN505
48
+ * FPGA image for the MPS2 dev board; it is documented in the
49
+ * application note:
50
+ * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html
51
+ *
52
+ * QEMU interface:
53
+ * + sysbus MMIO region 0: the register bank
54
+ */
55
+
56
+#ifndef MPS2_FPGAIO_H
57
+#define MPS2_FPGAIO_H
58
+
59
+#include "hw/sysbus.h"
60
+
61
+#define TYPE_MPS2_FPGAIO "mps2-fpgaio"
62
+#define MPS2_FPGAIO(obj) OBJECT_CHECK(MPS2FPGAIO, (obj), TYPE_MPS2_FPGAIO)
63
+
64
+typedef struct {
65
+ /*< private >*/
66
+ SysBusDevice parent_obj;
67
+
68
+ /*< public >*/
69
+ MemoryRegion iomem;
70
+
71
+ uint32_t led0;
72
+ uint32_t prescale;
73
+ uint32_t misc;
74
+
75
+ uint32_t prescale_clk;
76
+} MPS2FPGAIO;
77
+
78
+#endif
79
diff --git a/hw/misc/mps2-fpgaio.c b/hw/misc/mps2-fpgaio.c
80
new file mode 100644
81
index XXXXXXX..XXXXXXX
82
--- /dev/null
83
+++ b/hw/misc/mps2-fpgaio.c
84
@@ -XXX,XX +XXX,XX @@
85
+/*
86
+ * ARM MPS2 AN505 FPGAIO emulation
87
+ *
88
+ * Copyright (c) 2018 Linaro Limited
89
+ * Written by Peter Maydell
90
+ *
91
+ * This program is free software; you can redistribute it and/or modify
92
+ * it under the terms of the GNU General Public License version 2 or
93
+ * (at your option) any later version.
94
+ */
95
+
96
+/* This is a model of the "FPGA system control and I/O" block found
97
+ * in the AN505 FPGA image for the MPS2 devboard.
98
+ * It is documented in AN505:
99
+ * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html
100
+ */
101
+
102
+#include "qemu/osdep.h"
103
+#include "qemu/log.h"
104
+#include "qapi/error.h"
105
+#include "trace.h"
106
+#include "hw/sysbus.h"
107
+#include "hw/registerfields.h"
108
+#include "hw/misc/mps2-fpgaio.h"
109
+
110
+REG32(LED0, 0)
111
+REG32(BUTTON, 8)
112
+REG32(CLK1HZ, 0x10)
113
+REG32(CLK100HZ, 0x14)
114
+REG32(COUNTER, 0x18)
115
+REG32(PRESCALE, 0x1c)
116
+REG32(PSCNTR, 0x20)
117
+REG32(MISC, 0x4c)
118
+
119
+static uint64_t mps2_fpgaio_read(void *opaque, hwaddr offset, unsigned size)
120
+{
121
+ MPS2FPGAIO *s = MPS2_FPGAIO(opaque);
122
+ uint64_t r;
123
+
124
+ switch (offset) {
125
+ case A_LED0:
126
+ r = s->led0;
127
+ break;
128
+ case A_BUTTON:
129
+ /* User-pressable board buttons. We don't model that, so just return
130
+ * zeroes.
131
+ */
132
+ r = 0;
133
+ break;
134
+ case A_PRESCALE:
135
+ r = s->prescale;
136
+ break;
137
+ case A_MISC:
138
+ r = s->misc;
139
+ break;
140
+ case A_CLK1HZ:
141
+ case A_CLK100HZ:
142
+ case A_COUNTER:
143
+ case A_PSCNTR:
144
+ /* These are all upcounters of various frequencies. */
145
+ qemu_log_mask(LOG_UNIMP, "MPS2 FPGAIO: counters unimplemented\n");
146
+ r = 0;
147
+ break;
148
+ default:
149
+ qemu_log_mask(LOG_GUEST_ERROR,
150
+ "MPS2 FPGAIO read: bad offset %x\n", (int) offset);
151
+ r = 0;
36
+ break;
152
+ break;
37
+ }
153
+ }
38
+
154
+
39
fpst = get_fpstatus_ptr(true);
155
+ trace_mps2_fpgaio_read(offset, r, size);
40
156
+ return r;
41
- for (pass = 0; pass < elements; pass++) {
157
+}
42
+ if (pairwise) {
158
+
43
+ int maxpass = is_q ? 8 : 4;
159
+static void mps2_fpgaio_write(void *opaque, hwaddr offset, uint64_t value,
44
TCGv_i32 tcg_op1 = tcg_temp_new_i32();
160
+ unsigned size)
45
TCGv_i32 tcg_op2 = tcg_temp_new_i32();
161
+{
46
- TCGv_i32 tcg_res = tcg_temp_new_i32();
162
+ MPS2FPGAIO *s = MPS2_FPGAIO(opaque);
47
+ TCGv_i32 tcg_res[8];
163
+
48
164
+ trace_mps2_fpgaio_write(offset, value, size);
49
- read_vec_element_i32(s, tcg_op1, rn, pass, MO_16);
165
+
50
- read_vec_element_i32(s, tcg_op2, rm, pass, MO_16);
166
+ switch (offset) {
51
+ for (pass = 0; pass < maxpass; pass++) {
167
+ case A_LED0:
52
+ int passreg = pass < (maxpass / 2) ? rn : rm;
168
+ /* LED bits [1:0] control board LEDs. We don't currently have
53
+ int passelt = (pass << 1) & (maxpass - 1);
169
+ * a mechanism for displaying this graphically, so use a trace event.
54
170
+ */
55
- switch (fpopcode) {
171
+ trace_mps2_fpgaio_leds(value & 0x02 ? '*' : '.',
56
- case 0x0: /* FMAXNM */
172
+ value & 0x01 ? '*' : '.');
57
- gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst);
173
+ s->led0 = value & 0x3;
58
- break;
174
+ break;
59
- case 0x1: /* FMLA */
175
+ case A_PRESCALE:
60
- read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
176
+ s->prescale = value;
61
- gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
177
+ break;
62
- fpst);
178
+ case A_MISC:
63
- break;
179
+ /* These are control bits for some of the other devices on the
64
- case 0x2: /* FADD */
180
+ * board (SPI, CLCD, etc). We don't implement that yet, so just
65
- gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
181
+ * make the bits read as written.
66
- break;
182
+ */
67
- case 0x3: /* FMULX */
183
+ qemu_log_mask(LOG_UNIMP,
68
- gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst);
184
+ "MPS2 FPGAIO: MISC control bits unimplemented\n");
69
- break;
185
+ s->misc = value;
70
- case 0x4: /* FCMEQ */
186
+ break;
71
- gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst);
187
+ default:
72
- break;
188
+ qemu_log_mask(LOG_GUEST_ERROR,
73
- case 0x6: /* FMAX */
189
+ "MPS2 FPGAIO write: bad offset 0x%x\n", (int) offset);
74
- gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
190
+ break;
75
- break;
191
+ }
76
- case 0x7: /* FRECPS */
192
+}
77
- gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
193
+
78
- break;
194
+static const MemoryRegionOps mps2_fpgaio_ops = {
79
- case 0x8: /* FMINNM */
195
+ .read = mps2_fpgaio_read,
80
- gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
196
+ .write = mps2_fpgaio_write,
81
- break;
197
+ .endianness = DEVICE_LITTLE_ENDIAN,
82
- case 0x9: /* FMLS */
198
+};
83
- /* As usual for ARM, separate negation for fused multiply-add */
199
+
84
- tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000);
200
+static void mps2_fpgaio_reset(DeviceState *dev)
85
- read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
201
+{
86
- gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
202
+ MPS2FPGAIO *s = MPS2_FPGAIO(dev);
87
- fpst);
203
+
88
- break;
204
+ trace_mps2_fpgaio_reset();
89
- case 0xa: /* FSUB */
205
+ s->led0 = 0;
90
- gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
206
+ s->prescale = 0;
91
- break;
207
+ s->misc = 0;
92
- case 0xe: /* FMIN */
208
+}
93
- gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst);
209
+
94
- break;
210
+static void mps2_fpgaio_init(Object *obj)
95
- case 0xf: /* FRSQRTS */
211
+{
96
- gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
212
+ SysBusDevice *sbd = SYS_BUS_DEVICE(obj);
97
- break;
213
+ MPS2FPGAIO *s = MPS2_FPGAIO(obj);
98
- case 0x13: /* FMUL */
214
+
99
- gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst);
215
+ memory_region_init_io(&s->iomem, obj, &mps2_fpgaio_ops, s,
100
- break;
216
+ "mps2-fpgaio", 0x1000);
101
- case 0x14: /* FCMGE */
217
+ sysbus_init_mmio(sbd, &s->iomem);
102
- gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
218
+}
103
- break;
219
+
104
- case 0x15: /* FACGE */
220
+static const VMStateDescription mps2_fpgaio_vmstate = {
105
- gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
221
+ .name = "mps2-fpgaio",
106
- break;
222
+ .version_id = 1,
107
- case 0x17: /* FDIV */
223
+ .minimum_version_id = 1,
108
- gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst);
224
+ .fields = (VMStateField[]) {
109
- break;
225
+ VMSTATE_UINT32(led0, MPS2FPGAIO),
110
- case 0x1a: /* FABD */
226
+ VMSTATE_UINT32(prescale, MPS2FPGAIO),
111
- gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
227
+ VMSTATE_UINT32(misc, MPS2FPGAIO),
112
- tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff);
228
+ VMSTATE_END_OF_LIST()
113
- break;
229
+ }
114
- case 0x1c: /* FCMGT */
230
+};
115
- gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
231
+
116
- break;
232
+static Property mps2_fpgaio_properties[] = {
117
- case 0x1d: /* FACGT */
233
+ /* Frequency of the prescale counter */
118
- gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
234
+ DEFINE_PROP_UINT32("prescale-clk", MPS2FPGAIO, prescale_clk, 20000000),
119
- break;
235
+ DEFINE_PROP_END_OF_LIST(),
120
- default:
236
+};
121
- fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n",
237
+
122
- __func__, insn, fpopcode, s->pc);
238
+static void mps2_fpgaio_class_init(ObjectClass *klass, void *data)
123
- g_assert_not_reached();
239
+{
124
+ read_vec_element_i32(s, tcg_op1, passreg, passelt, MO_16);
240
+ DeviceClass *dc = DEVICE_CLASS(klass);
125
+ read_vec_element_i32(s, tcg_op2, passreg, passelt + 1, MO_16);
241
+
126
+ tcg_res[pass] = tcg_temp_new_i32();
242
+ dc->vmsd = &mps2_fpgaio_vmstate;
127
+
243
+ dc->reset = mps2_fpgaio_reset;
128
+ switch (fpopcode) {
244
+ dc->props = mps2_fpgaio_properties;
129
+ case 0x10: /* FMAXNMP */
245
+}
130
+ gen_helper_advsimd_maxnumh(tcg_res[pass], tcg_op1, tcg_op2,
246
+
131
+ fpst);
247
+static const TypeInfo mps2_fpgaio_info = {
132
+ break;
248
+ .name = TYPE_MPS2_FPGAIO,
133
+ case 0x12: /* FADDP */
249
+ .parent = TYPE_SYS_BUS_DEVICE,
134
+ gen_helper_advsimd_addh(tcg_res[pass], tcg_op1, tcg_op2, fpst);
250
+ .instance_size = sizeof(MPS2FPGAIO),
135
+ break;
251
+ .instance_init = mps2_fpgaio_init,
136
+ case 0x16: /* FMAXP */
252
+ .class_init = mps2_fpgaio_class_init,
137
+ gen_helper_advsimd_maxh(tcg_res[pass], tcg_op1, tcg_op2, fpst);
253
+};
138
+ break;
254
+
139
+ case 0x18: /* FMINNMP */
255
+static void mps2_fpgaio_register_types(void)
140
+ gen_helper_advsimd_minnumh(tcg_res[pass], tcg_op1, tcg_op2,
256
+{
141
+ fpst);
257
+ type_register_static(&mps2_fpgaio_info);
142
+ break;
258
+}
143
+ case 0x1e: /* FMINP */
259
+
144
+ gen_helper_advsimd_minh(tcg_res[pass], tcg_op1, tcg_op2, fpst);
260
+type_init(mps2_fpgaio_register_types);
145
+ break;
261
diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak
146
+ default:
262
index XXXXXXX..XXXXXXX 100644
147
+ g_assert_not_reached();
263
--- a/default-configs/arm-softmmu.mak
148
+ }
264
+++ b/default-configs/arm-softmmu.mak
149
+ }
265
@@ -XXX,XX +XXX,XX @@ CONFIG_STM32F205_SOC=y
150
+
266
CONFIG_CMSDK_APB_TIMER=y
151
+ for (pass = 0; pass < maxpass; pass++) {
267
CONFIG_CMSDK_APB_UART=y
152
+ write_vec_element_i32(s, tcg_res[pass], rd, pass, MO_16);
268
153
+ tcg_temp_free_i32(tcg_res[pass]);
269
+CONFIG_MPS2_FPGAIO=y
154
}
270
CONFIG_MPS2_SCC=y
155
271
156
- write_vec_element_i32(s, tcg_res, rd, pass, MO_16);
272
CONFIG_VERSATILE_PCI=y
157
- tcg_temp_free_i32(tcg_res);
273
diff --git a/hw/misc/trace-events b/hw/misc/trace-events
158
tcg_temp_free_i32(tcg_op1);
274
index XXXXXXX..XXXXXXX 100644
159
tcg_temp_free_i32(tcg_op2);
275
--- a/hw/misc/trace-events
160
+
276
+++ b/hw/misc/trace-events
161
+ } else {
277
@@ -XXX,XX +XXX,XX @@ mps2_scc_leds(char led7, char led6, char led5, char led4, char led3, char led2,
162
+ for (pass = 0; pass < elements; pass++) {
278
mps2_scc_cfg_write(unsigned function, unsigned device, uint32_t value) "MPS2 SCC config write: function %d device %d data 0x%" PRIx32
163
+ TCGv_i32 tcg_op1 = tcg_temp_new_i32();
279
mps2_scc_cfg_read(unsigned function, unsigned device, uint32_t value) "MPS2 SCC config read: function %d device %d data 0x%" PRIx32
164
+ TCGv_i32 tcg_op2 = tcg_temp_new_i32();
280
165
+ TCGv_i32 tcg_res = tcg_temp_new_i32();
281
+# hw/misc/mps2_fpgaio.c
166
+
282
+mps2_fpgaio_read(uint64_t offset, uint64_t data, unsigned size) "MPS2 FPGAIO read: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u"
167
+ read_vec_element_i32(s, tcg_op1, rn, pass, MO_16);
283
+mps2_fpgaio_write(uint64_t offset, uint64_t data, unsigned size) "MPS2 FPGAIO write: offset 0x%" PRIx64 " data 0x%" PRIx64 " size %u"
168
+ read_vec_element_i32(s, tcg_op2, rm, pass, MO_16);
284
+mps2_fpgaio_reset(void) "MPS2 FPGAIO: reset"
169
+
285
+mps2_fpgaio_leds(char led1, char led0) "MPS2 FPGAIO LEDs: %c%c"
170
+ switch (fpopcode) {
286
+
171
+ case 0x0: /* FMAXNM */
287
# hw/misc/msf2-sysreg.c
172
+ gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst);
288
msf2_sysreg_write(uint64_t offset, uint32_t val, uint32_t prev) "msf2-sysreg write: addr 0x%08" HWADDR_PRIx " data 0x%" PRIx32 " prev 0x%" PRIx32
173
+ break;
289
msf2_sysreg_read(uint64_t offset, uint32_t val) "msf2-sysreg read: addr 0x%08" HWADDR_PRIx " data 0x%08" PRIx32
174
+ case 0x1: /* FMLA */
175
+ read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
176
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
177
+ fpst);
178
+ break;
179
+ case 0x2: /* FADD */
180
+ gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
181
+ break;
182
+ case 0x3: /* FMULX */
183
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst);
184
+ break;
185
+ case 0x4: /* FCMEQ */
186
+ gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst);
187
+ break;
188
+ case 0x6: /* FMAX */
189
+ gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
190
+ break;
191
+ case 0x7: /* FRECPS */
192
+ gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
193
+ break;
194
+ case 0x8: /* FMINNM */
195
+ gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
196
+ break;
197
+ case 0x9: /* FMLS */
198
+ /* As usual for ARM, separate negation for fused multiply-add */
199
+ tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000);
200
+ read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
201
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
202
+ fpst);
203
+ break;
204
+ case 0xa: /* FSUB */
205
+ gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
206
+ break;
207
+ case 0xe: /* FMIN */
208
+ gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst);
209
+ break;
210
+ case 0xf: /* FRSQRTS */
211
+ gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
212
+ break;
213
+ case 0x13: /* FMUL */
214
+ gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst);
215
+ break;
216
+ case 0x14: /* FCMGE */
217
+ gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
218
+ break;
219
+ case 0x15: /* FACGE */
220
+ gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
221
+ break;
222
+ case 0x17: /* FDIV */
223
+ gen_helper_advsimd_divh(tcg_res, tcg_op1, tcg_op2, fpst);
224
+ break;
225
+ case 0x1a: /* FABD */
226
+ gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
227
+ tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff);
228
+ break;
229
+ case 0x1c: /* FCMGT */
230
+ gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
231
+ break;
232
+ case 0x1d: /* FACGT */
233
+ gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
234
+ break;
235
+ default:
236
+ fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n",
237
+ __func__, insn, fpopcode, s->pc);
238
+ g_assert_not_reached();
239
+ }
240
+
241
+ write_vec_element_i32(s, tcg_res, rd, pass, MO_16);
242
+ tcg_temp_free_i32(tcg_res);
243
+ tcg_temp_free_i32(tcg_op1);
244
+ tcg_temp_free_i32(tcg_op2);
245
+ }
246
}
247
248
tcg_temp_free_ptr(fpst);
249
--
290
--
250
2.16.2
291
2.16.2
251
292
252
293
diff view generated by jsdifflib
1
From: Linus Walleij <linus.walleij@linaro.org>
1
Add a model of the TrustZone peripheral protection controller (PPC),
2
which is used to gate transactions to non-TZ-aware peripherals so
3
that secure software can configure them to not be accessible to
4
non-secure software.
2
5
3
This adds the SiI9022 (and implicitly EDID I2C) device to the ARM
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
Versatile Express machine, and selects the two I2C devices necessary
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
in the arm-softmmu.mak configuration so everything will build
8
Message-id: 20180220180325.29818-15-peter.maydell@linaro.org
6
smoothly.
9
---
10
hw/misc/Makefile.objs | 2 +
11
include/hw/misc/tz-ppc.h | 101 ++++++++++++++
12
hw/misc/tz-ppc.c | 302 ++++++++++++++++++++++++++++++++++++++++
13
default-configs/arm-softmmu.mak | 2 +
14
hw/misc/trace-events | 11 ++
15
5 files changed, 418 insertions(+)
16
create mode 100644 include/hw/misc/tz-ppc.h
17
create mode 100644 hw/misc/tz-ppc.c
7
18
8
I am implementing proper handling of the graphics in the Linux
19
diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs
9
kernel and adding proper emulation of SiI9022 and EDID makes the
10
driver probe as nicely as before, retrieving the resolutions
11
supported by the "QEMU monitor" and overall just working nice.
12
13
Cc: Peter Maydell <peter.maydell@linaro.org>
14
Signed-off-by: Linus Walleij <linus.walleij@linaro.org>
15
Message-id: 20180227104903.21353-6-linus.walleij@linaro.org
16
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
17
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
18
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
19
---
20
hw/arm/vexpress.c | 6 +++++-
21
default-configs/arm-softmmu.mak | 2 ++
22
2 files changed, 7 insertions(+), 1 deletion(-)
23
24
diff --git a/hw/arm/vexpress.c b/hw/arm/vexpress.c
25
index XXXXXXX..XXXXXXX 100644
20
index XXXXXXX..XXXXXXX 100644
26
--- a/hw/arm/vexpress.c
21
--- a/hw/misc/Makefile.objs
27
+++ b/hw/arm/vexpress.c
22
+++ b/hw/misc/Makefile.objs
23
@@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_MIPS_ITU) += mips_itu.o
24
obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o
25
obj-$(CONFIG_MPS2_SCC) += mps2-scc.o
26
27
+obj-$(CONFIG_TZ_PPC) += tz-ppc.o
28
+
29
obj-$(CONFIG_PVPANIC) += pvpanic.o
30
obj-$(CONFIG_HYPERV_TESTDEV) += hyperv_testdev.o
31
obj-$(CONFIG_AUX) += auxbus.o
32
diff --git a/include/hw/misc/tz-ppc.h b/include/hw/misc/tz-ppc.h
33
new file mode 100644
34
index XXXXXXX..XXXXXXX
35
--- /dev/null
36
+++ b/include/hw/misc/tz-ppc.h
28
@@ -XXX,XX +XXX,XX @@
37
@@ -XXX,XX +XXX,XX @@
29
#include "hw/arm/arm.h"
38
+/*
30
#include "hw/arm/primecell.h"
39
+ * ARM TrustZone peripheral protection controller emulation
31
#include "hw/devices.h"
40
+ *
32
+#include "hw/i2c/i2c.h"
41
+ * Copyright (c) 2018 Linaro Limited
33
#include "net/net.h"
42
+ * Written by Peter Maydell
34
#include "sysemu/sysemu.h"
43
+ *
35
#include "hw/boards.h"
44
+ * This program is free software; you can redistribute it and/or modify
36
@@ -XXX,XX +XXX,XX @@ static void vexpress_common_init(MachineState *machine)
45
+ * it under the terms of the GNU General Public License version 2 or
37
uint32_t sys_id;
46
+ * (at your option) any later version.
38
DriveInfo *dinfo;
47
+ */
39
pflash_t *pflash0;
48
+
40
+ I2CBus *i2c;
49
+/* This is a model of the TrustZone peripheral protection controller (PPC).
41
ram_addr_t vram_size, sram_size;
50
+ * It is documented in the ARM CoreLink SIE-200 System IP for Embedded TRM
42
MemoryRegion *sysmem = get_system_memory();
51
+ * (DDI 0571G):
43
MemoryRegion *vram = g_new(MemoryRegion, 1);
52
+ * https://developer.arm.com/products/architecture/m-profile/docs/ddi0571/g
44
@@ -XXX,XX +XXX,XX @@ static void vexpress_common_init(MachineState *machine)
53
+ *
45
sysbus_create_simple("sp804", map[VE_TIMER01], pic[2]);
54
+ * The PPC sits in front of peripherals and allows secure software to
46
sysbus_create_simple("sp804", map[VE_TIMER23], pic[3]);
55
+ * configure it to either pass through or reject transactions.
47
56
+ * Rejected transactions may be configured to either be aborted, or to
48
- /* VE_SERIALDVI: not modelled */
57
+ * behave as RAZ/WI. An interrupt can be signalled for a rejected transaction.
49
+ dev = sysbus_create_simple("versatile_i2c", map[VE_SERIALDVI], NULL);
58
+ *
50
+ i2c = (I2CBus *)qdev_get_child_bus(dev, "i2c");
59
+ * The PPC has no register interface -- it is configured purely by a
51
+ i2c_create_slave(i2c, "sii9022", 0x39);
60
+ * collection of input signals from other hardware in the system. Typically
52
61
+ * they are either hardwired or exposed in an ad-hoc register interface by
53
sysbus_create_simple("pl031", map[VE_RTC], pic[4]); /* RTC */
62
+ * the SoC that uses the PPC.
54
63
+ *
64
+ * This QEMU model can be used to model either the AHB5 or APB4 TZ PPC,
65
+ * since the only difference between them is that the AHB version has a
66
+ * "default" port which has no security checks applied. In QEMU the default
67
+ * port can be emulated simply by wiring its downstream devices directly
68
+ * into the parent address space, since the PPC does not need to intercept
69
+ * transactions there.
70
+ *
71
+ * In the hardware, selection of which downstream port to use is done by
72
+ * the user's decode logic asserting one of the hsel[] signals. In QEMU,
73
+ * we provide 16 MMIO regions, one per port, and the user maps these into
74
+ * the desired addresses to implement the address decode.
75
+ *
76
+ * QEMU interface:
77
+ * + sysbus MMIO regions 0..15: MemoryRegions defining the upstream end
78
+ * of each of the 16 ports of the PPC
79
+ * + Property "port[0..15]": MemoryRegion defining the downstream device(s)
80
+ * for each of the 16 ports of the PPC
81
+ * + Named GPIO inputs "cfg_nonsec[0..15]": set to 1 if the port should be
82
+ * accessible to NonSecure transactions
83
+ * + Named GPIO inputs "cfg_ap[0..15]": set to 1 if the port should be
84
+ * accessible to non-privileged transactions
85
+ * + Named GPIO input "cfg_sec_resp": set to 1 if a rejected transaction should
86
+ * result in a transaction error, or 0 for the transaction to RAZ/WI
87
+ * + Named GPIO input "irq_enable": set to 1 to enable interrupts
88
+ * + Named GPIO input "irq_clear": set to 1 to clear a pending interrupt
89
+ * + Named GPIO output "irq": set for a transaction-failed interrupt
90
+ * + Property "NONSEC_MASK": if a bit is set in this mask then accesses to
91
+ * the associated port do not have the TZ security check performed. (This
92
+ * corresponds to the hardware allowing this to be set as a Verilog
93
+ * parameter.)
94
+ */
95
+
96
+#ifndef TZ_PPC_H
97
+#define TZ_PPC_H
98
+
99
+#include "hw/sysbus.h"
100
+
101
+#define TYPE_TZ_PPC "tz-ppc"
102
+#define TZ_PPC(obj) OBJECT_CHECK(TZPPC, (obj), TYPE_TZ_PPC)
103
+
104
+#define TZ_NUM_PORTS 16
105
+
106
+typedef struct TZPPC TZPPC;
107
+
108
+typedef struct TZPPCPort {
109
+ TZPPC *ppc;
110
+ MemoryRegion upstream;
111
+ AddressSpace downstream_as;
112
+ MemoryRegion *downstream;
113
+} TZPPCPort;
114
+
115
+struct TZPPC {
116
+ /*< private >*/
117
+ SysBusDevice parent_obj;
118
+
119
+ /*< public >*/
120
+
121
+ /* State: these just track the values of our input signals */
122
+ bool cfg_nonsec[TZ_NUM_PORTS];
123
+ bool cfg_ap[TZ_NUM_PORTS];
124
+ bool cfg_sec_resp;
125
+ bool irq_enable;
126
+ bool irq_clear;
127
+ /* State: are we asserting irq ? */
128
+ bool irq_status;
129
+
130
+ qemu_irq irq;
131
+
132
+ /* Properties */
133
+ uint32_t nonsec_mask;
134
+
135
+ TZPPCPort port[TZ_NUM_PORTS];
136
+};
137
+
138
+#endif
139
diff --git a/hw/misc/tz-ppc.c b/hw/misc/tz-ppc.c
140
new file mode 100644
141
index XXXXXXX..XXXXXXX
142
--- /dev/null
143
+++ b/hw/misc/tz-ppc.c
144
@@ -XXX,XX +XXX,XX @@
145
+/*
146
+ * ARM TrustZone peripheral protection controller emulation
147
+ *
148
+ * Copyright (c) 2018 Linaro Limited
149
+ * Written by Peter Maydell
150
+ *
151
+ * This program is free software; you can redistribute it and/or modify
152
+ * it under the terms of the GNU General Public License version 2 or
153
+ * (at your option) any later version.
154
+ */
155
+
156
+#include "qemu/osdep.h"
157
+#include "qemu/log.h"
158
+#include "qapi/error.h"
159
+#include "trace.h"
160
+#include "hw/sysbus.h"
161
+#include "hw/registerfields.h"
162
+#include "hw/misc/tz-ppc.h"
163
+
164
+static void tz_ppc_update_irq(TZPPC *s)
165
+{
166
+ bool level = s->irq_status && s->irq_enable;
167
+
168
+ trace_tz_ppc_update_irq(level);
169
+ qemu_set_irq(s->irq, level);
170
+}
171
+
172
+static void tz_ppc_cfg_nonsec(void *opaque, int n, int level)
173
+{
174
+ TZPPC *s = TZ_PPC(opaque);
175
+
176
+ assert(n < TZ_NUM_PORTS);
177
+ trace_tz_ppc_cfg_nonsec(n, level);
178
+ s->cfg_nonsec[n] = level;
179
+}
180
+
181
+static void tz_ppc_cfg_ap(void *opaque, int n, int level)
182
+{
183
+ TZPPC *s = TZ_PPC(opaque);
184
+
185
+ assert(n < TZ_NUM_PORTS);
186
+ trace_tz_ppc_cfg_ap(n, level);
187
+ s->cfg_ap[n] = level;
188
+}
189
+
190
+static void tz_ppc_cfg_sec_resp(void *opaque, int n, int level)
191
+{
192
+ TZPPC *s = TZ_PPC(opaque);
193
+
194
+ trace_tz_ppc_cfg_sec_resp(level);
195
+ s->cfg_sec_resp = level;
196
+}
197
+
198
+static void tz_ppc_irq_enable(void *opaque, int n, int level)
199
+{
200
+ TZPPC *s = TZ_PPC(opaque);
201
+
202
+ trace_tz_ppc_irq_enable(level);
203
+ s->irq_enable = level;
204
+ tz_ppc_update_irq(s);
205
+}
206
+
207
+static void tz_ppc_irq_clear(void *opaque, int n, int level)
208
+{
209
+ TZPPC *s = TZ_PPC(opaque);
210
+
211
+ trace_tz_ppc_irq_clear(level);
212
+
213
+ s->irq_clear = level;
214
+ if (level) {
215
+ s->irq_status = false;
216
+ tz_ppc_update_irq(s);
217
+ }
218
+}
219
+
220
+static bool tz_ppc_check(TZPPC *s, int n, MemTxAttrs attrs)
221
+{
222
+ /* Check whether to allow an access to port n; return true if
223
+ * the check passes, and false if the transaction must be blocked.
224
+ * If the latter, the caller must check cfg_sec_resp to determine
225
+ * whether to abort or RAZ/WI the transaction.
226
+ * The checks are:
227
+ * + nonsec_mask suppresses any check of the secure attribute
228
+ * + otherwise, block if cfg_nonsec is 1 and transaction is secure,
229
+ * or if cfg_nonsec is 0 and transaction is non-secure
230
+ * + block if transaction is usermode and cfg_ap is 0
231
+ */
232
+ if ((attrs.secure == s->cfg_nonsec[n] && !(s->nonsec_mask & (1 << n))) ||
233
+ (attrs.user && !s->cfg_ap[n])) {
234
+ /* Block the transaction. */
235
+ if (!s->irq_clear) {
236
+ /* Note that holding irq_clear high suppresses interrupts */
237
+ s->irq_status = true;
238
+ tz_ppc_update_irq(s);
239
+ }
240
+ return false;
241
+ }
242
+ return true;
243
+}
244
+
245
+static MemTxResult tz_ppc_read(void *opaque, hwaddr addr, uint64_t *pdata,
246
+ unsigned size, MemTxAttrs attrs)
247
+{
248
+ TZPPCPort *p = opaque;
249
+ TZPPC *s = p->ppc;
250
+ int n = p - s->port;
251
+ AddressSpace *as = &p->downstream_as;
252
+ uint64_t data;
253
+ MemTxResult res;
254
+
255
+ if (!tz_ppc_check(s, n, attrs)) {
256
+ trace_tz_ppc_read_blocked(n, addr, attrs.secure, attrs.user);
257
+ if (s->cfg_sec_resp) {
258
+ return MEMTX_ERROR;
259
+ } else {
260
+ *pdata = 0;
261
+ return MEMTX_OK;
262
+ }
263
+ }
264
+
265
+ switch (size) {
266
+ case 1:
267
+ data = address_space_ldub(as, addr, attrs, &res);
268
+ break;
269
+ case 2:
270
+ data = address_space_lduw_le(as, addr, attrs, &res);
271
+ break;
272
+ case 4:
273
+ data = address_space_ldl_le(as, addr, attrs, &res);
274
+ break;
275
+ case 8:
276
+ data = address_space_ldq_le(as, addr, attrs, &res);
277
+ break;
278
+ default:
279
+ g_assert_not_reached();
280
+ }
281
+ *pdata = data;
282
+ return res;
283
+}
284
+
285
+static MemTxResult tz_ppc_write(void *opaque, hwaddr addr, uint64_t val,
286
+ unsigned size, MemTxAttrs attrs)
287
+{
288
+ TZPPCPort *p = opaque;
289
+ TZPPC *s = p->ppc;
290
+ AddressSpace *as = &p->downstream_as;
291
+ int n = p - s->port;
292
+ MemTxResult res;
293
+
294
+ if (!tz_ppc_check(s, n, attrs)) {
295
+ trace_tz_ppc_write_blocked(n, addr, attrs.secure, attrs.user);
296
+ if (s->cfg_sec_resp) {
297
+ return MEMTX_ERROR;
298
+ } else {
299
+ return MEMTX_OK;
300
+ }
301
+ }
302
+
303
+ switch (size) {
304
+ case 1:
305
+ address_space_stb(as, addr, val, attrs, &res);
306
+ break;
307
+ case 2:
308
+ address_space_stw_le(as, addr, val, attrs, &res);
309
+ break;
310
+ case 4:
311
+ address_space_stl_le(as, addr, val, attrs, &res);
312
+ break;
313
+ case 8:
314
+ address_space_stq_le(as, addr, val, attrs, &res);
315
+ break;
316
+ default:
317
+ g_assert_not_reached();
318
+ }
319
+ return res;
320
+}
321
+
322
+static const MemoryRegionOps tz_ppc_ops = {
323
+ .read_with_attrs = tz_ppc_read,
324
+ .write_with_attrs = tz_ppc_write,
325
+ .endianness = DEVICE_LITTLE_ENDIAN,
326
+};
327
+
328
+static void tz_ppc_reset(DeviceState *dev)
329
+{
330
+ TZPPC *s = TZ_PPC(dev);
331
+
332
+ trace_tz_ppc_reset();
333
+ s->cfg_sec_resp = false;
334
+ memset(s->cfg_nonsec, 0, sizeof(s->cfg_nonsec));
335
+ memset(s->cfg_ap, 0, sizeof(s->cfg_ap));
336
+}
337
+
338
+static void tz_ppc_init(Object *obj)
339
+{
340
+ DeviceState *dev = DEVICE(obj);
341
+ TZPPC *s = TZ_PPC(obj);
342
+
343
+ qdev_init_gpio_in_named(dev, tz_ppc_cfg_nonsec, "cfg_nonsec", TZ_NUM_PORTS);
344
+ qdev_init_gpio_in_named(dev, tz_ppc_cfg_ap, "cfg_ap", TZ_NUM_PORTS);
345
+ qdev_init_gpio_in_named(dev, tz_ppc_cfg_sec_resp, "cfg_sec_resp", 1);
346
+ qdev_init_gpio_in_named(dev, tz_ppc_irq_enable, "irq_enable", 1);
347
+ qdev_init_gpio_in_named(dev, tz_ppc_irq_clear, "irq_clear", 1);
348
+ qdev_init_gpio_out_named(dev, &s->irq, "irq", 1);
349
+}
350
+
351
+static void tz_ppc_realize(DeviceState *dev, Error **errp)
352
+{
353
+ Object *obj = OBJECT(dev);
354
+ SysBusDevice *sbd = SYS_BUS_DEVICE(dev);
355
+ TZPPC *s = TZ_PPC(dev);
356
+ int i;
357
+
358
+ /* We can't create the upstream end of the port until realize,
359
+ * as we don't know the size of the MR used as the downstream until then.
360
+ */
361
+ for (i = 0; i < TZ_NUM_PORTS; i++) {
362
+ TZPPCPort *port = &s->port[i];
363
+ char *name;
364
+ uint64_t size;
365
+
366
+ if (!port->downstream) {
367
+ continue;
368
+ }
369
+
370
+ name = g_strdup_printf("tz-ppc-port[%d]", i);
371
+
372
+ port->ppc = s;
373
+ address_space_init(&port->downstream_as, port->downstream, name);
374
+
375
+ size = memory_region_size(port->downstream);
376
+ memory_region_init_io(&port->upstream, obj, &tz_ppc_ops,
377
+ port, name, size);
378
+ sysbus_init_mmio(sbd, &port->upstream);
379
+ g_free(name);
380
+ }
381
+}
382
+
383
+static const VMStateDescription tz_ppc_vmstate = {
384
+ .name = "tz-ppc",
385
+ .version_id = 1,
386
+ .minimum_version_id = 1,
387
+ .fields = (VMStateField[]) {
388
+ VMSTATE_BOOL_ARRAY(cfg_nonsec, TZPPC, 16),
389
+ VMSTATE_BOOL_ARRAY(cfg_ap, TZPPC, 16),
390
+ VMSTATE_BOOL(cfg_sec_resp, TZPPC),
391
+ VMSTATE_BOOL(irq_enable, TZPPC),
392
+ VMSTATE_BOOL(irq_clear, TZPPC),
393
+ VMSTATE_BOOL(irq_status, TZPPC),
394
+ VMSTATE_END_OF_LIST()
395
+ }
396
+};
397
+
398
+#define DEFINE_PORT(N) \
399
+ DEFINE_PROP_LINK("port[" #N "]", TZPPC, port[N].downstream, \
400
+ TYPE_MEMORY_REGION, MemoryRegion *)
401
+
402
+static Property tz_ppc_properties[] = {
403
+ DEFINE_PROP_UINT32("NONSEC_MASK", TZPPC, nonsec_mask, 0),
404
+ DEFINE_PORT(0),
405
+ DEFINE_PORT(1),
406
+ DEFINE_PORT(2),
407
+ DEFINE_PORT(3),
408
+ DEFINE_PORT(4),
409
+ DEFINE_PORT(5),
410
+ DEFINE_PORT(6),
411
+ DEFINE_PORT(7),
412
+ DEFINE_PORT(8),
413
+ DEFINE_PORT(9),
414
+ DEFINE_PORT(10),
415
+ DEFINE_PORT(11),
416
+ DEFINE_PORT(12),
417
+ DEFINE_PORT(13),
418
+ DEFINE_PORT(14),
419
+ DEFINE_PORT(15),
420
+ DEFINE_PROP_END_OF_LIST(),
421
+};
422
+
423
+static void tz_ppc_class_init(ObjectClass *klass, void *data)
424
+{
425
+ DeviceClass *dc = DEVICE_CLASS(klass);
426
+
427
+ dc->realize = tz_ppc_realize;
428
+ dc->vmsd = &tz_ppc_vmstate;
429
+ dc->reset = tz_ppc_reset;
430
+ dc->props = tz_ppc_properties;
431
+}
432
+
433
+static const TypeInfo tz_ppc_info = {
434
+ .name = TYPE_TZ_PPC,
435
+ .parent = TYPE_SYS_BUS_DEVICE,
436
+ .instance_size = sizeof(TZPPC),
437
+ .instance_init = tz_ppc_init,
438
+ .class_init = tz_ppc_class_init,
439
+};
440
+
441
+static void tz_ppc_register_types(void)
442
+{
443
+ type_register_static(&tz_ppc_info);
444
+}
445
+
446
+type_init(tz_ppc_register_types);
55
diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak
447
diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak
56
index XXXXXXX..XXXXXXX 100644
448
index XXXXXXX..XXXXXXX 100644
57
--- a/default-configs/arm-softmmu.mak
449
--- a/default-configs/arm-softmmu.mak
58
+++ b/default-configs/arm-softmmu.mak
450
+++ b/default-configs/arm-softmmu.mak
59
@@ -XXX,XX +XXX,XX @@ CONFIG_STELLARIS_INPUT=y
451
@@ -XXX,XX +XXX,XX @@ CONFIG_CMSDK_APB_UART=y
60
CONFIG_STELLARIS_ENET=y
452
CONFIG_MPS2_FPGAIO=y
61
CONFIG_SSD0303=y
453
CONFIG_MPS2_SCC=y
62
CONFIG_SSD0323=y
454
63
+CONFIG_DDC=y
455
+CONFIG_TZ_PPC=y
64
+CONFIG_SII9022=y
456
+
65
CONFIG_ADS7846=y
457
CONFIG_VERSATILE_PCI=y
66
CONFIG_MAX111X=y
458
CONFIG_VERSATILE_I2C=y
67
CONFIG_SSI=y
459
460
diff --git a/hw/misc/trace-events b/hw/misc/trace-events
461
index XXXXXXX..XXXXXXX 100644
462
--- a/hw/misc/trace-events
463
+++ b/hw/misc/trace-events
464
@@ -XXX,XX +XXX,XX @@ mos6522_get_next_irq_time(uint16_t latch, int64_t d, int64_t delta) "latch=%d co
465
mos6522_set_sr_int(void) "set sr_int"
466
mos6522_write(uint64_t addr, uint64_t val) "reg=0x%"PRIx64 " val=0x%"PRIx64
467
mos6522_read(uint64_t addr, unsigned val) "reg=0x%"PRIx64 " val=0x%x"
468
+
469
+# hw/misc/tz-ppc.c
470
+tz_ppc_reset(void) "TZ PPC: reset"
471
+tz_ppc_cfg_nonsec(int n, int level) "TZ PPC: cfg_nonsec[%d] = %d"
472
+tz_ppc_cfg_ap(int n, int level) "TZ PPC: cfg_ap[%d] = %d"
473
+tz_ppc_cfg_sec_resp(int level) "TZ PPC: cfg_sec_resp = %d"
474
+tz_ppc_irq_enable(int level) "TZ PPC: int_enable = %d"
475
+tz_ppc_irq_clear(int level) "TZ PPC: int_clear = %d"
476
+tz_ppc_update_irq(int level) "TZ PPC: setting irq line to %d"
477
+tz_ppc_read_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " read (secure %d user %d) blocked"
478
+tz_ppc_write_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " write (secure %d user %d) blocked"
68
--
479
--
69
2.16.2
480
2.16.2
70
481
71
482
diff view generated by jsdifflib
1
From: Linus Walleij <linus.walleij@linaro.org>
1
The Arm IoT Kit includes a "security controller" which is largely a
2
collection of registers for controlling the PPCs and other bits of
3
glue in the system. This commit provides the initial skeleton of the
4
device, implementing just the ID registers, and a couple of read-only
5
read-as-zero registers.
2
6
3
This adds support for emulating the Silicon Image SII9022 DVI/HDMI
7
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
bridge. It's not very clever right now, it just acknowledges
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
the switch into DDC I2C mode and back. Combining this with the
9
Message-id: 20180220180325.29818-16-peter.maydell@linaro.org
6
existing DDC I2C emulation gives the right behavior on the Versatile
10
---
7
Express emulation passing through the QEMU EDID to the emulated
11
hw/misc/Makefile.objs | 1 +
8
platform.
12
include/hw/misc/iotkit-secctl.h | 39 ++++
13
hw/misc/iotkit-secctl.c | 448 ++++++++++++++++++++++++++++++++++++++++
14
default-configs/arm-softmmu.mak | 1 +
15
hw/misc/trace-events | 7 +
16
5 files changed, 496 insertions(+)
17
create mode 100644 include/hw/misc/iotkit-secctl.h
18
create mode 100644 hw/misc/iotkit-secctl.c
9
19
10
Cc: Peter Maydell <peter.maydell@linaro.org>
20
diff --git a/hw/misc/Makefile.objs b/hw/misc/Makefile.objs
11
Signed-off-by: Linus Walleij <linus.walleij@linaro.org>
12
Message-id: 20180227104903.21353-5-linus.walleij@linaro.org
13
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
14
[PMM: explictly reset ddc_req/ddc_skip_finish/ddc]
15
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
16
---
17
hw/display/Makefile.objs | 1 +
18
hw/display/sii9022.c | 191 +++++++++++++++++++++++++++++++++++++++++++++++
19
hw/display/trace-events | 5 ++
20
3 files changed, 197 insertions(+)
21
create mode 100644 hw/display/sii9022.c
22
23
diff --git a/hw/display/Makefile.objs b/hw/display/Makefile.objs
24
index XXXXXXX..XXXXXXX 100644
21
index XXXXXXX..XXXXXXX 100644
25
--- a/hw/display/Makefile.objs
22
--- a/hw/misc/Makefile.objs
26
+++ b/hw/display/Makefile.objs
23
+++ b/hw/misc/Makefile.objs
27
@@ -XXX,XX +XXX,XX @@ common-obj-$(CONFIG_VGA_CIRRUS) += cirrus_vga.o
24
@@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_MPS2_FPGAIO) += mps2-fpgaio.o
28
common-obj-$(CONFIG_G364FB) += g364fb.o
25
obj-$(CONFIG_MPS2_SCC) += mps2-scc.o
29
common-obj-$(CONFIG_JAZZ_LED) += jazz_led.o
26
30
common-obj-$(CONFIG_PL110) += pl110.o
27
obj-$(CONFIG_TZ_PPC) += tz-ppc.o
31
+common-obj-$(CONFIG_SII9022) += sii9022.o
28
+obj-$(CONFIG_IOTKIT_SECCTL) += iotkit-secctl.o
32
common-obj-$(CONFIG_SSD0303) += ssd0303.o
29
33
common-obj-$(CONFIG_SSD0323) += ssd0323.o
30
obj-$(CONFIG_PVPANIC) += pvpanic.o
34
common-obj-$(CONFIG_XEN) += xenfb.o
31
obj-$(CONFIG_HYPERV_TESTDEV) += hyperv_testdev.o
35
diff --git a/hw/display/sii9022.c b/hw/display/sii9022.c
32
diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h
36
new file mode 100644
33
new file mode 100644
37
index XXXXXXX..XXXXXXX
34
index XXXXXXX..XXXXXXX
38
--- /dev/null
35
--- /dev/null
39
+++ b/hw/display/sii9022.c
36
+++ b/include/hw/misc/iotkit-secctl.h
40
@@ -XXX,XX +XXX,XX @@
37
@@ -XXX,XX +XXX,XX @@
41
+/*
38
+/*
42
+ * Silicon Image SiI9022
39
+ * ARM IoT Kit security controller
43
+ *
40
+ *
44
+ * This is a pretty hollow emulation: all we do is acknowledge that we
41
+ * Copyright (c) 2018 Linaro Limited
45
+ * exist (chip ID) and confirm that we get switched over into DDC mode
42
+ * Written by Peter Maydell
46
+ * so the emulated host can proceed to read out EDID data. All subsequent
47
+ * set-up of connectors etc will be acknowledged and ignored.
48
+ *
43
+ *
49
+ * Copyright (C) 2018 Linus Walleij
44
+ * This program is free software; you can redistribute it and/or modify
45
+ * it under the terms of the GNU General Public License version 2 or
46
+ * (at your option) any later version.
47
+ */
48
+
49
+/* This is a model of the security controller which is part of the
50
+ * Arm IoT Kit and documented in
51
+ * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html
50
+ *
52
+ *
51
+ * This work is licensed under the terms of the GNU GPL, version 2 or later.
53
+ * QEMU interface:
52
+ * See the COPYING file in the top-level directory.
54
+ * + sysbus MMIO region 0 is the "secure privilege control block" registers
53
+ * SPDX-License-Identifier: GPL-2.0-or-later
55
+ * + sysbus MMIO region 1 is the "non-secure privilege control block" registers
54
+ */
56
+ */
55
+
57
+
58
+#ifndef IOTKIT_SECCTL_H
59
+#define IOTKIT_SECCTL_H
60
+
61
+#include "hw/sysbus.h"
62
+
63
+#define TYPE_IOTKIT_SECCTL "iotkit-secctl"
64
+#define IOTKIT_SECCTL(obj) OBJECT_CHECK(IoTKitSecCtl, (obj), TYPE_IOTKIT_SECCTL)
65
+
66
+typedef struct IoTKitSecCtl {
67
+ /*< private >*/
68
+ SysBusDevice parent_obj;
69
+
70
+ /*< public >*/
71
+
72
+ MemoryRegion s_regs;
73
+ MemoryRegion ns_regs;
74
+} IoTKitSecCtl;
75
+
76
+#endif
77
diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c
78
new file mode 100644
79
index XXXXXXX..XXXXXXX
80
--- /dev/null
81
+++ b/hw/misc/iotkit-secctl.c
82
@@ -XXX,XX +XXX,XX @@
83
+/*
84
+ * Arm IoT Kit security controller
85
+ *
86
+ * Copyright (c) 2018 Linaro Limited
87
+ * Written by Peter Maydell
88
+ *
89
+ * This program is free software; you can redistribute it and/or modify
90
+ * it under the terms of the GNU General Public License version 2 or
91
+ * (at your option) any later version.
92
+ */
93
+
56
+#include "qemu/osdep.h"
94
+#include "qemu/osdep.h"
57
+#include "qemu-common.h"
95
+#include "qemu/log.h"
58
+#include "hw/i2c/i2c.h"
96
+#include "qapi/error.h"
59
+#include "hw/i2c/i2c-ddc.h"
60
+#include "trace.h"
97
+#include "trace.h"
61
+
98
+#include "hw/sysbus.h"
62
+#define SII9022_SYS_CTRL_DATA 0x1a
99
+#include "hw/registerfields.h"
63
+#define SII9022_SYS_CTRL_PWR_DWN 0x10
100
+#include "hw/misc/iotkit-secctl.h"
64
+#define SII9022_SYS_CTRL_AV_MUTE 0x08
101
+
65
+#define SII9022_SYS_CTRL_DDC_BUS_REQ 0x04
102
+/* Registers in the secure privilege control block */
66
+#define SII9022_SYS_CTRL_DDC_BUS_GRTD 0x02
103
+REG32(SECRESPCFG, 0x10)
67
+#define SII9022_SYS_CTRL_OUTPUT_MODE 0x01
104
+REG32(NSCCFG, 0x14)
68
+#define SII9022_SYS_CTRL_OUTPUT_HDMI 1
105
+REG32(SECMPCINTSTATUS, 0x1c)
69
+#define SII9022_SYS_CTRL_OUTPUT_DVI 0
106
+REG32(SECPPCINTSTAT, 0x20)
70
+#define SII9022_REG_CHIPID 0x1b
107
+REG32(SECPPCINTCLR, 0x24)
71
+#define SII9022_INT_ENABLE 0x3c
108
+REG32(SECPPCINTEN, 0x28)
72
+#define SII9022_INT_STATUS 0x3d
109
+REG32(SECMSCINTSTAT, 0x30)
73
+#define SII9022_INT_STATUS_HOTPLUG 0x01;
110
+REG32(SECMSCINTCLR, 0x34)
74
+#define SII9022_INT_STATUS_PLUGGED 0x04;
111
+REG32(SECMSCINTEN, 0x38)
75
+
112
+REG32(BRGINTSTAT, 0x40)
76
+#define TYPE_SII9022 "sii9022"
113
+REG32(BRGINTCLR, 0x44)
77
+#define SII9022(obj) OBJECT_CHECK(sii9022_state, (obj), TYPE_SII9022)
114
+REG32(BRGINTEN, 0x48)
78
+
115
+REG32(AHBNSPPC0, 0x50)
79
+typedef struct sii9022_state {
116
+REG32(AHBNSPPCEXP0, 0x60)
80
+ I2CSlave parent_obj;
117
+REG32(AHBNSPPCEXP1, 0x64)
81
+ uint8_t ptr;
118
+REG32(AHBNSPPCEXP2, 0x68)
82
+ bool addr_byte;
119
+REG32(AHBNSPPCEXP3, 0x6c)
83
+ bool ddc_req;
120
+REG32(APBNSPPC0, 0x70)
84
+ bool ddc_skip_finish;
121
+REG32(APBNSPPC1, 0x74)
85
+ bool ddc;
122
+REG32(APBNSPPCEXP0, 0x80)
86
+} sii9022_state;
123
+REG32(APBNSPPCEXP1, 0x84)
87
+
124
+REG32(APBNSPPCEXP2, 0x88)
88
+static const VMStateDescription vmstate_sii9022 = {
125
+REG32(APBNSPPCEXP3, 0x8c)
89
+ .name = "sii9022",
126
+REG32(AHBSPPPC0, 0x90)
127
+REG32(AHBSPPPCEXP0, 0xa0)
128
+REG32(AHBSPPPCEXP1, 0xa4)
129
+REG32(AHBSPPPCEXP2, 0xa8)
130
+REG32(AHBSPPPCEXP3, 0xac)
131
+REG32(APBSPPPC0, 0xb0)
132
+REG32(APBSPPPC1, 0xb4)
133
+REG32(APBSPPPCEXP0, 0xc0)
134
+REG32(APBSPPPCEXP1, 0xc4)
135
+REG32(APBSPPPCEXP2, 0xc8)
136
+REG32(APBSPPPCEXP3, 0xcc)
137
+REG32(NSMSCEXP, 0xd0)
138
+REG32(PID4, 0xfd0)
139
+REG32(PID5, 0xfd4)
140
+REG32(PID6, 0xfd8)
141
+REG32(PID7, 0xfdc)
142
+REG32(PID0, 0xfe0)
143
+REG32(PID1, 0xfe4)
144
+REG32(PID2, 0xfe8)
145
+REG32(PID3, 0xfec)
146
+REG32(CID0, 0xff0)
147
+REG32(CID1, 0xff4)
148
+REG32(CID2, 0xff8)
149
+REG32(CID3, 0xffc)
150
+
151
+/* Registers in the non-secure privilege control block */
152
+REG32(AHBNSPPPC0, 0x90)
153
+REG32(AHBNSPPPCEXP0, 0xa0)
154
+REG32(AHBNSPPPCEXP1, 0xa4)
155
+REG32(AHBNSPPPCEXP2, 0xa8)
156
+REG32(AHBNSPPPCEXP3, 0xac)
157
+REG32(APBNSPPPC0, 0xb0)
158
+REG32(APBNSPPPC1, 0xb4)
159
+REG32(APBNSPPPCEXP0, 0xc0)
160
+REG32(APBNSPPPCEXP1, 0xc4)
161
+REG32(APBNSPPPCEXP2, 0xc8)
162
+REG32(APBNSPPPCEXP3, 0xcc)
163
+/* PID and CID registers are also present in the NS block */
164
+
165
+static const uint8_t iotkit_secctl_s_idregs[] = {
166
+ 0x04, 0x00, 0x00, 0x00,
167
+ 0x52, 0xb8, 0x0b, 0x00,
168
+ 0x0d, 0xf0, 0x05, 0xb1,
169
+};
170
+
171
+static const uint8_t iotkit_secctl_ns_idregs[] = {
172
+ 0x04, 0x00, 0x00, 0x00,
173
+ 0x53, 0xb8, 0x0b, 0x00,
174
+ 0x0d, 0xf0, 0x05, 0xb1,
175
+};
176
+
177
+static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
178
+ uint64_t *pdata,
179
+ unsigned size, MemTxAttrs attrs)
180
+{
181
+ uint64_t r;
182
+ uint32_t offset = addr & ~0x3;
183
+
184
+ switch (offset) {
185
+ case A_AHBNSPPC0:
186
+ case A_AHBSPPPC0:
187
+ r = 0;
188
+ break;
189
+ case A_SECRESPCFG:
190
+ case A_NSCCFG:
191
+ case A_SECMPCINTSTATUS:
192
+ case A_SECPPCINTSTAT:
193
+ case A_SECPPCINTEN:
194
+ case A_SECMSCINTSTAT:
195
+ case A_SECMSCINTEN:
196
+ case A_BRGINTSTAT:
197
+ case A_BRGINTEN:
198
+ case A_AHBNSPPCEXP0:
199
+ case A_AHBNSPPCEXP1:
200
+ case A_AHBNSPPCEXP2:
201
+ case A_AHBNSPPCEXP3:
202
+ case A_APBNSPPC0:
203
+ case A_APBNSPPC1:
204
+ case A_APBNSPPCEXP0:
205
+ case A_APBNSPPCEXP1:
206
+ case A_APBNSPPCEXP2:
207
+ case A_APBNSPPCEXP3:
208
+ case A_AHBSPPPCEXP0:
209
+ case A_AHBSPPPCEXP1:
210
+ case A_AHBSPPPCEXP2:
211
+ case A_AHBSPPPCEXP3:
212
+ case A_APBSPPPC0:
213
+ case A_APBSPPPC1:
214
+ case A_APBSPPPCEXP0:
215
+ case A_APBSPPPCEXP1:
216
+ case A_APBSPPPCEXP2:
217
+ case A_APBSPPPCEXP3:
218
+ case A_NSMSCEXP:
219
+ qemu_log_mask(LOG_UNIMP,
220
+ "IoTKit SecCtl S block read: "
221
+ "unimplemented offset 0x%x\n", offset);
222
+ r = 0;
223
+ break;
224
+ case A_PID4:
225
+ case A_PID5:
226
+ case A_PID6:
227
+ case A_PID7:
228
+ case A_PID0:
229
+ case A_PID1:
230
+ case A_PID2:
231
+ case A_PID3:
232
+ case A_CID0:
233
+ case A_CID1:
234
+ case A_CID2:
235
+ case A_CID3:
236
+ r = iotkit_secctl_s_idregs[(offset - A_PID4) / 4];
237
+ break;
238
+ case A_SECPPCINTCLR:
239
+ case A_SECMSCINTCLR:
240
+ case A_BRGINTCLR:
241
+ qemu_log_mask(LOG_GUEST_ERROR,
242
+ "IotKit SecCtl S block read: write-only offset 0x%x\n",
243
+ offset);
244
+ r = 0;
245
+ break;
246
+ default:
247
+ qemu_log_mask(LOG_GUEST_ERROR,
248
+ "IotKit SecCtl S block read: bad offset 0x%x\n", offset);
249
+ r = 0;
250
+ break;
251
+ }
252
+
253
+ if (size != 4) {
254
+ /* None of our registers are access-sensitive, so just pull the right
255
+ * byte out of the word read result.
256
+ */
257
+ r = extract32(r, (addr & 3) * 8, size * 8);
258
+ }
259
+
260
+ trace_iotkit_secctl_s_read(offset, r, size);
261
+ *pdata = r;
262
+ return MEMTX_OK;
263
+}
264
+
265
+static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
266
+ uint64_t value,
267
+ unsigned size, MemTxAttrs attrs)
268
+{
269
+ uint32_t offset = addr;
270
+
271
+ trace_iotkit_secctl_s_write(offset, value, size);
272
+
273
+ if (size != 4) {
274
+ /* Byte and halfword writes are ignored */
275
+ qemu_log_mask(LOG_GUEST_ERROR,
276
+ "IotKit SecCtl S block write: bad size, ignored\n");
277
+ return MEMTX_OK;
278
+ }
279
+
280
+ switch (offset) {
281
+ case A_SECRESPCFG:
282
+ case A_NSCCFG:
283
+ case A_SECPPCINTCLR:
284
+ case A_SECPPCINTEN:
285
+ case A_SECMSCINTCLR:
286
+ case A_SECMSCINTEN:
287
+ case A_BRGINTCLR:
288
+ case A_BRGINTEN:
289
+ case A_AHBNSPPCEXP0:
290
+ case A_AHBNSPPCEXP1:
291
+ case A_AHBNSPPCEXP2:
292
+ case A_AHBNSPPCEXP3:
293
+ case A_APBNSPPC0:
294
+ case A_APBNSPPC1:
295
+ case A_APBNSPPCEXP0:
296
+ case A_APBNSPPCEXP1:
297
+ case A_APBNSPPCEXP2:
298
+ case A_APBNSPPCEXP3:
299
+ case A_AHBSPPPCEXP0:
300
+ case A_AHBSPPPCEXP1:
301
+ case A_AHBSPPPCEXP2:
302
+ case A_AHBSPPPCEXP3:
303
+ case A_APBSPPPC0:
304
+ case A_APBSPPPC1:
305
+ case A_APBSPPPCEXP0:
306
+ case A_APBSPPPCEXP1:
307
+ case A_APBSPPPCEXP2:
308
+ case A_APBSPPPCEXP3:
309
+ qemu_log_mask(LOG_UNIMP,
310
+ "IoTKit SecCtl S block write: "
311
+ "unimplemented offset 0x%x\n", offset);
312
+ break;
313
+ case A_SECMPCINTSTATUS:
314
+ case A_SECPPCINTSTAT:
315
+ case A_SECMSCINTSTAT:
316
+ case A_BRGINTSTAT:
317
+ case A_AHBNSPPC0:
318
+ case A_AHBSPPPC0:
319
+ case A_NSMSCEXP:
320
+ case A_PID4:
321
+ case A_PID5:
322
+ case A_PID6:
323
+ case A_PID7:
324
+ case A_PID0:
325
+ case A_PID1:
326
+ case A_PID2:
327
+ case A_PID3:
328
+ case A_CID0:
329
+ case A_CID1:
330
+ case A_CID2:
331
+ case A_CID3:
332
+ qemu_log_mask(LOG_GUEST_ERROR,
333
+ "IoTKit SecCtl S block write: "
334
+ "read-only offset 0x%x\n", offset);
335
+ break;
336
+ default:
337
+ qemu_log_mask(LOG_GUEST_ERROR,
338
+ "IotKit SecCtl S block write: bad offset 0x%x\n",
339
+ offset);
340
+ break;
341
+ }
342
+
343
+ return MEMTX_OK;
344
+}
345
+
346
+static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr,
347
+ uint64_t *pdata,
348
+ unsigned size, MemTxAttrs attrs)
349
+{
350
+ uint64_t r;
351
+ uint32_t offset = addr & ~0x3;
352
+
353
+ switch (offset) {
354
+ case A_AHBNSPPPC0:
355
+ r = 0;
356
+ break;
357
+ case A_AHBNSPPPCEXP0:
358
+ case A_AHBNSPPPCEXP1:
359
+ case A_AHBNSPPPCEXP2:
360
+ case A_AHBNSPPPCEXP3:
361
+ case A_APBNSPPPC0:
362
+ case A_APBNSPPPC1:
363
+ case A_APBNSPPPCEXP0:
364
+ case A_APBNSPPPCEXP1:
365
+ case A_APBNSPPPCEXP2:
366
+ case A_APBNSPPPCEXP3:
367
+ qemu_log_mask(LOG_UNIMP,
368
+ "IoTKit SecCtl NS block read: "
369
+ "unimplemented offset 0x%x\n", offset);
370
+ break;
371
+ case A_PID4:
372
+ case A_PID5:
373
+ case A_PID6:
374
+ case A_PID7:
375
+ case A_PID0:
376
+ case A_PID1:
377
+ case A_PID2:
378
+ case A_PID3:
379
+ case A_CID0:
380
+ case A_CID1:
381
+ case A_CID2:
382
+ case A_CID3:
383
+ r = iotkit_secctl_ns_idregs[(offset - A_PID4) / 4];
384
+ break;
385
+ default:
386
+ qemu_log_mask(LOG_GUEST_ERROR,
387
+ "IotKit SecCtl NS block write: bad offset 0x%x\n",
388
+ offset);
389
+ r = 0;
390
+ break;
391
+ }
392
+
393
+ if (size != 4) {
394
+ /* None of our registers are access-sensitive, so just pull the right
395
+ * byte out of the word read result.
396
+ */
397
+ r = extract32(r, (addr & 3) * 8, size * 8);
398
+ }
399
+
400
+ trace_iotkit_secctl_ns_read(offset, r, size);
401
+ *pdata = r;
402
+ return MEMTX_OK;
403
+}
404
+
405
+static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr,
406
+ uint64_t value,
407
+ unsigned size, MemTxAttrs attrs)
408
+{
409
+ uint32_t offset = addr;
410
+
411
+ trace_iotkit_secctl_ns_write(offset, value, size);
412
+
413
+ if (size != 4) {
414
+ /* Byte and halfword writes are ignored */
415
+ qemu_log_mask(LOG_GUEST_ERROR,
416
+ "IotKit SecCtl NS block write: bad size, ignored\n");
417
+ return MEMTX_OK;
418
+ }
419
+
420
+ switch (offset) {
421
+ case A_AHBNSPPPCEXP0:
422
+ case A_AHBNSPPPCEXP1:
423
+ case A_AHBNSPPPCEXP2:
424
+ case A_AHBNSPPPCEXP3:
425
+ case A_APBNSPPPC0:
426
+ case A_APBNSPPPC1:
427
+ case A_APBNSPPPCEXP0:
428
+ case A_APBNSPPPCEXP1:
429
+ case A_APBNSPPPCEXP2:
430
+ case A_APBNSPPPCEXP3:
431
+ qemu_log_mask(LOG_UNIMP,
432
+ "IoTKit SecCtl NS block write: "
433
+ "unimplemented offset 0x%x\n", offset);
434
+ break;
435
+ case A_AHBNSPPPC0:
436
+ case A_PID4:
437
+ case A_PID5:
438
+ case A_PID6:
439
+ case A_PID7:
440
+ case A_PID0:
441
+ case A_PID1:
442
+ case A_PID2:
443
+ case A_PID3:
444
+ case A_CID0:
445
+ case A_CID1:
446
+ case A_CID2:
447
+ case A_CID3:
448
+ qemu_log_mask(LOG_GUEST_ERROR,
449
+ "IoTKit SecCtl NS block write: "
450
+ "read-only offset 0x%x\n", offset);
451
+ break;
452
+ default:
453
+ qemu_log_mask(LOG_GUEST_ERROR,
454
+ "IotKit SecCtl NS block write: bad offset 0x%x\n",
455
+ offset);
456
+ break;
457
+ }
458
+
459
+ return MEMTX_OK;
460
+}
461
+
462
+static const MemoryRegionOps iotkit_secctl_s_ops = {
463
+ .read_with_attrs = iotkit_secctl_s_read,
464
+ .write_with_attrs = iotkit_secctl_s_write,
465
+ .endianness = DEVICE_LITTLE_ENDIAN,
466
+ .valid.min_access_size = 1,
467
+ .valid.max_access_size = 4,
468
+ .impl.min_access_size = 1,
469
+ .impl.max_access_size = 4,
470
+};
471
+
472
+static const MemoryRegionOps iotkit_secctl_ns_ops = {
473
+ .read_with_attrs = iotkit_secctl_ns_read,
474
+ .write_with_attrs = iotkit_secctl_ns_write,
475
+ .endianness = DEVICE_LITTLE_ENDIAN,
476
+ .valid.min_access_size = 1,
477
+ .valid.max_access_size = 4,
478
+ .impl.min_access_size = 1,
479
+ .impl.max_access_size = 4,
480
+};
481
+
482
+static void iotkit_secctl_reset(DeviceState *dev)
483
+{
484
+
485
+}
486
+
487
+static void iotkit_secctl_init(Object *obj)
488
+{
489
+ IoTKitSecCtl *s = IOTKIT_SECCTL(obj);
490
+ SysBusDevice *sbd = SYS_BUS_DEVICE(obj);
491
+
492
+ memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops,
493
+ s, "iotkit-secctl-s-regs", 0x1000);
494
+ memory_region_init_io(&s->ns_regs, obj, &iotkit_secctl_ns_ops,
495
+ s, "iotkit-secctl-ns-regs", 0x1000);
496
+ sysbus_init_mmio(sbd, &s->s_regs);
497
+ sysbus_init_mmio(sbd, &s->ns_regs);
498
+}
499
+
500
+static const VMStateDescription iotkit_secctl_vmstate = {
501
+ .name = "iotkit-secctl",
90
+ .version_id = 1,
502
+ .version_id = 1,
91
+ .minimum_version_id = 1,
503
+ .minimum_version_id = 1,
92
+ .fields = (VMStateField[]) {
504
+ .fields = (VMStateField[]) {
93
+ VMSTATE_I2C_SLAVE(parent_obj, sii9022_state),
94
+ VMSTATE_UINT8(ptr, sii9022_state),
95
+ VMSTATE_BOOL(addr_byte, sii9022_state),
96
+ VMSTATE_BOOL(ddc_req, sii9022_state),
97
+ VMSTATE_BOOL(ddc_skip_finish, sii9022_state),
98
+ VMSTATE_BOOL(ddc, sii9022_state),
99
+ VMSTATE_END_OF_LIST()
505
+ VMSTATE_END_OF_LIST()
100
+ }
506
+ }
101
+};
507
+};
102
+
508
+
103
+static int sii9022_event(I2CSlave *i2c, enum i2c_event event)
509
+static void iotkit_secctl_class_init(ObjectClass *klass, void *data)
104
+{
105
+ sii9022_state *s = SII9022(i2c);
106
+
107
+ switch (event) {
108
+ case I2C_START_SEND:
109
+ s->addr_byte = true;
110
+ break;
111
+ case I2C_START_RECV:
112
+ break;
113
+ case I2C_FINISH:
114
+ break;
115
+ case I2C_NACK:
116
+ break;
117
+ }
118
+
119
+ return 0;
120
+}
121
+
122
+static int sii9022_rx(I2CSlave *i2c)
123
+{
124
+ sii9022_state *s = SII9022(i2c);
125
+ uint8_t res = 0x00;
126
+
127
+ switch (s->ptr) {
128
+ case SII9022_SYS_CTRL_DATA:
129
+ if (s->ddc_req) {
130
+ /* Acknowledge DDC bus request */
131
+ res = SII9022_SYS_CTRL_DDC_BUS_GRTD | SII9022_SYS_CTRL_DDC_BUS_REQ;
132
+ }
133
+ break;
134
+ case SII9022_REG_CHIPID:
135
+ res = 0xb0;
136
+ break;
137
+ case SII9022_INT_STATUS:
138
+ /* Something is cold-plugged in, no interrupts */
139
+ res = SII9022_INT_STATUS_PLUGGED;
140
+ break;
141
+ default:
142
+ break;
143
+ }
144
+
145
+ trace_sii9022_read_reg(s->ptr, res);
146
+ s->ptr++;
147
+
148
+ return res;
149
+}
150
+
151
+static int sii9022_tx(I2CSlave *i2c, uint8_t data)
152
+{
153
+ sii9022_state *s = SII9022(i2c);
154
+
155
+ if (s->addr_byte) {
156
+ s->ptr = data;
157
+ s->addr_byte = false;
158
+ return 0;
159
+ }
160
+
161
+ switch (s->ptr) {
162
+ case SII9022_SYS_CTRL_DATA:
163
+ if (data & SII9022_SYS_CTRL_DDC_BUS_REQ) {
164
+ s->ddc_req = true;
165
+ if (data & SII9022_SYS_CTRL_DDC_BUS_GRTD) {
166
+ s->ddc = true;
167
+ /* Skip this finish since we just switched to DDC */
168
+ s->ddc_skip_finish = true;
169
+ trace_sii9022_switch_mode("DDC");
170
+ }
171
+ } else {
172
+ s->ddc_req = false;
173
+ s->ddc = false;
174
+ trace_sii9022_switch_mode("normal");
175
+ }
176
+ break;
177
+ default:
178
+ break;
179
+ }
180
+
181
+ trace_sii9022_write_reg(s->ptr, data);
182
+ s->ptr++;
183
+
184
+ return 0;
185
+}
186
+
187
+static void sii9022_reset(DeviceState *dev)
188
+{
189
+ sii9022_state *s = SII9022(dev);
190
+
191
+ s->ptr = 0;
192
+ s->addr_byte = false;
193
+ s->ddc_req = false;
194
+ s->ddc_skip_finish = false;
195
+ s->ddc = false;
196
+}
197
+
198
+static void sii9022_realize(DeviceState *dev, Error **errp)
199
+{
200
+ I2CBus *bus;
201
+
202
+ bus = I2C_BUS(qdev_get_parent_bus(dev));
203
+ i2c_create_slave(bus, TYPE_I2CDDC, 0x50);
204
+}
205
+
206
+static void sii9022_class_init(ObjectClass *klass, void *data)
207
+{
510
+{
208
+ DeviceClass *dc = DEVICE_CLASS(klass);
511
+ DeviceClass *dc = DEVICE_CLASS(klass);
209
+ I2CSlaveClass *k = I2C_SLAVE_CLASS(klass);
512
+
210
+
513
+ dc->vmsd = &iotkit_secctl_vmstate;
211
+ k->event = sii9022_event;
514
+ dc->reset = iotkit_secctl_reset;
212
+ k->recv = sii9022_rx;
515
+}
213
+ k->send = sii9022_tx;
516
+
214
+ dc->reset = sii9022_reset;
517
+static const TypeInfo iotkit_secctl_info = {
215
+ dc->realize = sii9022_realize;
518
+ .name = TYPE_IOTKIT_SECCTL,
216
+ dc->vmsd = &vmstate_sii9022;
519
+ .parent = TYPE_SYS_BUS_DEVICE,
217
+}
520
+ .instance_size = sizeof(IoTKitSecCtl),
218
+
521
+ .instance_init = iotkit_secctl_init,
219
+static const TypeInfo sii9022_info = {
522
+ .class_init = iotkit_secctl_class_init,
220
+ .name = TYPE_SII9022,
221
+ .parent = TYPE_I2C_SLAVE,
222
+ .instance_size = sizeof(sii9022_state),
223
+ .class_init = sii9022_class_init,
224
+};
523
+};
225
+
524
+
226
+static void sii9022_register_types(void)
525
+static void iotkit_secctl_register_types(void)
227
+{
526
+{
228
+ type_register_static(&sii9022_info);
527
+ type_register_static(&iotkit_secctl_info);
229
+}
528
+}
230
+
529
+
231
+type_init(sii9022_register_types)
530
+type_init(iotkit_secctl_register_types);
232
diff --git a/hw/display/trace-events b/hw/display/trace-events
531
diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak
233
index XXXXXXX..XXXXXXX 100644
532
index XXXXXXX..XXXXXXX 100644
234
--- a/hw/display/trace-events
533
--- a/default-configs/arm-softmmu.mak
235
+++ b/hw/display/trace-events
534
+++ b/default-configs/arm-softmmu.mak
236
@@ -XXX,XX +XXX,XX @@ vga_cirrus_read_io(uint32_t addr, uint32_t val) "addr 0x%x, val 0x%x"
535
@@ -XXX,XX +XXX,XX @@ CONFIG_MPS2_FPGAIO=y
237
vga_cirrus_write_io(uint32_t addr, uint32_t val) "addr 0x%x, val 0x%x"
536
CONFIG_MPS2_SCC=y
238
vga_cirrus_read_blt(uint32_t offset, uint32_t val) "offset 0x%x, val 0x%x"
537
239
vga_cirrus_write_blt(uint32_t offset, uint32_t val) "offset 0x%x, val 0x%x"
538
CONFIG_TZ_PPC=y
240
+
539
+CONFIG_IOTKIT_SECCTL=y
241
+# hw/display/sii9022.c
540
242
+sii9022_read_reg(uint8_t addr, uint8_t val) "addr 0x%02x, val 0x%02x"
541
CONFIG_VERSATILE_PCI=y
243
+sii9022_write_reg(uint8_t addr, uint8_t val) "addr 0x%02x, val 0x%02x"
542
CONFIG_VERSATILE_I2C=y
244
+sii9022_switch_mode(const char *mode) "mode: %s"
543
diff --git a/hw/misc/trace-events b/hw/misc/trace-events
544
index XXXXXXX..XXXXXXX 100644
545
--- a/hw/misc/trace-events
546
+++ b/hw/misc/trace-events
547
@@ -XXX,XX +XXX,XX @@ tz_ppc_irq_clear(int level) "TZ PPC: int_clear = %d"
548
tz_ppc_update_irq(int level) "TZ PPC: setting irq line to %d"
549
tz_ppc_read_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " read (secure %d user %d) blocked"
550
tz_ppc_write_blocked(int n, hwaddr offset, bool secure, bool user) "TZ PPC: port %d offset 0x%" HWADDR_PRIx " write (secure %d user %d) blocked"
551
+
552
+# hw/misc/iotkit-secctl.c
553
+iotkit_secctl_s_read(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl S regs read: offset 0x%x data 0x%" PRIx64 " size %u"
554
+iotkit_secctl_s_write(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl S regs write: offset 0x%x data 0x%" PRIx64 " size %u"
555
+iotkit_secctl_ns_read(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl NS regs read: offset 0x%x data 0x%" PRIx64 " size %u"
556
+iotkit_secctl_ns_write(uint32_t offset, uint64_t data, unsigned size) "IoTKit SecCtl NS regs write: offset 0x%x data 0x%" PRIx64 " size %u"
557
+iotkit_secctl_reset(void) "IoTKit SecCtl: reset"
245
--
558
--
246
2.16.2
559
2.16.2
247
560
248
561
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
The IoTKit Security Controller includes various registers
2
that expose to software the controls for the Peripheral
3
Protection Controllers in the system. Implement these.
2
4
3
As some of the constants here will also be needed
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
elsewhere (specifically for the upcoming SVE support) we move them out
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
to softfloat.h.
7
Message-id: 20180220180325.29818-17-peter.maydell@linaro.org
8
---
9
include/hw/misc/iotkit-secctl.h | 64 +++++++++-
10
hw/misc/iotkit-secctl.c | 270 +++++++++++++++++++++++++++++++++++++---
11
2 files changed, 315 insertions(+), 19 deletions(-)
6
12
7
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
13
diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Message-id: 20180227143852.11175-13-alex.bennee@linaro.org
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
12
include/fpu/softfloat.h | 18 +++++++++++++-----
13
target/arm/helper-a64.h | 2 ++
14
target/arm/helper-a64.c | 34 ++++++++++++++++++++++++++++++++++
15
target/arm/translate-a64.c | 6 ++++++
16
4 files changed, 55 insertions(+), 5 deletions(-)
17
18
diff --git a/include/fpu/softfloat.h b/include/fpu/softfloat.h
19
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
20
--- a/include/fpu/softfloat.h
15
--- a/include/hw/misc/iotkit-secctl.h
21
+++ b/include/fpu/softfloat.h
16
+++ b/include/hw/misc/iotkit-secctl.h
22
@@ -XXX,XX +XXX,XX @@ static inline float16 float16_set_sign(float16 a, int sign)
17
@@ -XXX,XX +XXX,XX @@
18
* QEMU interface:
19
* + sysbus MMIO region 0 is the "secure privilege control block" registers
20
* + sysbus MMIO region 1 is the "non-secure privilege control block" registers
21
+ * + named GPIO output "sec_resp_cfg" indicating whether blocked accesses
22
+ * should RAZ/WI or bus error
23
+ * Controlling the 2 APB PPCs in the IoTKit:
24
+ * + named GPIO outputs apb_ppc0_nonsec[0..2] and apb_ppc1_nonsec
25
+ * + named GPIO outputs apb_ppc0_ap[0..2] and apb_ppc1_ap
26
+ * + named GPIO outputs apb_ppc{0,1}_irq_enable
27
+ * + named GPIO outputs apb_ppc{0,1}_irq_clear
28
+ * + named GPIO inputs apb_ppc{0,1}_irq_status
29
+ * Controlling each of the 4 expansion APB PPCs which a system using the IoTKit
30
+ * might provide:
31
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_nonsec[0..15]
32
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_ap[0..15]
33
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_enable
34
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_clear
35
+ * + named GPIO inputs apb_ppcexp{0,1,2,3}_irq_status
36
+ * Controlling each of the 4 expansion AHB PPCs which a system using the IoTKit
37
+ * might provide:
38
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_nonsec[0..15]
39
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_ap[0..15]
40
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_enable
41
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_clear
42
+ * + named GPIO inputs ahb_ppcexp{0,1,2,3}_irq_status
43
*/
44
45
#ifndef IOTKIT_SECCTL_H
46
@@ -XXX,XX +XXX,XX @@
47
#define TYPE_IOTKIT_SECCTL "iotkit-secctl"
48
#define IOTKIT_SECCTL(obj) OBJECT_CHECK(IoTKitSecCtl, (obj), TYPE_IOTKIT_SECCTL)
49
50
-typedef struct IoTKitSecCtl {
51
+#define IOTS_APB_PPC0_NUM_PORTS 3
52
+#define IOTS_APB_PPC1_NUM_PORTS 1
53
+#define IOTS_PPC_NUM_PORTS 16
54
+#define IOTS_NUM_APB_PPC 2
55
+#define IOTS_NUM_APB_EXP_PPC 4
56
+#define IOTS_NUM_AHB_EXP_PPC 4
57
+
58
+typedef struct IoTKitSecCtl IoTKitSecCtl;
59
+
60
+/* State and IRQ lines relating to a PPC. For the
61
+ * PPCs in the IoTKit not all the IRQ lines are used.
62
+ */
63
+typedef struct IoTKitSecCtlPPC {
64
+ qemu_irq nonsec[IOTS_PPC_NUM_PORTS];
65
+ qemu_irq ap[IOTS_PPC_NUM_PORTS];
66
+ qemu_irq irq_enable;
67
+ qemu_irq irq_clear;
68
+
69
+ uint32_t ns;
70
+ uint32_t sp;
71
+ uint32_t nsp;
72
+
73
+ /* Number of ports actually present */
74
+ int numports;
75
+ /* Offset of this PPC's interrupt bits in SECPPCINTSTAT */
76
+ int irq_bit_offset;
77
+ IoTKitSecCtl *parent;
78
+} IoTKitSecCtlPPC;
79
+
80
+struct IoTKitSecCtl {
81
/*< private >*/
82
SysBusDevice parent_obj;
83
84
/*< public >*/
85
+ qemu_irq sec_resp_cfg;
86
87
MemoryRegion s_regs;
88
MemoryRegion ns_regs;
89
-} IoTKitSecCtl;
90
+
91
+ uint32_t secppcintstat;
92
+ uint32_t secppcinten;
93
+ uint32_t secrespcfg;
94
+
95
+ IoTKitSecCtlPPC apb[IOTS_NUM_APB_PPC];
96
+ IoTKitSecCtlPPC apbexp[IOTS_NUM_APB_EXP_PPC];
97
+ IoTKitSecCtlPPC ahbexp[IOTS_NUM_APB_EXP_PPC];
98
+};
99
100
#endif
101
diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c
102
index XXXXXXX..XXXXXXX 100644
103
--- a/hw/misc/iotkit-secctl.c
104
+++ b/hw/misc/iotkit-secctl.c
105
@@ -XXX,XX +XXX,XX @@ static const uint8_t iotkit_secctl_ns_idregs[] = {
106
0x0d, 0xf0, 0x05, 0xb1,
107
};
108
109
+/* The register sets for the various PPCs (AHB internal, APB internal,
110
+ * AHB expansion, APB expansion) are all set up so that they are
111
+ * in 16-aligned blocks so offsets 0xN0, 0xN4, 0xN8, 0xNC are PPCs
112
+ * 0, 1, 2, 3 of that type, so we can convert a register address offset
113
+ * into an an index into a PPC array easily.
114
+ */
115
+static inline int offset_to_ppc_idx(uint32_t offset)
116
+{
117
+ return extract32(offset, 2, 2);
118
+}
119
+
120
+typedef void PerPPCFunction(IoTKitSecCtlPPC *ppc);
121
+
122
+static void foreach_ppc(IoTKitSecCtl *s, PerPPCFunction *fn)
123
+{
124
+ int i;
125
+
126
+ for (i = 0; i < IOTS_NUM_APB_PPC; i++) {
127
+ fn(&s->apb[i]);
128
+ }
129
+ for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) {
130
+ fn(&s->apbexp[i]);
131
+ }
132
+ for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) {
133
+ fn(&s->ahbexp[i]);
134
+ }
135
+}
136
+
137
static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
138
uint64_t *pdata,
139
unsigned size, MemTxAttrs attrs)
140
{
141
uint64_t r;
142
uint32_t offset = addr & ~0x3;
143
+ IoTKitSecCtl *s = IOTKIT_SECCTL(opaque);
144
145
switch (offset) {
146
case A_AHBNSPPC0:
147
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
148
r = 0;
149
break;
150
case A_SECRESPCFG:
151
- case A_NSCCFG:
152
- case A_SECMPCINTSTATUS:
153
+ r = s->secrespcfg;
154
+ break;
155
case A_SECPPCINTSTAT:
156
+ r = s->secppcintstat;
157
+ break;
158
case A_SECPPCINTEN:
159
- case A_SECMSCINTSTAT:
160
- case A_SECMSCINTEN:
161
- case A_BRGINTSTAT:
162
- case A_BRGINTEN:
163
+ r = s->secppcinten;
164
+ break;
165
case A_AHBNSPPCEXP0:
166
case A_AHBNSPPCEXP1:
167
case A_AHBNSPPCEXP2:
168
case A_AHBNSPPCEXP3:
169
+ r = s->ahbexp[offset_to_ppc_idx(offset)].ns;
170
+ break;
171
case A_APBNSPPC0:
172
case A_APBNSPPC1:
173
+ r = s->apb[offset_to_ppc_idx(offset)].ns;
174
+ break;
175
case A_APBNSPPCEXP0:
176
case A_APBNSPPCEXP1:
177
case A_APBNSPPCEXP2:
178
case A_APBNSPPCEXP3:
179
+ r = s->apbexp[offset_to_ppc_idx(offset)].ns;
180
+ break;
181
case A_AHBSPPPCEXP0:
182
case A_AHBSPPPCEXP1:
183
case A_AHBSPPPCEXP2:
184
case A_AHBSPPPCEXP3:
185
+ r = s->apbexp[offset_to_ppc_idx(offset)].sp;
186
+ break;
187
case A_APBSPPPC0:
188
case A_APBSPPPC1:
189
+ r = s->apb[offset_to_ppc_idx(offset)].sp;
190
+ break;
191
case A_APBSPPPCEXP0:
192
case A_APBSPPPCEXP1:
193
case A_APBSPPPCEXP2:
194
case A_APBSPPPCEXP3:
195
+ r = s->apbexp[offset_to_ppc_idx(offset)].sp;
196
+ break;
197
+ case A_NSCCFG:
198
+ case A_SECMPCINTSTATUS:
199
+ case A_SECMSCINTSTAT:
200
+ case A_SECMSCINTEN:
201
+ case A_BRGINTSTAT:
202
+ case A_BRGINTEN:
203
case A_NSMSCEXP:
204
qemu_log_mask(LOG_UNIMP,
205
"IoTKit SecCtl S block read: "
206
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
207
return MEMTX_OK;
23
}
208
}
24
209
25
#define float16_zero make_float16(0)
210
+static void iotkit_secctl_update_ppc_ap(IoTKitSecCtlPPC *ppc)
26
-#define float16_one make_float16(0x3c00)
211
+{
27
#define float16_half make_float16(0x3800)
212
+ int i;
28
+#define float16_one make_float16(0x3c00)
213
+
29
+#define float16_one_point_five make_float16(0x3e00)
214
+ for (i = 0; i < ppc->numports; i++) {
30
+#define float16_two make_float16(0x4000)
215
+ bool v;
31
+#define float16_three make_float16(0x4200)
216
+
32
#define float16_infinity make_float16(0x7c00)
217
+ if (extract32(ppc->ns, i, 1)) {
33
218
+ v = extract32(ppc->nsp, i, 1);
34
/*----------------------------------------------------------------------------
219
+ } else {
35
@@ -XXX,XX +XXX,XX @@ static inline float32 float32_set_sign(float32 a, int sign)
220
+ v = extract32(ppc->sp, i, 1);
221
+ }
222
+ qemu_set_irq(ppc->ap[i], v);
223
+ }
224
+}
225
+
226
+static void iotkit_secctl_ppc_ns_write(IoTKitSecCtlPPC *ppc, uint32_t value)
227
+{
228
+ int i;
229
+
230
+ ppc->ns = value & MAKE_64BIT_MASK(0, ppc->numports);
231
+ for (i = 0; i < ppc->numports; i++) {
232
+ qemu_set_irq(ppc->nonsec[i], extract32(ppc->ns, i, 1));
233
+ }
234
+ iotkit_secctl_update_ppc_ap(ppc);
235
+}
236
+
237
+static void iotkit_secctl_ppc_sp_write(IoTKitSecCtlPPC *ppc, uint32_t value)
238
+{
239
+ ppc->sp = value & MAKE_64BIT_MASK(0, ppc->numports);
240
+ iotkit_secctl_update_ppc_ap(ppc);
241
+}
242
+
243
+static void iotkit_secctl_ppc_nsp_write(IoTKitSecCtlPPC *ppc, uint32_t value)
244
+{
245
+ ppc->nsp = value & MAKE_64BIT_MASK(0, ppc->numports);
246
+ iotkit_secctl_update_ppc_ap(ppc);
247
+}
248
+
249
+static void iotkit_secctl_ppc_update_irq_clear(IoTKitSecCtlPPC *ppc)
250
+{
251
+ uint32_t value = ppc->parent->secppcintstat;
252
+
253
+ qemu_set_irq(ppc->irq_clear, extract32(value, ppc->irq_bit_offset, 1));
254
+}
255
+
256
+static void iotkit_secctl_ppc_update_irq_enable(IoTKitSecCtlPPC *ppc)
257
+{
258
+ uint32_t value = ppc->parent->secppcinten;
259
+
260
+ qemu_set_irq(ppc->irq_enable, extract32(value, ppc->irq_bit_offset, 1));
261
+}
262
+
263
static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
264
uint64_t value,
265
unsigned size, MemTxAttrs attrs)
266
{
267
+ IoTKitSecCtl *s = IOTKIT_SECCTL(opaque);
268
uint32_t offset = addr;
269
+ IoTKitSecCtlPPC *ppc;
270
271
trace_iotkit_secctl_s_write(offset, value, size);
272
273
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
274
275
switch (offset) {
276
case A_SECRESPCFG:
277
- case A_NSCCFG:
278
+ value &= 1;
279
+ s->secrespcfg = value;
280
+ qemu_set_irq(s->sec_resp_cfg, s->secrespcfg);
281
+ break;
282
case A_SECPPCINTCLR:
283
+ value &= 0x00f000f3;
284
+ foreach_ppc(s, iotkit_secctl_ppc_update_irq_clear);
285
+ break;
286
case A_SECPPCINTEN:
287
- case A_SECMSCINTCLR:
288
- case A_SECMSCINTEN:
289
- case A_BRGINTCLR:
290
- case A_BRGINTEN:
291
+ s->secppcinten = value & 0x00f000f3;
292
+ foreach_ppc(s, iotkit_secctl_ppc_update_irq_enable);
293
+ break;
294
case A_AHBNSPPCEXP0:
295
case A_AHBNSPPCEXP1:
296
case A_AHBNSPPCEXP2:
297
case A_AHBNSPPCEXP3:
298
+ ppc = &s->ahbexp[offset_to_ppc_idx(offset)];
299
+ iotkit_secctl_ppc_ns_write(ppc, value);
300
+ break;
301
case A_APBNSPPC0:
302
case A_APBNSPPC1:
303
+ ppc = &s->apb[offset_to_ppc_idx(offset)];
304
+ iotkit_secctl_ppc_ns_write(ppc, value);
305
+ break;
306
case A_APBNSPPCEXP0:
307
case A_APBNSPPCEXP1:
308
case A_APBNSPPCEXP2:
309
case A_APBNSPPCEXP3:
310
+ ppc = &s->apbexp[offset_to_ppc_idx(offset)];
311
+ iotkit_secctl_ppc_ns_write(ppc, value);
312
+ break;
313
case A_AHBSPPPCEXP0:
314
case A_AHBSPPPCEXP1:
315
case A_AHBSPPPCEXP2:
316
case A_AHBSPPPCEXP3:
317
+ ppc = &s->ahbexp[offset_to_ppc_idx(offset)];
318
+ iotkit_secctl_ppc_sp_write(ppc, value);
319
+ break;
320
case A_APBSPPPC0:
321
case A_APBSPPPC1:
322
+ ppc = &s->apb[offset_to_ppc_idx(offset)];
323
+ iotkit_secctl_ppc_sp_write(ppc, value);
324
+ break;
325
case A_APBSPPPCEXP0:
326
case A_APBSPPPCEXP1:
327
case A_APBSPPPCEXP2:
328
case A_APBSPPPCEXP3:
329
+ ppc = &s->apbexp[offset_to_ppc_idx(offset)];
330
+ iotkit_secctl_ppc_sp_write(ppc, value);
331
+ break;
332
+ case A_NSCCFG:
333
+ case A_SECMSCINTCLR:
334
+ case A_SECMSCINTEN:
335
+ case A_BRGINTCLR:
336
+ case A_BRGINTEN:
337
qemu_log_mask(LOG_UNIMP,
338
"IoTKit SecCtl S block write: "
339
"unimplemented offset 0x%x\n", offset);
340
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr,
341
uint64_t *pdata,
342
unsigned size, MemTxAttrs attrs)
343
{
344
+ IoTKitSecCtl *s = IOTKIT_SECCTL(opaque);
345
uint64_t r;
346
uint32_t offset = addr & ~0x3;
347
348
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_read(void *opaque, hwaddr addr,
349
case A_AHBNSPPPCEXP1:
350
case A_AHBNSPPPCEXP2:
351
case A_AHBNSPPPCEXP3:
352
+ r = s->ahbexp[offset_to_ppc_idx(offset)].nsp;
353
+ break;
354
case A_APBNSPPPC0:
355
case A_APBNSPPPC1:
356
+ r = s->apb[offset_to_ppc_idx(offset)].nsp;
357
+ break;
358
case A_APBNSPPPCEXP0:
359
case A_APBNSPPPCEXP1:
360
case A_APBNSPPPCEXP2:
361
case A_APBNSPPPCEXP3:
362
- qemu_log_mask(LOG_UNIMP,
363
- "IoTKit SecCtl NS block read: "
364
- "unimplemented offset 0x%x\n", offset);
365
+ r = s->apbexp[offset_to_ppc_idx(offset)].nsp;
366
break;
367
case A_PID4:
368
case A_PID5:
369
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr,
370
uint64_t value,
371
unsigned size, MemTxAttrs attrs)
372
{
373
+ IoTKitSecCtl *s = IOTKIT_SECCTL(opaque);
374
uint32_t offset = addr;
375
+ IoTKitSecCtlPPC *ppc;
376
377
trace_iotkit_secctl_ns_write(offset, value, size);
378
379
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_ns_write(void *opaque, hwaddr addr,
380
case A_AHBNSPPPCEXP1:
381
case A_AHBNSPPPCEXP2:
382
case A_AHBNSPPPCEXP3:
383
+ ppc = &s->ahbexp[offset_to_ppc_idx(offset)];
384
+ iotkit_secctl_ppc_nsp_write(ppc, value);
385
+ break;
386
case A_APBNSPPPC0:
387
case A_APBNSPPPC1:
388
+ ppc = &s->apb[offset_to_ppc_idx(offset)];
389
+ iotkit_secctl_ppc_nsp_write(ppc, value);
390
+ break;
391
case A_APBNSPPPCEXP0:
392
case A_APBNSPPPCEXP1:
393
case A_APBNSPPPCEXP2:
394
case A_APBNSPPPCEXP3:
395
- qemu_log_mask(LOG_UNIMP,
396
- "IoTKit SecCtl NS block write: "
397
- "unimplemented offset 0x%x\n", offset);
398
+ ppc = &s->apbexp[offset_to_ppc_idx(offset)];
399
+ iotkit_secctl_ppc_nsp_write(ppc, value);
400
break;
401
case A_AHBNSPPPC0:
402
case A_PID4:
403
@@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps iotkit_secctl_ns_ops = {
404
.impl.max_access_size = 4,
405
};
406
407
+static void iotkit_secctl_reset_ppc(IoTKitSecCtlPPC *ppc)
408
+{
409
+ ppc->ns = 0;
410
+ ppc->sp = 0;
411
+ ppc->nsp = 0;
412
+}
413
+
414
static void iotkit_secctl_reset(DeviceState *dev)
415
{
416
+ IoTKitSecCtl *s = IOTKIT_SECCTL(dev);
417
418
+ s->secppcintstat = 0;
419
+ s->secppcinten = 0;
420
+ s->secrespcfg = 0;
421
+
422
+ foreach_ppc(s, iotkit_secctl_reset_ppc);
423
+}
424
+
425
+static void iotkit_secctl_ppc_irqstatus(void *opaque, int n, int level)
426
+{
427
+ IoTKitSecCtlPPC *ppc = opaque;
428
+ IoTKitSecCtl *s = IOTKIT_SECCTL(ppc->parent);
429
+ int irqbit = ppc->irq_bit_offset + n;
430
+
431
+ s->secppcintstat = deposit32(s->secppcintstat, irqbit, 1, level);
432
+}
433
+
434
+static void iotkit_secctl_init_ppc(IoTKitSecCtl *s,
435
+ IoTKitSecCtlPPC *ppc,
436
+ const char *name,
437
+ int numports,
438
+ int irq_bit_offset)
439
+{
440
+ char *gpioname;
441
+ DeviceState *dev = DEVICE(s);
442
+
443
+ ppc->numports = numports;
444
+ ppc->irq_bit_offset = irq_bit_offset;
445
+ ppc->parent = s;
446
+
447
+ gpioname = g_strdup_printf("%s_nonsec", name);
448
+ qdev_init_gpio_out_named(dev, ppc->nonsec, gpioname, numports);
449
+ g_free(gpioname);
450
+ gpioname = g_strdup_printf("%s_ap", name);
451
+ qdev_init_gpio_out_named(dev, ppc->ap, gpioname, numports);
452
+ g_free(gpioname);
453
+ gpioname = g_strdup_printf("%s_irq_enable", name);
454
+ qdev_init_gpio_out_named(dev, &ppc->irq_enable, gpioname, 1);
455
+ g_free(gpioname);
456
+ gpioname = g_strdup_printf("%s_irq_clear", name);
457
+ qdev_init_gpio_out_named(dev, &ppc->irq_clear, gpioname, 1);
458
+ g_free(gpioname);
459
+ gpioname = g_strdup_printf("%s_irq_status", name);
460
+ qdev_init_gpio_in_named_with_opaque(dev, iotkit_secctl_ppc_irqstatus,
461
+ ppc, gpioname, 1);
462
+ g_free(gpioname);
36
}
463
}
37
464
38
#define float32_zero make_float32(0)
465
static void iotkit_secctl_init(Object *obj)
39
-#define float32_one make_float32(0x3f800000)
466
{
40
#define float32_half make_float32(0x3f000000)
467
IoTKitSecCtl *s = IOTKIT_SECCTL(obj);
41
+#define float32_one make_float32(0x3f800000)
468
SysBusDevice *sbd = SYS_BUS_DEVICE(obj);
42
+#define float32_one_point_five make_float32(0x3fc00000)
469
+ DeviceState *dev = DEVICE(obj);
43
+#define float32_two make_float32(0x40000000)
470
+ int i;
44
+#define float32_three make_float32(0x40400000)
471
+
45
#define float32_infinity make_float32(0x7f800000)
472
+ iotkit_secctl_init_ppc(s, &s->apb[0], "apb_ppc0",
46
473
+ IOTS_APB_PPC0_NUM_PORTS, 0);
47
-
474
+ iotkit_secctl_init_ppc(s, &s->apb[1], "apb_ppc1",
48
/*----------------------------------------------------------------------------
475
+ IOTS_APB_PPC1_NUM_PORTS, 1);
49
| The pattern for a default generated single-precision NaN.
476
+
50
*----------------------------------------------------------------------------*/
477
+ for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) {
51
@@ -XXX,XX +XXX,XX @@ static inline float64 float64_set_sign(float64 a, int sign)
478
+ IoTKitSecCtlPPC *ppc = &s->apbexp[i];
479
+ char *ppcname = g_strdup_printf("apb_ppcexp%d", i);
480
+ iotkit_secctl_init_ppc(s, ppc, ppcname, IOTS_PPC_NUM_PORTS, 4 + i);
481
+ g_free(ppcname);
482
+ }
483
+ for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) {
484
+ IoTKitSecCtlPPC *ppc = &s->ahbexp[i];
485
+ char *ppcname = g_strdup_printf("ahb_ppcexp%d", i);
486
+ iotkit_secctl_init_ppc(s, ppc, ppcname, IOTS_PPC_NUM_PORTS, 20 + i);
487
+ g_free(ppcname);
488
+ }
489
+
490
+ qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1);
491
492
memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops,
493
s, "iotkit-secctl-s-regs", 0x1000);
494
@@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_init(Object *obj)
495
sysbus_init_mmio(sbd, &s->ns_regs);
52
}
496
}
53
497
54
#define float64_zero make_float64(0)
498
+static const VMStateDescription iotkit_secctl_ppc_vmstate = {
55
-#define float64_one make_float64(0x3ff0000000000000LL)
499
+ .name = "iotkit-secctl-ppc",
56
-#define float64_ln2 make_float64(0x3fe62e42fefa39efLL)
500
+ .version_id = 1,
57
#define float64_half make_float64(0x3fe0000000000000LL)
501
+ .minimum_version_id = 1,
58
+#define float64_one make_float64(0x3ff0000000000000LL)
502
+ .fields = (VMStateField[]) {
59
+#define float64_one_point_five make_float64(0x3FF8000000000000ULL)
503
+ VMSTATE_UINT32(ns, IoTKitSecCtlPPC),
60
+#define float64_two make_float64(0x4000000000000000ULL)
504
+ VMSTATE_UINT32(sp, IoTKitSecCtlPPC),
61
+#define float64_three make_float64(0x4008000000000000ULL)
505
+ VMSTATE_UINT32(nsp, IoTKitSecCtlPPC),
62
+#define float64_ln2 make_float64(0x3fe62e42fefa39efLL)
506
+ VMSTATE_END_OF_LIST()
63
#define float64_infinity make_float64(0x7ff0000000000000LL)
507
+ }
64
508
+};
65
/*----------------------------------------------------------------------------
509
+
66
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
510
static const VMStateDescription iotkit_secctl_vmstate = {
67
index XXXXXXX..XXXXXXX 100644
511
.name = "iotkit-secctl",
68
--- a/target/arm/helper-a64.h
512
.version_id = 1,
69
+++ b/target/arm/helper-a64.h
513
.minimum_version_id = 1,
70
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_3(vfp_mulxd, TCG_CALL_NO_RWG, f64, f64, f64, ptr)
514
.fields = (VMStateField[]) {
71
DEF_HELPER_FLAGS_3(neon_ceq_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr)
515
+ VMSTATE_UINT32(secppcintstat, IoTKitSecCtl),
72
DEF_HELPER_FLAGS_3(neon_cge_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr)
516
+ VMSTATE_UINT32(secppcinten, IoTKitSecCtl),
73
DEF_HELPER_FLAGS_3(neon_cgt_f64, TCG_CALL_NO_RWG, i64, i64, i64, ptr)
517
+ VMSTATE_UINT32(secrespcfg, IoTKitSecCtl),
74
+DEF_HELPER_FLAGS_3(recpsf_f16, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
518
+ VMSTATE_STRUCT_ARRAY(apb, IoTKitSecCtl, IOTS_NUM_APB_PPC, 1,
75
DEF_HELPER_FLAGS_3(recpsf_f32, TCG_CALL_NO_RWG, f32, f32, f32, ptr)
519
+ iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC),
76
DEF_HELPER_FLAGS_3(recpsf_f64, TCG_CALL_NO_RWG, f64, f64, f64, ptr)
520
+ VMSTATE_STRUCT_ARRAY(apbexp, IoTKitSecCtl, IOTS_NUM_APB_EXP_PPC, 1,
77
+DEF_HELPER_FLAGS_3(rsqrtsf_f16, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
521
+ iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC),
78
DEF_HELPER_FLAGS_3(rsqrtsf_f32, TCG_CALL_NO_RWG, f32, f32, f32, ptr)
522
+ VMSTATE_STRUCT_ARRAY(ahbexp, IoTKitSecCtl, IOTS_NUM_AHB_EXP_PPC, 1,
79
DEF_HELPER_FLAGS_3(rsqrtsf_f64, TCG_CALL_NO_RWG, f64, f64, f64, ptr)
523
+ iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC),
80
DEF_HELPER_FLAGS_1(neon_addlp_s8, TCG_CALL_NO_RWG_SE, i64, i64)
524
VMSTATE_END_OF_LIST()
81
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
525
}
82
index XXXXXXX..XXXXXXX 100644
526
};
83
--- a/target/arm/helper-a64.c
84
+++ b/target/arm/helper-a64.c
85
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_cgt_f64)(float64 a, float64 b, void *fpstp)
86
* versions, these do a fully fused multiply-add or
87
* multiply-add-and-halve.
88
*/
89
+#define float16_two make_float16(0x4000)
90
+#define float16_three make_float16(0x4200)
91
+#define float16_one_point_five make_float16(0x3e00)
92
+
93
#define float32_two make_float32(0x40000000)
94
#define float32_three make_float32(0x40400000)
95
#define float32_one_point_five make_float32(0x3fc00000)
96
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_cgt_f64)(float64 a, float64 b, void *fpstp)
97
#define float64_three make_float64(0x4008000000000000ULL)
98
#define float64_one_point_five make_float64(0x3FF8000000000000ULL)
99
100
+float16 HELPER(recpsf_f16)(float16 a, float16 b, void *fpstp)
101
+{
102
+ float_status *fpst = fpstp;
103
+
104
+ a = float16_squash_input_denormal(a, fpst);
105
+ b = float16_squash_input_denormal(b, fpst);
106
+
107
+ a = float16_chs(a);
108
+ if ((float16_is_infinity(a) && float16_is_zero(b)) ||
109
+ (float16_is_infinity(b) && float16_is_zero(a))) {
110
+ return float16_two;
111
+ }
112
+ return float16_muladd(a, b, float16_two, 0, fpst);
113
+}
114
+
115
float32 HELPER(recpsf_f32)(float32 a, float32 b, void *fpstp)
116
{
117
float_status *fpst = fpstp;
118
@@ -XXX,XX +XXX,XX @@ float64 HELPER(recpsf_f64)(float64 a, float64 b, void *fpstp)
119
return float64_muladd(a, b, float64_two, 0, fpst);
120
}
121
122
+float16 HELPER(rsqrtsf_f16)(float16 a, float16 b, void *fpstp)
123
+{
124
+ float_status *fpst = fpstp;
125
+
126
+ a = float16_squash_input_denormal(a, fpst);
127
+ b = float16_squash_input_denormal(b, fpst);
128
+
129
+ a = float16_chs(a);
130
+ if ((float16_is_infinity(a) && float16_is_zero(b)) ||
131
+ (float16_is_infinity(b) && float16_is_zero(a))) {
132
+ return float16_one_point_five;
133
+ }
134
+ return float16_muladd(a, b, float16_three, float_muladd_halve_result, fpst);
135
+}
136
+
137
float32 HELPER(rsqrtsf_f32)(float32 a, float32 b, void *fpstp)
138
{
139
float_status *fpst = fpstp;
140
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
141
index XXXXXXX..XXXXXXX 100644
142
--- a/target/arm/translate-a64.c
143
+++ b/target/arm/translate-a64.c
144
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
145
case 0x6: /* FMAX */
146
gen_helper_advsimd_maxh(tcg_res, tcg_op1, tcg_op2, fpst);
147
break;
148
+ case 0x7: /* FRECPS */
149
+ gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
150
+ break;
151
case 0x8: /* FMINNM */
152
gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
153
break;
154
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
155
case 0xe: /* FMIN */
156
gen_helper_advsimd_minh(tcg_res, tcg_op1, tcg_op2, fpst);
157
break;
158
+ case 0xf: /* FRSQRTS */
159
+ gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
160
+ break;
161
case 0x13: /* FMUL */
162
gen_helper_advsimd_mulh(tcg_res, tcg_op1, tcg_op2, fpst);
163
break;
164
--
527
--
165
2.16.2
528
2.16.2
166
529
167
530
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Add remaining easy registers to iotkit-secctl:
2
* NSCCFG just routes its two bits out to external GPIO lines
3
* BRGINSTAT/BRGINTCLR/BRGINTEN can be dummies, because QEMU's
4
bus fabric can never report errors
2
5
3
Neither of these operations alter the floating point status registers
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
so we can do a pure bitwise operation, either squashing any sign
7
Message-id: 20180220180325.29818-18-peter.maydell@linaro.org
5
bit (ABS) or inverting it (NEG).
8
---
9
include/hw/misc/iotkit-secctl.h | 4 ++++
10
hw/misc/iotkit-secctl.c | 32 ++++++++++++++++++++++++++------
11
2 files changed, 30 insertions(+), 6 deletions(-)
6
12
7
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
13
diff --git a/include/hw/misc/iotkit-secctl.h b/include/hw/misc/iotkit-secctl.h
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Message-id: 20180227143852.11175-22-alex.bennee@linaro.org
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
12
target/arm/translate-a64.c | 16 +++++++++++++++-
13
1 file changed, 15 insertions(+), 1 deletion(-)
14
15
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
16
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
17
--- a/target/arm/translate-a64.c
15
--- a/include/hw/misc/iotkit-secctl.h
18
+++ b/target/arm/translate-a64.c
16
+++ b/include/hw/misc/iotkit-secctl.h
19
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
17
@@ -XXX,XX +XXX,XX @@
20
TCGv_i32 tcg_rmode = NULL;
18
* + sysbus MMIO region 1 is the "non-secure privilege control block" registers
21
TCGv_ptr tcg_fpstatus = NULL;
19
* + named GPIO output "sec_resp_cfg" indicating whether blocked accesses
22
bool need_rmode = false;
20
* should RAZ/WI or bus error
23
+ bool need_fpst = true;
21
+ * + named GPIO output "nsc_cfg" whose value tracks the NSCCFG register value
24
int rmode;
22
* Controlling the 2 APB PPCs in the IoTKit:
25
23
* + named GPIO outputs apb_ppc0_nonsec[0..2] and apb_ppc1_nonsec
26
if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
24
* + named GPIO outputs apb_ppc0_ap[0..2] and apb_ppc1_ap
27
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
25
@@ -XXX,XX +XXX,XX @@ struct IoTKitSecCtl {
28
need_rmode = true;
26
29
rmode = FPROUNDING_ZERO;
27
/*< public >*/
28
qemu_irq sec_resp_cfg;
29
+ qemu_irq nsc_cfg_irq;
30
31
MemoryRegion s_regs;
32
MemoryRegion ns_regs;
33
@@ -XXX,XX +XXX,XX @@ struct IoTKitSecCtl {
34
uint32_t secppcintstat;
35
uint32_t secppcinten;
36
uint32_t secrespcfg;
37
+ uint32_t nsccfg;
38
+ uint32_t brginten;
39
40
IoTKitSecCtlPPC apb[IOTS_NUM_APB_PPC];
41
IoTKitSecCtlPPC apbexp[IOTS_NUM_APB_EXP_PPC];
42
diff --git a/hw/misc/iotkit-secctl.c b/hw/misc/iotkit-secctl.c
43
index XXXXXXX..XXXXXXX 100644
44
--- a/hw/misc/iotkit-secctl.c
45
+++ b/hw/misc/iotkit-secctl.c
46
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
47
case A_SECRESPCFG:
48
r = s->secrespcfg;
30
break;
49
break;
31
+ case 0x2f: /* FABS */
50
+ case A_NSCCFG:
32
+ case 0x6f: /* FNEG */
51
+ r = s->nsccfg;
33
+ need_fpst = false;
34
+ break;
52
+ break;
35
default:
53
case A_SECPPCINTSTAT:
36
fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop);
54
r = s->secppcintstat;
37
g_assert_not_reached();
55
break;
38
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
56
case A_SECPPCINTEN:
39
return;
57
r = s->secppcinten;
58
break;
59
+ case A_BRGINTSTAT:
60
+ /* QEMU's bus fabric can never report errors as it doesn't buffer
61
+ * writes, so we never report bridge interrupts.
62
+ */
63
+ r = 0;
64
+ break;
65
+ case A_BRGINTEN:
66
+ r = s->brginten;
67
+ break;
68
case A_AHBNSPPCEXP0:
69
case A_AHBNSPPCEXP1:
70
case A_AHBNSPPCEXP2:
71
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_read(void *opaque, hwaddr addr,
72
case A_APBSPPPCEXP3:
73
r = s->apbexp[offset_to_ppc_idx(offset)].sp;
74
break;
75
- case A_NSCCFG:
76
case A_SECMPCINTSTATUS:
77
case A_SECMSCINTSTAT:
78
case A_SECMSCINTEN:
79
- case A_BRGINTSTAT:
80
- case A_BRGINTEN:
81
case A_NSMSCEXP:
82
qemu_log_mask(LOG_UNIMP,
83
"IoTKit SecCtl S block read: "
84
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
40
}
85
}
41
86
42
- if (need_rmode) {
87
switch (offset) {
43
+ if (need_rmode || need_fpst) {
88
+ case A_NSCCFG:
44
tcg_fpstatus = get_fpstatus_ptr(true);
89
+ s->nsccfg = value & 3;
90
+ qemu_set_irq(s->nsc_cfg_irq, s->nsccfg);
91
+ break;
92
case A_SECRESPCFG:
93
value &= 1;
94
s->secrespcfg = value;
95
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
96
s->secppcinten = value & 0x00f000f3;
97
foreach_ppc(s, iotkit_secctl_ppc_update_irq_enable);
98
break;
99
+ case A_BRGINTCLR:
100
+ break;
101
+ case A_BRGINTEN:
102
+ s->brginten = value & 0xffff0000;
103
+ break;
104
case A_AHBNSPPCEXP0:
105
case A_AHBNSPPCEXP1:
106
case A_AHBNSPPCEXP2:
107
@@ -XXX,XX +XXX,XX @@ static MemTxResult iotkit_secctl_s_write(void *opaque, hwaddr addr,
108
ppc = &s->apbexp[offset_to_ppc_idx(offset)];
109
iotkit_secctl_ppc_sp_write(ppc, value);
110
break;
111
- case A_NSCCFG:
112
case A_SECMSCINTCLR:
113
case A_SECMSCINTEN:
114
- case A_BRGINTCLR:
115
- case A_BRGINTEN:
116
qemu_log_mask(LOG_UNIMP,
117
"IoTKit SecCtl S block write: "
118
"unimplemented offset 0x%x\n", offset);
119
@@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_reset(DeviceState *dev)
120
s->secppcintstat = 0;
121
s->secppcinten = 0;
122
s->secrespcfg = 0;
123
+ s->nsccfg = 0;
124
+ s->brginten = 0;
125
126
foreach_ppc(s, iotkit_secctl_reset_ppc);
127
}
128
@@ -XXX,XX +XXX,XX @@ static void iotkit_secctl_init(Object *obj)
45
}
129
}
46
130
47
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
131
qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1);
48
case 0x7b: /* FCVTZU */
132
+ qdev_init_gpio_out_named(dev, &s->nsc_cfg_irq, "nsc_cfg", 1);
49
gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus);
133
50
break;
134
memory_region_init_io(&s->s_regs, obj, &iotkit_secctl_s_ops,
51
+ case 0x6f: /* FNEG */
135
s, "iotkit-secctl-s-regs", 0x1000);
52
+ tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
136
@@ -XXX,XX +XXX,XX @@ static const VMStateDescription iotkit_secctl_vmstate = {
53
+ break;
137
VMSTATE_UINT32(secppcintstat, IoTKitSecCtl),
54
default:
138
VMSTATE_UINT32(secppcinten, IoTKitSecCtl),
55
g_assert_not_reached();
139
VMSTATE_UINT32(secrespcfg, IoTKitSecCtl),
56
}
140
+ VMSTATE_UINT32(nsccfg, IoTKitSecCtl),
57
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
141
+ VMSTATE_UINT32(brginten, IoTKitSecCtl),
58
case 0x59: /* FRINTX */
142
VMSTATE_STRUCT_ARRAY(apb, IoTKitSecCtl, IOTS_NUM_APB_PPC, 1,
59
gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, tcg_fpstatus);
143
iotkit_secctl_ppc_vmstate, IoTKitSecCtlPPC),
60
break;
144
VMSTATE_STRUCT_ARRAY(apbexp, IoTKitSecCtl, IOTS_NUM_APB_EXP_PPC, 1,
61
+ case 0x2f: /* FABS */
62
+ tcg_gen_andi_i32(tcg_res, tcg_op, 0x7fff);
63
+ break;
64
+ case 0x6f: /* FNEG */
65
+ tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
66
+ break;
67
default:
68
g_assert_not_reached();
69
}
70
--
145
--
71
2.16.2
146
2.16.2
72
147
73
148
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Model the Arm IoT Kit documented in
2
http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html
2
3
3
This adds the full range of half-precision floating point to integral
4
The Arm IoT Kit is a subsystem which includes a CPU and some devices,
4
instructions.
5
and is intended be extended by adding extra devices to form a
6
complete system. It is used in the MPS2 board's AN505 image for the
7
Cortex-M33.
5
8
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
10
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180227143852.11175-18-alex.bennee@linaro.org
11
Message-id: 20180220180325.29818-19-peter.maydell@linaro.org
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
12
---
11
target/arm/helper-a64.h | 2 +
13
hw/arm/Makefile.objs | 1 +
12
target/arm/helper-a64.c | 22 ++++++++
14
include/hw/arm/iotkit.h | 109 ++++++++
13
target/arm/translate-a64.c | 123 +++++++++++++++++++++++++++++++++++++++++++--
15
hw/arm/iotkit.c | 598 ++++++++++++++++++++++++++++++++++++++++
14
3 files changed, 142 insertions(+), 5 deletions(-)
16
default-configs/arm-softmmu.mak | 1 +
17
4 files changed, 709 insertions(+)
18
create mode 100644 include/hw/arm/iotkit.h
19
create mode 100644 hw/arm/iotkit.c
15
20
16
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
21
diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs
17
index XXXXXXX..XXXXXXX 100644
22
index XXXXXXX..XXXXXXX 100644
18
--- a/target/arm/helper-a64.h
23
--- a/hw/arm/Makefile.objs
19
+++ b/target/arm/helper-a64.h
24
+++ b/hw/arm/Makefile.objs
20
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_maxnum2h, i32, i32, i32, ptr)
25
@@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_FSL_IMX6) += fsl-imx6.o sabrelite.o
21
DEF_HELPER_3(advsimd_minnum2h, i32, i32, i32, ptr)
26
obj-$(CONFIG_ASPEED_SOC) += aspeed_soc.o aspeed.o
22
DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr)
27
obj-$(CONFIG_MPS2) += mps2.o
23
DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr)
28
obj-$(CONFIG_MSF2) += msf2-soc.o msf2-som.o
24
+DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr)
29
+obj-$(CONFIG_IOTKIT) += iotkit.o
25
+DEF_HELPER_2(advsimd_rinth, f16, f16, ptr)
30
diff --git a/include/hw/arm/iotkit.h b/include/hw/arm/iotkit.h
26
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
31
new file mode 100644
27
index XXXXXXX..XXXXXXX 100644
32
index XXXXXXX..XXXXXXX
28
--- a/target/arm/helper-a64.c
33
--- /dev/null
29
+++ b/target/arm/helper-a64.c
34
+++ b/include/hw/arm/iotkit.h
30
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(advsimd_acgt_f16)(float16 a, float16 b, void *fpstp)
35
@@ -XXX,XX +XXX,XX @@
31
int compare = float16_compare(f0, f1, fpst);
36
+/*
32
return ADVSIMD_CMPRES(compare == float_relation_greater);
37
+ * ARM IoT Kit
33
}
38
+ *
34
+
39
+ * Copyright (c) 2018 Linaro Limited
35
+/* round to integral */
40
+ * Written by Peter Maydell
36
+float16 HELPER(advsimd_rinth_exact)(float16 x, void *fp_status)
41
+ *
37
+{
42
+ * This program is free software; you can redistribute it and/or modify
38
+ return float16_round_to_int(x, fp_status);
43
+ * it under the terms of the GNU General Public License version 2 or
39
+}
44
+ * (at your option) any later version.
40
+
45
+ */
41
+float16 HELPER(advsimd_rinth)(float16 x, void *fp_status)
46
+
42
+{
47
+/* This is a model of the Arm IoT Kit which is documented in
43
+ int old_flags = get_float_exception_flags(fp_status), new_flags;
48
+ * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html
44
+ float16 ret;
49
+ * It contains:
45
+
50
+ * a Cortex-M33
46
+ ret = float16_round_to_int(x, fp_status);
51
+ * the IDAU
47
+
52
+ * some timers and watchdogs
48
+ /* Suppress any inexact exceptions the conversion produced */
53
+ * two peripheral protection controllers
49
+ if (!(old_flags & float_flag_inexact)) {
54
+ * a memory protection controller
50
+ new_flags = get_float_exception_flags(fp_status);
55
+ * a security controller
51
+ set_float_exception_flags(new_flags & ~float_flag_inexact, fp_status);
56
+ * a bus fabric which arranges that some parts of the address
52
+ }
57
+ * space are secure and non-secure aliases of each other
53
+
58
+ *
54
+ return ret;
59
+ * QEMU interface:
55
+}
60
+ * + QOM property "memory" is a MemoryRegion containing the devices provided
56
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
61
+ * by the board model.
57
index XXXXXXX..XXXXXXX 100644
62
+ * + QOM property "MAINCLK" is the frequency of the main system clock
58
--- a/target/arm/translate-a64.c
63
+ * + QOM property "EXP_NUMIRQ" sets the number of expansion interrupts
59
+++ b/target/arm/translate-a64.c
64
+ * + Named GPIO inputs "EXP_IRQ" 0..n are the expansion interrupts, which
60
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn)
65
+ * are wired to the NVIC lines 32 .. n+32
61
*/
66
+ * Controlling up to 4 AHB expansion PPBs which a system using the IoTKit
62
static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
67
+ * might provide:
63
{
68
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_nonsec[0..15]
64
- int fpop, opcode, a;
69
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_ap[0..15]
65
+ int fpop, opcode, a, u;
70
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_enable
66
+ int rn, rd;
71
+ * + named GPIO outputs apb_ppcexp{0,1,2,3}_irq_clear
67
+ bool is_q;
72
+ * + named GPIO inputs apb_ppcexp{0,1,2,3}_irq_status
68
+ bool is_scalar;
73
+ * Controlling each of the 4 expansion AHB PPCs which a system using the IoTKit
69
+ bool only_in_vector = false;
74
+ * might provide:
70
+
75
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_nonsec[0..15]
71
+ int pass;
76
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_ap[0..15]
72
+ TCGv_i32 tcg_rmode = NULL;
77
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_enable
73
+ TCGv_ptr tcg_fpstatus = NULL;
78
+ * + named GPIO outputs ahb_ppcexp{0,1,2,3}_irq_clear
74
+ bool need_rmode = false;
79
+ * + named GPIO inputs ahb_ppcexp{0,1,2,3}_irq_status
75
+ int rmode;
80
+ */
76
81
+
77
if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
82
+#ifndef IOTKIT_H
78
unallocated_encoding(s);
83
+#define IOTKIT_H
79
return;
84
+
80
}
85
+#include "hw/sysbus.h"
81
86
+#include "hw/arm/armv7m.h"
82
- if (!fp_access_check(s)) {
87
+#include "hw/misc/iotkit-secctl.h"
83
- return;
88
+#include "hw/misc/tz-ppc.h"
84
- }
89
+#include "hw/timer/cmsdk-apb-timer.h"
85
+ rd = extract32(insn, 0, 5);
90
+#include "hw/misc/unimp.h"
86
+ rn = extract32(insn, 5, 5);
91
+#include "hw/or-irq.h"
87
92
+#include "hw/core/split-irq.h"
88
- opcode = extract32(insn, 12, 4);
93
+
89
a = extract32(insn, 23, 1);
94
+#define TYPE_IOTKIT "iotkit"
90
+ u = extract32(insn, 29, 1);
95
+#define IOTKIT(obj) OBJECT_CHECK(IoTKit, (obj), TYPE_IOTKIT)
91
+ is_scalar = extract32(insn, 28, 1);
96
+
92
+ is_q = extract32(insn, 30, 1);
97
+/* We have an IRQ splitter and an OR gate input for each external PPC
93
+
98
+ * and the 2 internal PPCs
94
+ opcode = extract32(insn, 12, 5);
99
+ */
95
fpop = deposit32(opcode, 5, 1, a);
100
+#define NUM_EXTERNAL_PPCS (IOTS_NUM_AHB_EXP_PPC + IOTS_NUM_APB_EXP_PPC)
96
+ fpop = deposit32(fpop, 6, 1, u);
101
+#define NUM_PPCS (NUM_EXTERNAL_PPCS + 2)
97
102
+
98
switch (fpop) {
103
+typedef struct IoTKit {
99
+ case 0x18: /* FRINTN */
104
+ /*< private >*/
100
+ need_rmode = true;
105
+ SysBusDevice parent_obj;
101
+ only_in_vector = true;
106
+
102
+ rmode = FPROUNDING_TIEEVEN;
107
+ /*< public >*/
103
+ break;
108
+ ARMv7MState armv7m;
104
+ case 0x19: /* FRINTM */
109
+ IoTKitSecCtl secctl;
105
+ need_rmode = true;
110
+ TZPPC apb_ppc0;
106
+ only_in_vector = true;
111
+ TZPPC apb_ppc1;
107
+ rmode = FPROUNDING_NEGINF;
112
+ CMSDKAPBTIMER timer0;
108
+ break;
113
+ CMSDKAPBTIMER timer1;
109
+ case 0x38: /* FRINTP */
114
+ qemu_or_irq ppc_irq_orgate;
110
+ need_rmode = true;
115
+ SplitIRQ sec_resp_splitter;
111
+ only_in_vector = true;
116
+ SplitIRQ ppc_irq_splitter[NUM_PPCS];
112
+ rmode = FPROUNDING_POSINF;
117
+
113
+ break;
118
+ UnimplementedDeviceState dualtimer;
114
+ case 0x39: /* FRINTZ */
119
+ UnimplementedDeviceState s32ktimer;
115
+ need_rmode = true;
120
+
116
+ only_in_vector = true;
121
+ MemoryRegion container;
117
+ rmode = FPROUNDING_ZERO;
122
+ MemoryRegion alias1;
118
+ break;
123
+ MemoryRegion alias2;
119
+ case 0x58: /* FRINTA */
124
+ MemoryRegion alias3;
120
+ need_rmode = true;
125
+ MemoryRegion sram0;
121
+ only_in_vector = true;
126
+
122
+ rmode = FPROUNDING_TIEAWAY;
127
+ qemu_irq *exp_irqs;
123
+ break;
128
+ qemu_irq ppc0_irq;
124
+ case 0x59: /* FRINTX */
129
+ qemu_irq ppc1_irq;
125
+ case 0x79: /* FRINTI */
130
+ qemu_irq sec_resp_cfg;
126
+ only_in_vector = true;
131
+ qemu_irq sec_resp_cfg_in;
127
+ /* current rounding mode */
132
+ qemu_irq nsc_cfg_in;
128
+ break;
133
+
129
default:
134
+ qemu_irq irq_status_in[NUM_EXTERNAL_PPCS];
130
fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop);
135
+
131
g_assert_not_reached();
136
+ uint32_t nsccfg;
132
}
137
+
133
138
+ /* Properties */
134
+
139
+ MemoryRegion *board_memory;
135
+ /* Check additional constraints for the scalar encoding */
140
+ uint32_t exp_numirq;
136
+ if (is_scalar) {
141
+ uint32_t mainclk_frq;
137
+ if (!is_q) {
142
+} IoTKit;
138
+ unallocated_encoding(s);
143
+
144
+#endif
145
diff --git a/hw/arm/iotkit.c b/hw/arm/iotkit.c
146
new file mode 100644
147
index XXXXXXX..XXXXXXX
148
--- /dev/null
149
+++ b/hw/arm/iotkit.c
150
@@ -XXX,XX +XXX,XX @@
151
+/*
152
+ * Arm IoT Kit
153
+ *
154
+ * Copyright (c) 2018 Linaro Limited
155
+ * Written by Peter Maydell
156
+ *
157
+ * This program is free software; you can redistribute it and/or modify
158
+ * it under the terms of the GNU General Public License version 2 or
159
+ * (at your option) any later version.
160
+ */
161
+
162
+#include "qemu/osdep.h"
163
+#include "qemu/log.h"
164
+#include "qapi/error.h"
165
+#include "trace.h"
166
+#include "hw/sysbus.h"
167
+#include "hw/registerfields.h"
168
+#include "hw/arm/iotkit.h"
169
+#include "hw/misc/unimp.h"
170
+#include "hw/arm/arm.h"
171
+
172
+/* Create an alias region of @size bytes starting at @base
173
+ * which mirrors the memory starting at @orig.
174
+ */
175
+static void make_alias(IoTKit *s, MemoryRegion *mr, const char *name,
176
+ hwaddr base, hwaddr size, hwaddr orig)
177
+{
178
+ memory_region_init_alias(mr, NULL, name, &s->container, orig, size);
179
+ /* The alias is even lower priority than unimplemented_device regions */
180
+ memory_region_add_subregion_overlap(&s->container, base, mr, -1500);
181
+}
182
+
183
+static void init_sysbus_child(Object *parent, const char *childname,
184
+ void *child, size_t childsize,
185
+ const char *childtype)
186
+{
187
+ object_initialize(child, childsize, childtype);
188
+ object_property_add_child(parent, childname, OBJECT(child), &error_abort);
189
+ qdev_set_parent_bus(DEVICE(child), sysbus_get_default());
190
+}
191
+
192
+static void irq_status_forwarder(void *opaque, int n, int level)
193
+{
194
+ qemu_irq destirq = opaque;
195
+
196
+ qemu_set_irq(destirq, level);
197
+}
198
+
199
+static void nsccfg_handler(void *opaque, int n, int level)
200
+{
201
+ IoTKit *s = IOTKIT(opaque);
202
+
203
+ s->nsccfg = level;
204
+}
205
+
206
+static void iotkit_forward_ppc(IoTKit *s, const char *ppcname, int ppcnum)
207
+{
208
+ /* Each of the 4 AHB and 4 APB PPCs that might be present in a
209
+ * system using the IoTKit has a collection of control lines which
210
+ * are provided by the security controller and which we want to
211
+ * expose as control lines on the IoTKit device itself, so the
212
+ * code using the IoTKit can wire them up to the PPCs.
213
+ */
214
+ SplitIRQ *splitter = &s->ppc_irq_splitter[ppcnum];
215
+ DeviceState *iotkitdev = DEVICE(s);
216
+ DeviceState *dev_secctl = DEVICE(&s->secctl);
217
+ DeviceState *dev_splitter = DEVICE(splitter);
218
+ char *name;
219
+
220
+ name = g_strdup_printf("%s_nonsec", ppcname);
221
+ qdev_pass_gpios(dev_secctl, iotkitdev, name);
222
+ g_free(name);
223
+ name = g_strdup_printf("%s_ap", ppcname);
224
+ qdev_pass_gpios(dev_secctl, iotkitdev, name);
225
+ g_free(name);
226
+ name = g_strdup_printf("%s_irq_enable", ppcname);
227
+ qdev_pass_gpios(dev_secctl, iotkitdev, name);
228
+ g_free(name);
229
+ name = g_strdup_printf("%s_irq_clear", ppcname);
230
+ qdev_pass_gpios(dev_secctl, iotkitdev, name);
231
+ g_free(name);
232
+
233
+ /* irq_status is a little more tricky, because we need to
234
+ * split it so we can send it both to the security controller
235
+ * and to our OR gate for the NVIC interrupt line.
236
+ * Connect up the splitter's outputs, and create a GPIO input
237
+ * which will pass the line state to the input splitter.
238
+ */
239
+ name = g_strdup_printf("%s_irq_status", ppcname);
240
+ qdev_connect_gpio_out(dev_splitter, 0,
241
+ qdev_get_gpio_in_named(dev_secctl,
242
+ name, 0));
243
+ qdev_connect_gpio_out(dev_splitter, 1,
244
+ qdev_get_gpio_in(DEVICE(&s->ppc_irq_orgate), ppcnum));
245
+ s->irq_status_in[ppcnum] = qdev_get_gpio_in(dev_splitter, 0);
246
+ qdev_init_gpio_in_named_with_opaque(iotkitdev, irq_status_forwarder,
247
+ s->irq_status_in[ppcnum], name, 1);
248
+ g_free(name);
249
+}
250
+
251
+static void iotkit_forward_sec_resp_cfg(IoTKit *s)
252
+{
253
+ /* Forward the 3rd output from the splitter device as a
254
+ * named GPIO output of the iotkit object.
255
+ */
256
+ DeviceState *dev = DEVICE(s);
257
+ DeviceState *dev_splitter = DEVICE(&s->sec_resp_splitter);
258
+
259
+ qdev_init_gpio_out_named(dev, &s->sec_resp_cfg, "sec_resp_cfg", 1);
260
+ s->sec_resp_cfg_in = qemu_allocate_irq(irq_status_forwarder,
261
+ s->sec_resp_cfg, 1);
262
+ qdev_connect_gpio_out(dev_splitter, 2, s->sec_resp_cfg_in);
263
+}
264
+
265
+static void iotkit_init(Object *obj)
266
+{
267
+ IoTKit *s = IOTKIT(obj);
268
+ int i;
269
+
270
+ memory_region_init(&s->container, obj, "iotkit-container", UINT64_MAX);
271
+
272
+ init_sysbus_child(obj, "armv7m", &s->armv7m, sizeof(s->armv7m),
273
+ TYPE_ARMV7M);
274
+ qdev_prop_set_string(DEVICE(&s->armv7m), "cpu-type",
275
+ ARM_CPU_TYPE_NAME("cortex-m33"));
276
+
277
+ init_sysbus_child(obj, "secctl", &s->secctl, sizeof(s->secctl),
278
+ TYPE_IOTKIT_SECCTL);
279
+ init_sysbus_child(obj, "apb-ppc0", &s->apb_ppc0, sizeof(s->apb_ppc0),
280
+ TYPE_TZ_PPC);
281
+ init_sysbus_child(obj, "apb-ppc1", &s->apb_ppc1, sizeof(s->apb_ppc1),
282
+ TYPE_TZ_PPC);
283
+ init_sysbus_child(obj, "timer0", &s->timer0, sizeof(s->timer0),
284
+ TYPE_CMSDK_APB_TIMER);
285
+ init_sysbus_child(obj, "timer1", &s->timer1, sizeof(s->timer1),
286
+ TYPE_CMSDK_APB_TIMER);
287
+ init_sysbus_child(obj, "dualtimer", &s->dualtimer, sizeof(s->dualtimer),
288
+ TYPE_UNIMPLEMENTED_DEVICE);
289
+ object_initialize(&s->ppc_irq_orgate, sizeof(s->ppc_irq_orgate),
290
+ TYPE_OR_IRQ);
291
+ object_property_add_child(obj, "ppc-irq-orgate",
292
+ OBJECT(&s->ppc_irq_orgate), &error_abort);
293
+ object_initialize(&s->sec_resp_splitter, sizeof(s->sec_resp_splitter),
294
+ TYPE_SPLIT_IRQ);
295
+ object_property_add_child(obj, "sec-resp-splitter",
296
+ OBJECT(&s->sec_resp_splitter), &error_abort);
297
+ for (i = 0; i < ARRAY_SIZE(s->ppc_irq_splitter); i++) {
298
+ char *name = g_strdup_printf("ppc-irq-splitter-%d", i);
299
+ SplitIRQ *splitter = &s->ppc_irq_splitter[i];
300
+
301
+ object_initialize(splitter, sizeof(*splitter), TYPE_SPLIT_IRQ);
302
+ object_property_add_child(obj, name, OBJECT(splitter), &error_abort);
303
+ }
304
+ init_sysbus_child(obj, "s32ktimer", &s->s32ktimer, sizeof(s->s32ktimer),
305
+ TYPE_UNIMPLEMENTED_DEVICE);
306
+}
307
+
308
+static void iotkit_exp_irq(void *opaque, int n, int level)
309
+{
310
+ IoTKit *s = IOTKIT(opaque);
311
+
312
+ qemu_set_irq(s->exp_irqs[n], level);
313
+}
314
+
315
+static void iotkit_realize(DeviceState *dev, Error **errp)
316
+{
317
+ IoTKit *s = IOTKIT(dev);
318
+ int i;
319
+ MemoryRegion *mr;
320
+ Error *err = NULL;
321
+ SysBusDevice *sbd_apb_ppc0;
322
+ SysBusDevice *sbd_secctl;
323
+ DeviceState *dev_apb_ppc0;
324
+ DeviceState *dev_apb_ppc1;
325
+ DeviceState *dev_secctl;
326
+ DeviceState *dev_splitter;
327
+
328
+ if (!s->board_memory) {
329
+ error_setg(errp, "memory property was not set");
330
+ return;
331
+ }
332
+
333
+ if (!s->mainclk_frq) {
334
+ error_setg(errp, "MAINCLK property was not set");
335
+ return;
336
+ }
337
+
338
+ /* Handling of which devices should be available only to secure
339
+ * code is usually done differently for M profile than for A profile.
340
+ * Instead of putting some devices only into the secure address space,
341
+ * devices exist in both address spaces but with hard-wired security
342
+ * permissions that will cause the CPU to fault for non-secure accesses.
343
+ *
344
+ * The IoTKit has an IDAU (Implementation Defined Access Unit),
345
+ * which specifies hard-wired security permissions for different
346
+ * areas of the physical address space. For the IoTKit IDAU, the
347
+ * top 4 bits of the physical address are the IDAU region ID, and
348
+ * if bit 28 (ie the lowest bit of the ID) is 0 then this is an NS
349
+ * region, otherwise it is an S region.
350
+ *
351
+ * The various devices and RAMs are generally all mapped twice,
352
+ * once into a region that the IDAU defines as secure and once
353
+ * into a non-secure region. They sit behind either a Memory
354
+ * Protection Controller (for RAM) or a Peripheral Protection
355
+ * Controller (for devices), which allow a more fine grained
356
+ * configuration of whether non-secure accesses are permitted.
357
+ *
358
+ * (The other place that guest software can configure security
359
+ * permissions is in the architected SAU (Security Attribution
360
+ * Unit), which is entirely inside the CPU. The IDAU can upgrade
361
+ * the security attributes for a region to more restrictive than
362
+ * the SAU specifies, but cannot downgrade them.)
363
+ *
364
+ * 0x10000000..0x1fffffff alias of 0x00000000..0x0fffffff
365
+ * 0x20000000..0x2007ffff 32KB FPGA block RAM
366
+ * 0x30000000..0x3fffffff alias of 0x20000000..0x2fffffff
367
+ * 0x40000000..0x4000ffff base peripheral region 1
368
+ * 0x40010000..0x4001ffff CPU peripherals (none for IoTKit)
369
+ * 0x40020000..0x4002ffff system control element peripherals
370
+ * 0x40080000..0x400fffff base peripheral region 2
371
+ * 0x50000000..0x5fffffff alias of 0x40000000..0x4fffffff
372
+ */
373
+
374
+ memory_region_add_subregion_overlap(&s->container, 0, s->board_memory, -1);
375
+
376
+ qdev_prop_set_uint32(DEVICE(&s->armv7m), "num-irq", s->exp_numirq + 32);
377
+ /* In real hardware the initial Secure VTOR is set from the INITSVTOR0
378
+ * register in the IoT Kit System Control Register block, and the
379
+ * initial value of that is in turn specifiable by the FPGA that
380
+ * instantiates the IoT Kit. In QEMU we don't implement this wrinkle,
381
+ * and simply set the CPU's init-svtor to the IoT Kit default value.
382
+ */
383
+ qdev_prop_set_uint32(DEVICE(&s->armv7m), "init-svtor", 0x10000000);
384
+ object_property_set_link(OBJECT(&s->armv7m), OBJECT(&s->container),
385
+ "memory", &err);
386
+ if (err) {
387
+ error_propagate(errp, err);
388
+ return;
389
+ }
390
+ object_property_set_link(OBJECT(&s->armv7m), OBJECT(s), "idau", &err);
391
+ if (err) {
392
+ error_propagate(errp, err);
393
+ return;
394
+ }
395
+ object_property_set_bool(OBJECT(&s->armv7m), true, "realized", &err);
396
+ if (err) {
397
+ error_propagate(errp, err);
398
+ return;
399
+ }
400
+
401
+ /* Connect our EXP_IRQ GPIOs to the NVIC's lines 32 and up. */
402
+ s->exp_irqs = g_new(qemu_irq, s->exp_numirq);
403
+ for (i = 0; i < s->exp_numirq; i++) {
404
+ s->exp_irqs[i] = qdev_get_gpio_in(DEVICE(&s->armv7m), i + 32);
405
+ }
406
+ qdev_init_gpio_in_named(dev, iotkit_exp_irq, "EXP_IRQ", s->exp_numirq);
407
+
408
+ /* Set up the big aliases first */
409
+ make_alias(s, &s->alias1, "alias 1", 0x10000000, 0x10000000, 0x00000000);
410
+ make_alias(s, &s->alias2, "alias 2", 0x30000000, 0x10000000, 0x20000000);
411
+ /* The 0x50000000..0x5fffffff region is not a pure alias: it has
412
+ * a few extra devices that only appear there (generally the
413
+ * control interfaces for the protection controllers).
414
+ * We implement this by mapping those devices over the top of this
415
+ * alias MR at a higher priority.
416
+ */
417
+ make_alias(s, &s->alias3, "alias 3", 0x50000000, 0x10000000, 0x40000000);
418
+
419
+ /* This RAM should be behind a Memory Protection Controller, but we
420
+ * don't implement that yet.
421
+ */
422
+ memory_region_init_ram(&s->sram0, NULL, "iotkit.sram0", 0x00008000, &err);
423
+ if (err) {
424
+ error_propagate(errp, err);
425
+ return;
426
+ }
427
+ memory_region_add_subregion(&s->container, 0x20000000, &s->sram0);
428
+
429
+ /* Security controller */
430
+ object_property_set_bool(OBJECT(&s->secctl), true, "realized", &err);
431
+ if (err) {
432
+ error_propagate(errp, err);
433
+ return;
434
+ }
435
+ sbd_secctl = SYS_BUS_DEVICE(&s->secctl);
436
+ dev_secctl = DEVICE(&s->secctl);
437
+ sysbus_mmio_map(sbd_secctl, 0, 0x50080000);
438
+ sysbus_mmio_map(sbd_secctl, 1, 0x40080000);
439
+
440
+ s->nsc_cfg_in = qemu_allocate_irq(nsccfg_handler, s, 1);
441
+ qdev_connect_gpio_out_named(dev_secctl, "nsc_cfg", 0, s->nsc_cfg_in);
442
+
443
+ /* The sec_resp_cfg output from the security controller must be split into
444
+ * multiple lines, one for each of the PPCs within the IoTKit and one
445
+ * that will be an output from the IoTKit to the system.
446
+ */
447
+ object_property_set_int(OBJECT(&s->sec_resp_splitter), 3,
448
+ "num-lines", &err);
449
+ if (err) {
450
+ error_propagate(errp, err);
451
+ return;
452
+ }
453
+ object_property_set_bool(OBJECT(&s->sec_resp_splitter), true,
454
+ "realized", &err);
455
+ if (err) {
456
+ error_propagate(errp, err);
457
+ return;
458
+ }
459
+ dev_splitter = DEVICE(&s->sec_resp_splitter);
460
+ qdev_connect_gpio_out_named(dev_secctl, "sec_resp_cfg", 0,
461
+ qdev_get_gpio_in(dev_splitter, 0));
462
+
463
+ /* Devices behind APB PPC0:
464
+ * 0x40000000: timer0
465
+ * 0x40001000: timer1
466
+ * 0x40002000: dual timer
467
+ * We must configure and realize each downstream device and connect
468
+ * it to the appropriate PPC port; then we can realize the PPC and
469
+ * map its upstream ends to the right place in the container.
470
+ */
471
+ qdev_prop_set_uint32(DEVICE(&s->timer0), "pclk-frq", s->mainclk_frq);
472
+ object_property_set_bool(OBJECT(&s->timer0), true, "realized", &err);
473
+ if (err) {
474
+ error_propagate(errp, err);
475
+ return;
476
+ }
477
+ sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer0), 0,
478
+ qdev_get_gpio_in(DEVICE(&s->armv7m), 3));
479
+ mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->timer0), 0);
480
+ object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[0]", &err);
481
+ if (err) {
482
+ error_propagate(errp, err);
483
+ return;
484
+ }
485
+
486
+ qdev_prop_set_uint32(DEVICE(&s->timer1), "pclk-frq", s->mainclk_frq);
487
+ object_property_set_bool(OBJECT(&s->timer1), true, "realized", &err);
488
+ if (err) {
489
+ error_propagate(errp, err);
490
+ return;
491
+ }
492
+ sysbus_connect_irq(SYS_BUS_DEVICE(&s->timer1), 0,
493
+ qdev_get_gpio_in(DEVICE(&s->armv7m), 3));
494
+ mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->timer1), 0);
495
+ object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[1]", &err);
496
+ if (err) {
497
+ error_propagate(errp, err);
498
+ return;
499
+ }
500
+
501
+ qdev_prop_set_string(DEVICE(&s->dualtimer), "name", "Dual timer");
502
+ qdev_prop_set_uint64(DEVICE(&s->dualtimer), "size", 0x1000);
503
+ object_property_set_bool(OBJECT(&s->dualtimer), true, "realized", &err);
504
+ if (err) {
505
+ error_propagate(errp, err);
506
+ return;
507
+ }
508
+ mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->dualtimer), 0);
509
+ object_property_set_link(OBJECT(&s->apb_ppc0), OBJECT(mr), "port[2]", &err);
510
+ if (err) {
511
+ error_propagate(errp, err);
512
+ return;
513
+ }
514
+
515
+ object_property_set_bool(OBJECT(&s->apb_ppc0), true, "realized", &err);
516
+ if (err) {
517
+ error_propagate(errp, err);
518
+ return;
519
+ }
520
+
521
+ sbd_apb_ppc0 = SYS_BUS_DEVICE(&s->apb_ppc0);
522
+ dev_apb_ppc0 = DEVICE(&s->apb_ppc0);
523
+
524
+ mr = sysbus_mmio_get_region(sbd_apb_ppc0, 0);
525
+ memory_region_add_subregion(&s->container, 0x40000000, mr);
526
+ mr = sysbus_mmio_get_region(sbd_apb_ppc0, 1);
527
+ memory_region_add_subregion(&s->container, 0x40001000, mr);
528
+ mr = sysbus_mmio_get_region(sbd_apb_ppc0, 2);
529
+ memory_region_add_subregion(&s->container, 0x40002000, mr);
530
+ for (i = 0; i < IOTS_APB_PPC0_NUM_PORTS; i++) {
531
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_nonsec", i,
532
+ qdev_get_gpio_in_named(dev_apb_ppc0,
533
+ "cfg_nonsec", i));
534
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_ap", i,
535
+ qdev_get_gpio_in_named(dev_apb_ppc0,
536
+ "cfg_ap", i));
537
+ }
538
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_irq_enable", 0,
539
+ qdev_get_gpio_in_named(dev_apb_ppc0,
540
+ "irq_enable", 0));
541
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc0_irq_clear", 0,
542
+ qdev_get_gpio_in_named(dev_apb_ppc0,
543
+ "irq_clear", 0));
544
+ qdev_connect_gpio_out(dev_splitter, 0,
545
+ qdev_get_gpio_in_named(dev_apb_ppc0,
546
+ "cfg_sec_resp", 0));
547
+
548
+ /* All the PPC irq lines (from the 2 internal PPCs and the 8 external
549
+ * ones) are sent individually to the security controller, and also
550
+ * ORed together to give a single combined PPC interrupt to the NVIC.
551
+ */
552
+ object_property_set_int(OBJECT(&s->ppc_irq_orgate),
553
+ NUM_PPCS, "num-lines", &err);
554
+ if (err) {
555
+ error_propagate(errp, err);
556
+ return;
557
+ }
558
+ object_property_set_bool(OBJECT(&s->ppc_irq_orgate), true,
559
+ "realized", &err);
560
+ if (err) {
561
+ error_propagate(errp, err);
562
+ return;
563
+ }
564
+ qdev_connect_gpio_out(DEVICE(&s->ppc_irq_orgate), 0,
565
+ qdev_get_gpio_in(DEVICE(&s->armv7m), 10));
566
+
567
+ /* 0x40010000 .. 0x4001ffff: private CPU region: unused in IoTKit */
568
+
569
+ /* 0x40020000 .. 0x4002ffff : IoTKit system control peripheral region */
570
+ /* Devices behind APB PPC1:
571
+ * 0x4002f000: S32K timer
572
+ */
573
+ qdev_prop_set_string(DEVICE(&s->s32ktimer), "name", "S32KTIMER");
574
+ qdev_prop_set_uint64(DEVICE(&s->s32ktimer), "size", 0x1000);
575
+ object_property_set_bool(OBJECT(&s->s32ktimer), true, "realized", &err);
576
+ if (err) {
577
+ error_propagate(errp, err);
578
+ return;
579
+ }
580
+ mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->s32ktimer), 0);
581
+ object_property_set_link(OBJECT(&s->apb_ppc1), OBJECT(mr), "port[0]", &err);
582
+ if (err) {
583
+ error_propagate(errp, err);
584
+ return;
585
+ }
586
+
587
+ object_property_set_bool(OBJECT(&s->apb_ppc1), true, "realized", &err);
588
+ if (err) {
589
+ error_propagate(errp, err);
590
+ return;
591
+ }
592
+ mr = sysbus_mmio_get_region(SYS_BUS_DEVICE(&s->apb_ppc1), 0);
593
+ memory_region_add_subregion(&s->container, 0x4002f000, mr);
594
+
595
+ dev_apb_ppc1 = DEVICE(&s->apb_ppc1);
596
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_nonsec", 0,
597
+ qdev_get_gpio_in_named(dev_apb_ppc1,
598
+ "cfg_nonsec", 0));
599
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_ap", 0,
600
+ qdev_get_gpio_in_named(dev_apb_ppc1,
601
+ "cfg_ap", 0));
602
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_irq_enable", 0,
603
+ qdev_get_gpio_in_named(dev_apb_ppc1,
604
+ "irq_enable", 0));
605
+ qdev_connect_gpio_out_named(dev_secctl, "apb_ppc1_irq_clear", 0,
606
+ qdev_get_gpio_in_named(dev_apb_ppc1,
607
+ "irq_clear", 0));
608
+ qdev_connect_gpio_out(dev_splitter, 1,
609
+ qdev_get_gpio_in_named(dev_apb_ppc1,
610
+ "cfg_sec_resp", 0));
611
+
612
+ /* Using create_unimplemented_device() maps the stub into the
613
+ * system address space rather than into our container, but the
614
+ * overall effect to the guest is the same.
615
+ */
616
+ create_unimplemented_device("SYSINFO", 0x40020000, 0x1000);
617
+
618
+ create_unimplemented_device("SYSCONTROL", 0x50021000, 0x1000);
619
+ create_unimplemented_device("S32KWATCHDOG", 0x5002e000, 0x1000);
620
+
621
+ /* 0x40080000 .. 0x4008ffff : IoTKit second Base peripheral region */
622
+
623
+ create_unimplemented_device("NS watchdog", 0x40081000, 0x1000);
624
+ create_unimplemented_device("S watchdog", 0x50081000, 0x1000);
625
+
626
+ create_unimplemented_device("SRAM0 MPC", 0x50083000, 0x1000);
627
+
628
+ for (i = 0; i < ARRAY_SIZE(s->ppc_irq_splitter); i++) {
629
+ Object *splitter = OBJECT(&s->ppc_irq_splitter[i]);
630
+
631
+ object_property_set_int(splitter, 2, "num-lines", &err);
632
+ if (err) {
633
+ error_propagate(errp, err);
139
+ return;
634
+ return;
140
+ }
635
+ }
141
+ /* FRINTxx is only in the vector form */
636
+ object_property_set_bool(splitter, true, "realized", &err);
142
+ if (only_in_vector) {
637
+ if (err) {
143
+ unallocated_encoding(s);
638
+ error_propagate(errp, err);
144
+ return;
639
+ return;
145
+ }
640
+ }
146
+ }
641
+ }
147
+
642
+
148
+ if (!fp_access_check(s)) {
643
+ for (i = 0; i < IOTS_NUM_AHB_EXP_PPC; i++) {
149
+ return;
644
+ char *ppcname = g_strdup_printf("ahb_ppcexp%d", i);
150
+ }
645
+
151
+
646
+ iotkit_forward_ppc(s, ppcname, i);
152
+ if (need_rmode) {
647
+ g_free(ppcname);
153
+ tcg_fpstatus = get_fpstatus_ptr(true);
648
+ }
154
+ }
649
+
155
+
650
+ for (i = 0; i < IOTS_NUM_APB_EXP_PPC; i++) {
156
+ if (need_rmode) {
651
+ char *ppcname = g_strdup_printf("apb_ppcexp%d", i);
157
+ tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode));
652
+
158
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
653
+ iotkit_forward_ppc(s, ppcname, i + IOTS_NUM_AHB_EXP_PPC);
159
+ }
654
+ g_free(ppcname);
160
+
655
+ }
161
+ if (is_scalar) {
656
+
162
+ /* no operations yet */
657
+ for (i = NUM_EXTERNAL_PPCS; i < NUM_PPCS; i++) {
163
+ } else {
658
+ /* Wire up IRQ splitter for internal PPCs */
164
+ for (pass = 0; pass < (is_q ? 8 : 4); pass++) {
659
+ DeviceState *devs = DEVICE(&s->ppc_irq_splitter[i]);
165
+ TCGv_i32 tcg_op = tcg_temp_new_i32();
660
+ char *gpioname = g_strdup_printf("apb_ppc%d_irq_status",
166
+ TCGv_i32 tcg_res = tcg_temp_new_i32();
661
+ i - NUM_EXTERNAL_PPCS);
167
+
662
+ TZPPC *ppc = (i == NUM_EXTERNAL_PPCS) ? &s->apb_ppc0 : &s->apb_ppc1;
168
+ read_vec_element_i32(s, tcg_op, rn, pass, MO_16);
663
+
169
+
664
+ qdev_connect_gpio_out(devs, 0,
170
+ switch (fpop) {
665
+ qdev_get_gpio_in_named(dev_secctl, gpioname, 0));
171
+ case 0x18: /* FRINTN */
666
+ qdev_connect_gpio_out(devs, 1,
172
+ case 0x19: /* FRINTM */
667
+ qdev_get_gpio_in(DEVICE(&s->ppc_irq_orgate), i));
173
+ case 0x38: /* FRINTP */
668
+ qdev_connect_gpio_out_named(DEVICE(ppc), "irq", 0,
174
+ case 0x39: /* FRINTZ */
669
+ qdev_get_gpio_in(devs, 0));
175
+ case 0x58: /* FRINTA */
670
+ }
176
+ case 0x79: /* FRINTI */
671
+
177
+ gen_helper_advsimd_rinth(tcg_res, tcg_op, tcg_fpstatus);
672
+ iotkit_forward_sec_resp_cfg(s);
178
+ break;
673
+
179
+ case 0x59: /* FRINTX */
674
+ system_clock_scale = NANOSECONDS_PER_SECOND / s->mainclk_frq;
180
+ gen_helper_advsimd_rinth_exact(tcg_res, tcg_op, tcg_fpstatus);
675
+}
181
+ break;
676
+
182
+ default:
677
+static void iotkit_idau_check(IDAUInterface *ii, uint32_t address,
183
+ g_assert_not_reached();
678
+ int *iregion, bool *exempt, bool *ns, bool *nsc)
184
+ }
679
+{
185
+
680
+ /* For IoTKit systems the IDAU responses are simple logical functions
186
+ write_vec_element_i32(s, tcg_res, rd, pass, MO_16);
681
+ * of the address bits. The NSC attribute is guest-adjustable via the
187
+
682
+ * NSCCFG register in the security controller.
188
+ tcg_temp_free_i32(tcg_res);
683
+ */
189
+ tcg_temp_free_i32(tcg_op);
684
+ IoTKit *s = IOTKIT(ii);
190
+ }
685
+ int region = extract32(address, 28, 4);
191
+
686
+
192
+ clear_vec_high(s, is_q, rd);
687
+ *ns = !(region & 1);
193
+ }
688
+ *nsc = (region == 1 && (s->nsccfg & 1)) || (region == 3 && (s->nsccfg & 2));
194
+
689
+ /* 0xe0000000..0xe00fffff and 0xf0000000..0xf00fffff are exempt */
195
+ if (tcg_rmode) {
690
+ *exempt = (address & 0xeff00000) == 0xe0000000;
196
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
691
+ *iregion = region;
197
+ tcg_temp_free_i32(tcg_rmode);
692
+}
198
+ }
693
+
199
+
694
+static const VMStateDescription iotkit_vmstate = {
200
+ if (tcg_fpstatus) {
695
+ .name = "iotkit",
201
+ tcg_temp_free_ptr(tcg_fpstatus);
696
+ .version_id = 1,
202
+ }
697
+ .minimum_version_id = 1,
203
}
698
+ .fields = (VMStateField[]) {
204
699
+ VMSTATE_UINT32(nsccfg, IoTKit),
205
/* AdvSIMD scalar x indexed element
700
+ VMSTATE_END_OF_LIST()
701
+ }
702
+};
703
+
704
+static Property iotkit_properties[] = {
705
+ DEFINE_PROP_LINK("memory", IoTKit, board_memory, TYPE_MEMORY_REGION,
706
+ MemoryRegion *),
707
+ DEFINE_PROP_UINT32("EXP_NUMIRQ", IoTKit, exp_numirq, 64),
708
+ DEFINE_PROP_UINT32("MAINCLK", IoTKit, mainclk_frq, 0),
709
+ DEFINE_PROP_END_OF_LIST()
710
+};
711
+
712
+static void iotkit_reset(DeviceState *dev)
713
+{
714
+ IoTKit *s = IOTKIT(dev);
715
+
716
+ s->nsccfg = 0;
717
+}
718
+
719
+static void iotkit_class_init(ObjectClass *klass, void *data)
720
+{
721
+ DeviceClass *dc = DEVICE_CLASS(klass);
722
+ IDAUInterfaceClass *iic = IDAU_INTERFACE_CLASS(klass);
723
+
724
+ dc->realize = iotkit_realize;
725
+ dc->vmsd = &iotkit_vmstate;
726
+ dc->props = iotkit_properties;
727
+ dc->reset = iotkit_reset;
728
+ iic->check = iotkit_idau_check;
729
+}
730
+
731
+static const TypeInfo iotkit_info = {
732
+ .name = TYPE_IOTKIT,
733
+ .parent = TYPE_SYS_BUS_DEVICE,
734
+ .instance_size = sizeof(IoTKit),
735
+ .instance_init = iotkit_init,
736
+ .class_init = iotkit_class_init,
737
+ .interfaces = (InterfaceInfo[]) {
738
+ { TYPE_IDAU_INTERFACE },
739
+ { }
740
+ }
741
+};
742
+
743
+static void iotkit_register_types(void)
744
+{
745
+ type_register_static(&iotkit_info);
746
+}
747
+
748
+type_init(iotkit_register_types);
749
diff --git a/default-configs/arm-softmmu.mak b/default-configs/arm-softmmu.mak
750
index XXXXXXX..XXXXXXX 100644
751
--- a/default-configs/arm-softmmu.mak
752
+++ b/default-configs/arm-softmmu.mak
753
@@ -XXX,XX +XXX,XX @@ CONFIG_MPS2_FPGAIO=y
754
CONFIG_MPS2_SCC=y
755
756
CONFIG_TZ_PPC=y
757
+CONFIG_IOTKIT=y
758
CONFIG_IOTKIT_SECCTL=y
759
760
CONFIG_VERSATILE_PCI=y
206
--
761
--
207
2.16.2
762
2.16.2
208
763
209
764
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
Define a new board model for the MPS2 with an AN505 FPGA image
2
containing a Cortex-M33. Since the FPGA images for TrustZone
3
cores (AN505, and the similar AN519 for Cortex-M23) have a
4
significantly different layout of devices to the non-TrustZone
5
images, we use a new source file rather than shoehorning them
6
into the existing mps2.c.
2
7
3
It looks like the ARM ARM has simplified the pseudo code for the
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
4
calculation which is done on a fixed point 9 bit integer maths. So
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
5
while adding f16 we can also clean this up to be a little less heavy
10
Message-id: 20180220180325.29818-20-peter.maydell@linaro.org
6
on the floating point and just return the fractional part and leave
11
---
7
the calle's to do the final packing of the result.
12
hw/arm/Makefile.objs | 1 +
13
hw/arm/mps2-tz.c | 503 +++++++++++++++++++++++++++++++++++++++++++++++++++
14
2 files changed, 504 insertions(+)
15
create mode 100644 hw/arm/mps2-tz.c
8
16
9
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
17
diff --git a/hw/arm/Makefile.objs b/hw/arm/Makefile.objs
10
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
11
Message-id: 20180227143852.11175-23-alex.bennee@linaro.org
12
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
13
---
14
target/arm/helper.h | 1 +
15
target/arm/helper.c | 226 +++++++++++++++++++++++++++++-----------------------
16
2 files changed, 129 insertions(+), 98 deletions(-)
17
18
diff --git a/target/arm/helper.h b/target/arm/helper.h
19
index XXXXXXX..XXXXXXX 100644
18
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/helper.h
19
--- a/hw/arm/Makefile.objs
21
+++ b/target/arm/helper.h
20
+++ b/hw/arm/Makefile.objs
22
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(vfp_muladds, f32, f32, f32, f32, ptr)
21
@@ -XXX,XX +XXX,XX @@ obj-$(CONFIG_FSL_IMX31) += fsl-imx31.o kzm.o
23
22
obj-$(CONFIG_FSL_IMX6) += fsl-imx6.o sabrelite.o
24
DEF_HELPER_3(recps_f32, f32, f32, f32, env)
23
obj-$(CONFIG_ASPEED_SOC) += aspeed_soc.o aspeed.o
25
DEF_HELPER_3(rsqrts_f32, f32, f32, f32, env)
24
obj-$(CONFIG_MPS2) += mps2.o
26
+DEF_HELPER_FLAGS_2(recpe_f16, TCG_CALL_NO_RWG, f16, f16, ptr)
25
+obj-$(CONFIG_MPS2) += mps2-tz.o
27
DEF_HELPER_FLAGS_2(recpe_f32, TCG_CALL_NO_RWG, f32, f32, ptr)
26
obj-$(CONFIG_MSF2) += msf2-soc.o msf2-som.o
28
DEF_HELPER_FLAGS_2(recpe_f64, TCG_CALL_NO_RWG, f64, f64, ptr)
27
obj-$(CONFIG_IOTKIT) += iotkit.o
29
DEF_HELPER_FLAGS_2(rsqrte_f32, TCG_CALL_NO_RWG, f32, f32, ptr)
28
diff --git a/hw/arm/mps2-tz.c b/hw/arm/mps2-tz.c
30
diff --git a/target/arm/helper.c b/target/arm/helper.c
29
new file mode 100644
31
index XXXXXXX..XXXXXXX 100644
30
index XXXXXXX..XXXXXXX
32
--- a/target/arm/helper.c
31
--- /dev/null
33
+++ b/target/arm/helper.c
32
+++ b/hw/arm/mps2-tz.c
34
@@ -XXX,XX +XXX,XX @@ float32 HELPER(rsqrts_f32)(float32 a, float32 b, CPUARMState *env)
33
@@ -XXX,XX +XXX,XX @@
35
* int->float conversions at run-time. */
34
+/*
36
#define float64_256 make_float64(0x4070000000000000LL)
35
+ * ARM V2M MPS2 board emulation, trustzone aware FPGA images
37
#define float64_512 make_float64(0x4080000000000000LL)
38
+#define float16_maxnorm make_float16(0x7bff)
39
#define float32_maxnorm make_float32(0x7f7fffff)
40
#define float64_maxnorm make_float64(0x7fefffffffffffffLL)
41
42
/* Reciprocal functions
43
*
44
* The algorithm that must be used to calculate the estimate
45
- * is specified by the ARM ARM, see FPRecipEstimate()
46
+ * is specified by the ARM ARM, see FPRecipEstimate()/RecipEstimate
47
*/
48
49
-static float64 recip_estimate(float64 a, float_status *real_fp_status)
50
+/* See RecipEstimate()
51
+ *
36
+ *
52
+ * input is a 9 bit fixed point number
37
+ * Copyright (c) 2017 Linaro Limited
53
+ * input range 256 .. 511 for a number from 0.5 <= x < 1.0.
38
+ * Written by Peter Maydell
54
+ * result range 256 .. 511 for a number from 1.0 to 511/256.
39
+ *
40
+ * This program is free software; you can redistribute it and/or modify
41
+ * it under the terms of the GNU General Public License version 2 or
42
+ * (at your option) any later version.
55
+ */
43
+ */
56
+
44
+
57
+static int recip_estimate(int input)
45
+/* The MPS2 and MPS2+ dev boards are FPGA based (the 2+ has a bigger
58
{
46
+ * FPGA but is otherwise the same as the 2). Since the CPU itself
59
- /* These calculations mustn't set any fp exception flags,
47
+ * and most of the devices are in the FPGA, the details of the board
60
- * so we use a local copy of the fp_status.
48
+ * as seen by the guest depend significantly on the FPGA image.
61
- */
49
+ * This source file covers the following FPGA images, for TrustZone cores:
62
- float_status dummy_status = *real_fp_status;
50
+ * "mps2-an505" -- Cortex-M33 as documented in ARM Application Note AN505
63
- float_status *s = &dummy_status;
64
- /* q = (int)(a * 512.0) */
65
- float64 q = float64_mul(float64_512, a, s);
66
- int64_t q_int = float64_to_int64_round_to_zero(q, s);
67
-
68
- /* r = 1.0 / (((double)q + 0.5) / 512.0) */
69
- q = int64_to_float64(q_int, s);
70
- q = float64_add(q, float64_half, s);
71
- q = float64_div(q, float64_512, s);
72
- q = float64_div(float64_one, q, s);
73
-
74
- /* s = (int)(256.0 * r + 0.5) */
75
- q = float64_mul(q, float64_256, s);
76
- q = float64_add(q, float64_half, s);
77
- q_int = float64_to_int64_round_to_zero(q, s);
78
-
79
- /* return (double)s / 256.0 */
80
- return float64_div(int64_to_float64(q_int, s), float64_256, s);
81
+ int a, b, r;
82
+ assert(256 <= input && input < 512);
83
+ a = (input * 2) + 1;
84
+ b = (1 << 19) / a;
85
+ r = (b + 1) >> 1;
86
+ assert(256 <= r && r < 512);
87
+ return r;
88
}
89
90
-/* Common wrapper to call recip_estimate */
91
-static float64 call_recip_estimate(float64 num, int off, float_status *fpst)
92
-{
93
- uint64_t val64 = float64_val(num);
94
- uint64_t frac = extract64(val64, 0, 52);
95
- int64_t exp = extract64(val64, 52, 11);
96
- uint64_t sbit;
97
- float64 scaled, estimate;
98
+/*
99
+ * Common wrapper to call recip_estimate
100
+ *
51
+ *
101
+ * The parameters are exponent and 64 bit fraction (without implicit
52
+ * Links to the TRM for the board itself and to the various Application
102
+ * bit) where the binary point is nominally at bit 52. Returns a
53
+ * Notes which document the FPGA images can be found here:
103
+ * float64 which can then be rounded to the appropriate size by the
54
+ * https://developer.arm.com/products/system-design/development-boards/fpga-prototyping-boards/mps2
104
+ * callee.
55
+ *
56
+ * Board TRM:
57
+ * http://infocenter.arm.com/help/topic/com.arm.doc.100112_0200_06_en/versatile_express_cortex_m_prototyping_systems_v2m_mps2_and_v2m_mps2plus_technical_reference_100112_0200_06_en.pdf
58
+ * Application Note AN505:
59
+ * http://infocenter.arm.com/help/topic/com.arm.doc.dai0505b/index.html
60
+ *
61
+ * The AN505 defers to the Cortex-M33 processor ARMv8M IoT Kit FVP User Guide
62
+ * (ARM ECM0601256) for the details of some of the device layout:
63
+ * http://infocenter.arm.com/help/index.jsp?topic=/com.arm.doc.ecm0601256/index.html
105
+ */
64
+ */
106
65
+
107
- /* Generate the scaled number for the estimate function */
66
+#include "qemu/osdep.h"
108
- if (exp == 0) {
67
+#include "qapi/error.h"
109
+static uint64_t call_recip_estimate(int *exp, int exp_off, uint64_t frac)
68
+#include "qemu/error-report.h"
110
+{
69
+#include "hw/arm/arm.h"
111
+ uint32_t scaled, estimate;
70
+#include "hw/arm/armv7m.h"
112
+ uint64_t result_frac;
71
+#include "hw/or-irq.h"
113
+ int result_exp;
72
+#include "hw/boards.h"
114
+
73
+#include "exec/address-spaces.h"
115
+ /* Handle sub-normals */
74
+#include "sysemu/sysemu.h"
116
+ if (*exp == 0) {
75
+#include "hw/misc/unimp.h"
117
if (extract64(frac, 51, 1) == 0) {
76
+#include "hw/char/cmsdk-apb-uart.h"
118
- exp = -1;
77
+#include "hw/timer/cmsdk-apb-timer.h"
119
- frac = extract64(frac, 0, 50) << 2;
78
+#include "hw/misc/mps2-scc.h"
120
+ *exp = -1;
79
+#include "hw/misc/mps2-fpgaio.h"
121
+ frac <<= 2;
80
+#include "hw/arm/iotkit.h"
122
} else {
81
+#include "hw/devices.h"
123
- frac = extract64(frac, 0, 51) << 1;
82
+#include "net/net.h"
124
+ frac <<= 1;
83
+#include "hw/core/split-irq.h"
125
}
84
+
126
}
85
+typedef enum MPS2TZFPGAType {
127
86
+ FPGA_AN505,
128
- /* scaled = '0' : '01111111110' : fraction<51:44> : Zeros(44); */
87
+} MPS2TZFPGAType;
129
- scaled = make_float64((0x3feULL << 52)
88
+
130
- | extract64(frac, 44, 8) << 44);
89
+typedef struct {
131
+ /* scaled = UInt('1':fraction<51:44>) */
90
+ MachineClass parent;
132
+ scaled = deposit32(1 << 8, 0, 8, extract64(frac, 44, 8));
91
+ MPS2TZFPGAType fpga_type;
133
+ estimate = recip_estimate(scaled);
92
+ uint32_t scc_id;
134
93
+} MPS2TZMachineClass;
135
- estimate = recip_estimate(scaled, fpst);
94
+
136
-
95
+typedef struct {
137
- /* Build new result */
96
+ MachineState parent;
138
- val64 = float64_val(estimate);
97
+
139
- sbit = 0x8000000000000000ULL & val64;
98
+ IoTKit iotkit;
140
- exp = off - exp;
99
+ MemoryRegion psram;
141
- frac = extract64(val64, 0, 52);
100
+ MemoryRegion ssram1;
142
-
101
+ MemoryRegion ssram1_m;
143
- if (exp == 0) {
102
+ MemoryRegion ssram23;
144
- frac = 1ULL << 51 | extract64(frac, 1, 51);
103
+ MPS2SCC scc;
145
- } else if (exp == -1) {
104
+ MPS2FPGAIO fpgaio;
146
- frac = 1ULL << 50 | extract64(frac, 2, 50);
105
+ TZPPC ppc[5];
147
- exp = 0;
106
+ UnimplementedDeviceState ssram_mpc[3];
148
+ result_exp = exp_off - *exp;
107
+ UnimplementedDeviceState spi[5];
149
+ result_frac = deposit64(0, 44, 8, estimate);
108
+ UnimplementedDeviceState i2c[4];
150
+ if (result_exp == 0) {
109
+ UnimplementedDeviceState i2s_audio;
151
+ result_frac = deposit64(result_frac >> 1, 51, 1, 1);
110
+ UnimplementedDeviceState gpio[5];
152
+ } else if (result_exp == -1) {
111
+ UnimplementedDeviceState dma[4];
153
+ result_frac = deposit64(result_frac >> 2, 50, 2, 1);
112
+ UnimplementedDeviceState gfx;
154
+ result_exp = 0;
113
+ CMSDKAPBUART uart[5];
155
}
114
+ SplitIRQ sec_resp_splitter;
156
115
+ qemu_or_irq uart_irq_orgate;
157
- return make_float64(sbit | (exp << 52) | frac);
116
+} MPS2TZMachineState;
158
+ *exp = result_exp;
117
+
159
+
118
+#define TYPE_MPS2TZ_MACHINE "mps2tz"
160
+ return result_frac;
119
+#define TYPE_MPS2TZ_AN505_MACHINE MACHINE_TYPE_NAME("mps2-an505")
161
}
120
+
162
121
+#define MPS2TZ_MACHINE(obj) \
163
static bool round_to_inf(float_status *fpst, bool sign_bit)
122
+ OBJECT_CHECK(MPS2TZMachineState, obj, TYPE_MPS2TZ_MACHINE)
164
@@ -XXX,XX +XXX,XX @@ static bool round_to_inf(float_status *fpst, bool sign_bit)
123
+#define MPS2TZ_MACHINE_GET_CLASS(obj) \
165
g_assert_not_reached();
124
+ OBJECT_GET_CLASS(MPS2TZMachineClass, obj, TYPE_MPS2TZ_MACHINE)
166
}
125
+#define MPS2TZ_MACHINE_CLASS(klass) \
167
126
+ OBJECT_CLASS_CHECK(MPS2TZMachineClass, klass, TYPE_MPS2TZ_MACHINE)
168
+float16 HELPER(recpe_f16)(float16 input, void *fpstp)
127
+
169
+{
128
+/* Main SYSCLK frequency in Hz */
170
+ float_status *fpst = fpstp;
129
+#define SYSCLK_FRQ 20000000
171
+ float16 f16 = float16_squash_input_denormal(input, fpst);
130
+
172
+ uint32_t f16_val = float16_val(f16);
131
+/* Initialize the auxiliary RAM region @mr and map it into
173
+ uint32_t f16_sign = float16_is_neg(f16);
132
+ * the memory map at @base.
174
+ int f16_exp = extract32(f16_val, 10, 5);
133
+ */
175
+ uint32_t f16_frac = extract32(f16_val, 0, 10);
134
+static void make_ram(MemoryRegion *mr, const char *name,
176
+ uint64_t f64_frac;
135
+ hwaddr base, hwaddr size)
177
+
136
+{
178
+ if (float16_is_any_nan(f16)) {
137
+ memory_region_init_ram(mr, NULL, name, size, &error_fatal);
179
+ float16 nan = f16;
138
+ memory_region_add_subregion(get_system_memory(), base, mr);
180
+ if (float16_is_signaling_nan(f16, fpst)) {
139
+}
181
+ float_raise(float_flag_invalid, fpst);
140
+
182
+ nan = float16_maybe_silence_nan(f16, fpst);
141
+/* Create an alias of an entire original MemoryRegion @orig
142
+ * located at @base in the memory map.
143
+ */
144
+static void make_ram_alias(MemoryRegion *mr, const char *name,
145
+ MemoryRegion *orig, hwaddr base)
146
+{
147
+ memory_region_init_alias(mr, NULL, name, orig, 0,
148
+ memory_region_size(orig));
149
+ memory_region_add_subregion(get_system_memory(), base, mr);
150
+}
151
+
152
+static void init_sysbus_child(Object *parent, const char *childname,
153
+ void *child, size_t childsize,
154
+ const char *childtype)
155
+{
156
+ object_initialize(child, childsize, childtype);
157
+ object_property_add_child(parent, childname, OBJECT(child), &error_abort);
158
+ qdev_set_parent_bus(DEVICE(child), sysbus_get_default());
159
+
160
+}
161
+
162
+/* Most of the devices in the AN505 FPGA image sit behind
163
+ * Peripheral Protection Controllers. These data structures
164
+ * define the layout of which devices sit behind which PPCs.
165
+ * The devfn for each port is a function which creates, configures
166
+ * and initializes the device, returning the MemoryRegion which
167
+ * needs to be plugged into the downstream end of the PPC port.
168
+ */
169
+typedef MemoryRegion *MakeDevFn(MPS2TZMachineState *mms, void *opaque,
170
+ const char *name, hwaddr size);
171
+
172
+typedef struct PPCPortInfo {
173
+ const char *name;
174
+ MakeDevFn *devfn;
175
+ void *opaque;
176
+ hwaddr addr;
177
+ hwaddr size;
178
+} PPCPortInfo;
179
+
180
+typedef struct PPCInfo {
181
+ const char *name;
182
+ PPCPortInfo ports[TZ_NUM_PORTS];
183
+} PPCInfo;
184
+
185
+static MemoryRegion *make_unimp_dev(MPS2TZMachineState *mms,
186
+ void *opaque,
187
+ const char *name, hwaddr size)
188
+{
189
+ /* Initialize, configure and realize a TYPE_UNIMPLEMENTED_DEVICE,
190
+ * and return a pointer to its MemoryRegion.
191
+ */
192
+ UnimplementedDeviceState *uds = opaque;
193
+
194
+ init_sysbus_child(OBJECT(mms), name, uds,
195
+ sizeof(UnimplementedDeviceState),
196
+ TYPE_UNIMPLEMENTED_DEVICE);
197
+ qdev_prop_set_string(DEVICE(uds), "name", name);
198
+ qdev_prop_set_uint64(DEVICE(uds), "size", size);
199
+ object_property_set_bool(OBJECT(uds), true, "realized", &error_fatal);
200
+ return sysbus_mmio_get_region(SYS_BUS_DEVICE(uds), 0);
201
+}
202
+
203
+static MemoryRegion *make_uart(MPS2TZMachineState *mms, void *opaque,
204
+ const char *name, hwaddr size)
205
+{
206
+ CMSDKAPBUART *uart = opaque;
207
+ int i = uart - &mms->uart[0];
208
+ Chardev *uartchr = i < MAX_SERIAL_PORTS ? serial_hds[i] : NULL;
209
+ int rxirqno = i * 2;
210
+ int txirqno = i * 2 + 1;
211
+ int combirqno = i + 10;
212
+ SysBusDevice *s;
213
+ DeviceState *iotkitdev = DEVICE(&mms->iotkit);
214
+ DeviceState *orgate_dev = DEVICE(&mms->uart_irq_orgate);
215
+
216
+ init_sysbus_child(OBJECT(mms), name, uart,
217
+ sizeof(mms->uart[0]), TYPE_CMSDK_APB_UART);
218
+ qdev_prop_set_chr(DEVICE(uart), "chardev", uartchr);
219
+ qdev_prop_set_uint32(DEVICE(uart), "pclk-frq", SYSCLK_FRQ);
220
+ object_property_set_bool(OBJECT(uart), true, "realized", &error_fatal);
221
+ s = SYS_BUS_DEVICE(uart);
222
+ sysbus_connect_irq(s, 0, qdev_get_gpio_in_named(iotkitdev,
223
+ "EXP_IRQ", txirqno));
224
+ sysbus_connect_irq(s, 1, qdev_get_gpio_in_named(iotkitdev,
225
+ "EXP_IRQ", rxirqno));
226
+ sysbus_connect_irq(s, 2, qdev_get_gpio_in(orgate_dev, i * 2));
227
+ sysbus_connect_irq(s, 3, qdev_get_gpio_in(orgate_dev, i * 2 + 1));
228
+ sysbus_connect_irq(s, 4, qdev_get_gpio_in_named(iotkitdev,
229
+ "EXP_IRQ", combirqno));
230
+ return sysbus_mmio_get_region(SYS_BUS_DEVICE(uart), 0);
231
+}
232
+
233
+static MemoryRegion *make_scc(MPS2TZMachineState *mms, void *opaque,
234
+ const char *name, hwaddr size)
235
+{
236
+ MPS2SCC *scc = opaque;
237
+ DeviceState *sccdev;
238
+ MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_GET_CLASS(mms);
239
+
240
+ object_initialize(scc, sizeof(mms->scc), TYPE_MPS2_SCC);
241
+ sccdev = DEVICE(scc);
242
+ qdev_set_parent_bus(sccdev, sysbus_get_default());
243
+ qdev_prop_set_uint32(sccdev, "scc-cfg4", 0x2);
244
+ qdev_prop_set_uint32(sccdev, "scc-aid", 0x02000008);
245
+ qdev_prop_set_uint32(sccdev, "scc-id", mmc->scc_id);
246
+ object_property_set_bool(OBJECT(scc), true, "realized", &error_fatal);
247
+ return sysbus_mmio_get_region(SYS_BUS_DEVICE(sccdev), 0);
248
+}
249
+
250
+static MemoryRegion *make_fpgaio(MPS2TZMachineState *mms, void *opaque,
251
+ const char *name, hwaddr size)
252
+{
253
+ MPS2FPGAIO *fpgaio = opaque;
254
+
255
+ object_initialize(fpgaio, sizeof(mms->fpgaio), TYPE_MPS2_FPGAIO);
256
+ qdev_set_parent_bus(DEVICE(fpgaio), sysbus_get_default());
257
+ object_property_set_bool(OBJECT(fpgaio), true, "realized", &error_fatal);
258
+ return sysbus_mmio_get_region(SYS_BUS_DEVICE(fpgaio), 0);
259
+}
260
+
261
+static void mps2tz_common_init(MachineState *machine)
262
+{
263
+ MPS2TZMachineState *mms = MPS2TZ_MACHINE(machine);
264
+ MachineClass *mc = MACHINE_GET_CLASS(machine);
265
+ MemoryRegion *system_memory = get_system_memory();
266
+ DeviceState *iotkitdev;
267
+ DeviceState *dev_splitter;
268
+ int i;
269
+
270
+ if (strcmp(machine->cpu_type, mc->default_cpu_type) != 0) {
271
+ error_report("This board can only be used with CPU %s",
272
+ mc->default_cpu_type);
273
+ exit(1);
274
+ }
275
+
276
+ init_sysbus_child(OBJECT(machine), "iotkit", &mms->iotkit,
277
+ sizeof(mms->iotkit), TYPE_IOTKIT);
278
+ iotkitdev = DEVICE(&mms->iotkit);
279
+ object_property_set_link(OBJECT(&mms->iotkit), OBJECT(system_memory),
280
+ "memory", &error_abort);
281
+ qdev_prop_set_uint32(iotkitdev, "EXP_NUMIRQ", 92);
282
+ qdev_prop_set_uint32(iotkitdev, "MAINCLK", SYSCLK_FRQ);
283
+ object_property_set_bool(OBJECT(&mms->iotkit), true, "realized",
284
+ &error_fatal);
285
+
286
+ /* The sec_resp_cfg output from the IoTKit must be split into multiple
287
+ * lines, one for each of the PPCs we create here.
288
+ */
289
+ object_initialize(&mms->sec_resp_splitter, sizeof(mms->sec_resp_splitter),
290
+ TYPE_SPLIT_IRQ);
291
+ object_property_add_child(OBJECT(machine), "sec-resp-splitter",
292
+ OBJECT(&mms->sec_resp_splitter), &error_abort);
293
+ object_property_set_int(OBJECT(&mms->sec_resp_splitter), 5,
294
+ "num-lines", &error_fatal);
295
+ object_property_set_bool(OBJECT(&mms->sec_resp_splitter), true,
296
+ "realized", &error_fatal);
297
+ dev_splitter = DEVICE(&mms->sec_resp_splitter);
298
+ qdev_connect_gpio_out_named(iotkitdev, "sec_resp_cfg", 0,
299
+ qdev_get_gpio_in(dev_splitter, 0));
300
+
301
+ /* The IoTKit sets up much of the memory layout, including
302
+ * the aliases between secure and non-secure regions in the
303
+ * address space. The FPGA itself contains:
304
+ *
305
+ * 0x00000000..0x003fffff SSRAM1
306
+ * 0x00400000..0x007fffff alias of SSRAM1
307
+ * 0x28000000..0x283fffff 4MB SSRAM2 + SSRAM3
308
+ * 0x40100000..0x4fffffff AHB Master Expansion 1 interface devices
309
+ * 0x80000000..0x80ffffff 16MB PSRAM
310
+ */
311
+
312
+ /* The FPGA images have an odd combination of different RAMs,
313
+ * because in hardware they are different implementations and
314
+ * connected to different buses, giving varying performance/size
315
+ * tradeoffs. For QEMU they're all just RAM, though. We arbitrarily
316
+ * call the 16MB our "system memory", as it's the largest lump.
317
+ */
318
+ memory_region_allocate_system_memory(&mms->psram,
319
+ NULL, "mps.ram", 0x01000000);
320
+ memory_region_add_subregion(system_memory, 0x80000000, &mms->psram);
321
+
322
+ /* The SSRAM memories should all be behind Memory Protection Controllers,
323
+ * but we don't implement that yet.
324
+ */
325
+ make_ram(&mms->ssram1, "mps.ssram1", 0x00000000, 0x00400000);
326
+ make_ram_alias(&mms->ssram1_m, "mps.ssram1_m", &mms->ssram1, 0x00400000);
327
+
328
+ make_ram(&mms->ssram23, "mps.ssram23", 0x28000000, 0x00400000);
329
+
330
+ /* The overflow IRQs for all UARTs are ORed together.
331
+ * Tx, Rx and "combined" IRQs are sent to the NVIC separately.
332
+ * Create the OR gate for this.
333
+ */
334
+ object_initialize(&mms->uart_irq_orgate, sizeof(mms->uart_irq_orgate),
335
+ TYPE_OR_IRQ);
336
+ object_property_add_child(OBJECT(mms), "uart-irq-orgate",
337
+ OBJECT(&mms->uart_irq_orgate), &error_abort);
338
+ object_property_set_int(OBJECT(&mms->uart_irq_orgate), 10, "num-lines",
339
+ &error_fatal);
340
+ object_property_set_bool(OBJECT(&mms->uart_irq_orgate), true,
341
+ "realized", &error_fatal);
342
+ qdev_connect_gpio_out(DEVICE(&mms->uart_irq_orgate), 0,
343
+ qdev_get_gpio_in_named(iotkitdev, "EXP_IRQ", 15));
344
+
345
+ /* Most of the devices in the FPGA are behind Peripheral Protection
346
+ * Controllers. The required order for initializing things is:
347
+ * + initialize the PPC
348
+ * + initialize, configure and realize downstream devices
349
+ * + connect downstream device MemoryRegions to the PPC
350
+ * + realize the PPC
351
+ * + map the PPC's MemoryRegions to the places in the address map
352
+ * where the downstream devices should appear
353
+ * + wire up the PPC's control lines to the IoTKit object
354
+ */
355
+
356
+ const PPCInfo ppcs[] = { {
357
+ .name = "apb_ppcexp0",
358
+ .ports = {
359
+ { "ssram-mpc0", make_unimp_dev, &mms->ssram_mpc[0],
360
+ 0x58007000, 0x1000 },
361
+ { "ssram-mpc1", make_unimp_dev, &mms->ssram_mpc[1],
362
+ 0x58008000, 0x1000 },
363
+ { "ssram-mpc2", make_unimp_dev, &mms->ssram_mpc[2],
364
+ 0x58009000, 0x1000 },
365
+ },
366
+ }, {
367
+ .name = "apb_ppcexp1",
368
+ .ports = {
369
+ { "spi0", make_unimp_dev, &mms->spi[0], 0x40205000, 0x1000 },
370
+ { "spi1", make_unimp_dev, &mms->spi[1], 0x40206000, 0x1000 },
371
+ { "spi2", make_unimp_dev, &mms->spi[2], 0x40209000, 0x1000 },
372
+ { "spi3", make_unimp_dev, &mms->spi[3], 0x4020a000, 0x1000 },
373
+ { "spi4", make_unimp_dev, &mms->spi[4], 0x4020b000, 0x1000 },
374
+ { "uart0", make_uart, &mms->uart[0], 0x40200000, 0x1000 },
375
+ { "uart1", make_uart, &mms->uart[1], 0x40201000, 0x1000 },
376
+ { "uart2", make_uart, &mms->uart[2], 0x40202000, 0x1000 },
377
+ { "uart3", make_uart, &mms->uart[3], 0x40203000, 0x1000 },
378
+ { "uart4", make_uart, &mms->uart[4], 0x40204000, 0x1000 },
379
+ { "i2c0", make_unimp_dev, &mms->i2c[0], 0x40207000, 0x1000 },
380
+ { "i2c1", make_unimp_dev, &mms->i2c[1], 0x40208000, 0x1000 },
381
+ { "i2c2", make_unimp_dev, &mms->i2c[2], 0x4020c000, 0x1000 },
382
+ { "i2c3", make_unimp_dev, &mms->i2c[3], 0x4020d000, 0x1000 },
383
+ },
384
+ }, {
385
+ .name = "apb_ppcexp2",
386
+ .ports = {
387
+ { "scc", make_scc, &mms->scc, 0x40300000, 0x1000 },
388
+ { "i2s-audio", make_unimp_dev, &mms->i2s_audio,
389
+ 0x40301000, 0x1000 },
390
+ { "fpgaio", make_fpgaio, &mms->fpgaio, 0x40302000, 0x1000 },
391
+ },
392
+ }, {
393
+ .name = "ahb_ppcexp0",
394
+ .ports = {
395
+ { "gfx", make_unimp_dev, &mms->gfx, 0x41000000, 0x140000 },
396
+ { "gpio0", make_unimp_dev, &mms->gpio[0], 0x40100000, 0x1000 },
397
+ { "gpio1", make_unimp_dev, &mms->gpio[1], 0x40101000, 0x1000 },
398
+ { "gpio2", make_unimp_dev, &mms->gpio[2], 0x40102000, 0x1000 },
399
+ { "gpio3", make_unimp_dev, &mms->gpio[3], 0x40103000, 0x1000 },
400
+ { "gpio4", make_unimp_dev, &mms->gpio[4], 0x40104000, 0x1000 },
401
+ },
402
+ }, {
403
+ .name = "ahb_ppcexp1",
404
+ .ports = {
405
+ { "dma0", make_unimp_dev, &mms->dma[0], 0x40110000, 0x1000 },
406
+ { "dma1", make_unimp_dev, &mms->dma[1], 0x40111000, 0x1000 },
407
+ { "dma2", make_unimp_dev, &mms->dma[2], 0x40112000, 0x1000 },
408
+ { "dma3", make_unimp_dev, &mms->dma[3], 0x40113000, 0x1000 },
409
+ },
410
+ },
411
+ };
412
+
413
+ for (i = 0; i < ARRAY_SIZE(ppcs); i++) {
414
+ const PPCInfo *ppcinfo = &ppcs[i];
415
+ TZPPC *ppc = &mms->ppc[i];
416
+ DeviceState *ppcdev;
417
+ int port;
418
+ char *gpioname;
419
+
420
+ init_sysbus_child(OBJECT(machine), ppcinfo->name, ppc,
421
+ sizeof(TZPPC), TYPE_TZ_PPC);
422
+ ppcdev = DEVICE(ppc);
423
+
424
+ for (port = 0; port < TZ_NUM_PORTS; port++) {
425
+ const PPCPortInfo *pinfo = &ppcinfo->ports[port];
426
+ MemoryRegion *mr;
427
+ char *portname;
428
+
429
+ if (!pinfo->devfn) {
430
+ continue;
431
+ }
432
+
433
+ mr = pinfo->devfn(mms, pinfo->opaque, pinfo->name, pinfo->size);
434
+ portname = g_strdup_printf("port[%d]", port);
435
+ object_property_set_link(OBJECT(ppc), OBJECT(mr),
436
+ portname, &error_fatal);
437
+ g_free(portname);
183
+ }
438
+ }
184
+ if (fpst->default_nan_mode) {
439
+
185
+ nan = float16_default_nan(fpst);
440
+ object_property_set_bool(OBJECT(ppc), true, "realized", &error_fatal);
441
+
442
+ for (port = 0; port < TZ_NUM_PORTS; port++) {
443
+ const PPCPortInfo *pinfo = &ppcinfo->ports[port];
444
+
445
+ if (!pinfo->devfn) {
446
+ continue;
447
+ }
448
+ sysbus_mmio_map(SYS_BUS_DEVICE(ppc), port, pinfo->addr);
449
+
450
+ gpioname = g_strdup_printf("%s_nonsec", ppcinfo->name);
451
+ qdev_connect_gpio_out_named(iotkitdev, gpioname, port,
452
+ qdev_get_gpio_in_named(ppcdev,
453
+ "cfg_nonsec",
454
+ port));
455
+ g_free(gpioname);
456
+ gpioname = g_strdup_printf("%s_ap", ppcinfo->name);
457
+ qdev_connect_gpio_out_named(iotkitdev, gpioname, port,
458
+ qdev_get_gpio_in_named(ppcdev,
459
+ "cfg_ap", port));
460
+ g_free(gpioname);
186
+ }
461
+ }
187
+ return nan;
462
+
188
+ } else if (float16_is_infinity(f16)) {
463
+ gpioname = g_strdup_printf("%s_irq_enable", ppcinfo->name);
189
+ return float16_set_sign(float16_zero, float16_is_neg(f16));
464
+ qdev_connect_gpio_out_named(iotkitdev, gpioname, 0,
190
+ } else if (float16_is_zero(f16)) {
465
+ qdev_get_gpio_in_named(ppcdev,
191
+ float_raise(float_flag_divbyzero, fpst);
466
+ "irq_enable", 0));
192
+ return float16_set_sign(float16_infinity, float16_is_neg(f16));
467
+ g_free(gpioname);
193
+ } else if (float16_abs(f16) < (1 << 8)) {
468
+ gpioname = g_strdup_printf("%s_irq_clear", ppcinfo->name);
194
+ /* Abs(value) < 2.0^-16 */
469
+ qdev_connect_gpio_out_named(iotkitdev, gpioname, 0,
195
+ float_raise(float_flag_overflow | float_flag_inexact, fpst);
470
+ qdev_get_gpio_in_named(ppcdev,
196
+ if (round_to_inf(fpst, f16_sign)) {
471
+ "irq_clear", 0));
197
+ return float16_set_sign(float16_infinity, f16_sign);
472
+ g_free(gpioname);
198
+ } else {
473
+ gpioname = g_strdup_printf("%s_irq_status", ppcinfo->name);
199
+ return float16_set_sign(float16_maxnorm, f16_sign);
474
+ qdev_connect_gpio_out_named(ppcdev, "irq", 0,
200
+ }
475
+ qdev_get_gpio_in_named(iotkitdev,
201
+ } else if (f16_exp >= 29 && fpst->flush_to_zero) {
476
+ gpioname, 0));
202
+ float_raise(float_flag_underflow, fpst);
477
+ g_free(gpioname);
203
+ return float16_set_sign(float16_zero, float16_is_neg(f16));
478
+
479
+ qdev_connect_gpio_out(dev_splitter, i,
480
+ qdev_get_gpio_in_named(ppcdev,
481
+ "cfg_sec_resp", 0));
204
+ }
482
+ }
205
+
483
+
206
+ f64_frac = call_recip_estimate(&f16_exp, 29,
484
+ /* In hardware this is a LAN9220; the LAN9118 is software compatible
207
+ ((uint64_t) f16_frac) << (52 - 10));
485
+ * except that it doesn't support the checksum-offload feature.
208
+
486
+ * The ethernet controller is not behind a PPC.
209
+ /* result = sign : result_exp<4:0> : fraction<51:42> */
487
+ */
210
+ f16_val = deposit32(0, 15, 1, f16_sign);
488
+ lan9118_init(&nd_table[0], 0x42000000,
211
+ f16_val = deposit32(f16_val, 10, 5, f16_exp);
489
+ qdev_get_gpio_in_named(iotkitdev, "EXP_IRQ", 16));
212
+ f16_val = deposit32(f16_val, 0, 10, extract64(f64_frac, 52 - 10, 10));
490
+
213
+ return make_float16(f16_val);
491
+ create_unimplemented_device("FPGA NS PC", 0x48007000, 0x1000);
214
+}
492
+
215
+
493
+ armv7m_load_kernel(ARM_CPU(first_cpu), machine->kernel_filename, 0x400000);
216
float32 HELPER(recpe_f32)(float32 input, void *fpstp)
494
+}
217
{
495
+
218
float_status *fpst = fpstp;
496
+static void mps2tz_class_init(ObjectClass *oc, void *data)
219
float32 f32 = float32_squash_input_denormal(input, fpst);
497
+{
220
uint32_t f32_val = float32_val(f32);
498
+ MachineClass *mc = MACHINE_CLASS(oc);
221
- uint32_t f32_sbit = 0x80000000ULL & f32_val;
499
+
222
- int32_t f32_exp = extract32(f32_val, 23, 8);
500
+ mc->init = mps2tz_common_init;
223
+ bool f32_sign = float32_is_neg(f32);
501
+ mc->max_cpus = 1;
224
+ int f32_exp = extract32(f32_val, 23, 8);
502
+}
225
uint32_t f32_frac = extract32(f32_val, 0, 23);
503
+
226
- float64 f64, r64;
504
+static void mps2tz_an505_class_init(ObjectClass *oc, void *data)
227
- uint64_t r64_val;
505
+{
228
- int64_t r64_exp;
506
+ MachineClass *mc = MACHINE_CLASS(oc);
229
- uint64_t r64_frac;
507
+ MPS2TZMachineClass *mmc = MPS2TZ_MACHINE_CLASS(oc);
230
+ uint64_t f64_frac;
508
+
231
509
+ mc->desc = "ARM MPS2 with AN505 FPGA image for Cortex-M33";
232
if (float32_is_any_nan(f32)) {
510
+ mmc->fpga_type = FPGA_AN505;
233
float32 nan = f32;
511
+ mc->default_cpu_type = ARM_CPU_TYPE_NAME("cortex-m33");
234
@@ -XXX,XX +XXX,XX @@ float32 HELPER(recpe_f32)(float32 input, void *fpstp)
512
+ mmc->scc_id = 0x41040000 | (505 << 4);
235
} else if (float32_is_zero(f32)) {
513
+}
236
float_raise(float_flag_divbyzero, fpst);
514
+
237
return float32_set_sign(float32_infinity, float32_is_neg(f32));
515
+static const TypeInfo mps2tz_info = {
238
- } else if ((f32_val & ~(1ULL << 31)) < (1ULL << 21)) {
516
+ .name = TYPE_MPS2TZ_MACHINE,
239
+ } else if (float32_abs(f32) < (1ULL << 21)) {
517
+ .parent = TYPE_MACHINE,
240
/* Abs(value) < 2.0^-128 */
518
+ .abstract = true,
241
float_raise(float_flag_overflow | float_flag_inexact, fpst);
519
+ .instance_size = sizeof(MPS2TZMachineState),
242
- if (round_to_inf(fpst, f32_sbit)) {
520
+ .class_size = sizeof(MPS2TZMachineClass),
243
- return float32_set_sign(float32_infinity, float32_is_neg(f32));
521
+ .class_init = mps2tz_class_init,
244
+ if (round_to_inf(fpst, f32_sign)) {
522
+};
245
+ return float32_set_sign(float32_infinity, f32_sign);
523
+
246
} else {
524
+static const TypeInfo mps2tz_an505_info = {
247
- return float32_set_sign(float32_maxnorm, float32_is_neg(f32));
525
+ .name = TYPE_MPS2TZ_AN505_MACHINE,
248
+ return float32_set_sign(float32_maxnorm, f32_sign);
526
+ .parent = TYPE_MPS2TZ_MACHINE,
249
}
527
+ .class_init = mps2tz_an505_class_init,
250
} else if (f32_exp >= 253 && fpst->flush_to_zero) {
528
+};
251
float_raise(float_flag_underflow, fpst);
529
+
252
return float32_set_sign(float32_zero, float32_is_neg(f32));
530
+static void mps2tz_machine_init(void)
253
}
531
+{
254
532
+ type_register_static(&mps2tz_info);
255
+ f64_frac = call_recip_estimate(&f32_exp, 253,
533
+ type_register_static(&mps2tz_an505_info);
256
+ ((uint64_t) f32_frac) << (52 - 23));
534
+}
257
535
+
258
- f64 = make_float64(((int64_t)(f32_exp) << 52) | (int64_t)(f32_frac) << 29);
536
+type_init(mps2tz_machine_init);
259
- r64 = call_recip_estimate(f64, 253, fpst);
260
- r64_val = float64_val(r64);
261
- r64_exp = extract64(r64_val, 52, 11);
262
- r64_frac = extract64(r64_val, 0, 52);
263
-
264
- /* result = sign : result_exp<7:0> : fraction<51:29>; */
265
- return make_float32(f32_sbit |
266
- (r64_exp & 0xff) << 23 |
267
- extract64(r64_frac, 29, 24));
268
+ /* result = sign : result_exp<7:0> : fraction<51:29> */
269
+ f32_val = deposit32(0, 31, 1, f32_sign);
270
+ f32_val = deposit32(f32_val, 23, 8, f32_exp);
271
+ f32_val = deposit32(f32_val, 0, 23, extract64(f64_frac, 52 - 23, 23));
272
+ return make_float32(f32_val);
273
}
274
275
float64 HELPER(recpe_f64)(float64 input, void *fpstp)
276
@@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp)
277
float_status *fpst = fpstp;
278
float64 f64 = float64_squash_input_denormal(input, fpst);
279
uint64_t f64_val = float64_val(f64);
280
- uint64_t f64_sbit = 0x8000000000000000ULL & f64_val;
281
- int64_t f64_exp = extract64(f64_val, 52, 11);
282
- float64 r64;
283
- uint64_t r64_val;
284
- int64_t r64_exp;
285
- uint64_t r64_frac;
286
+ bool f64_sign = float64_is_neg(f64);
287
+ int f64_exp = extract64(f64_val, 52, 11);
288
+ uint64_t f64_frac = extract64(f64_val, 0, 52);
289
290
/* Deal with any special cases */
291
if (float64_is_any_nan(f64)) {
292
@@ -XXX,XX +XXX,XX @@ float64 HELPER(recpe_f64)(float64 input, void *fpstp)
293
} else if ((f64_val & ~(1ULL << 63)) < (1ULL << 50)) {
294
/* Abs(value) < 2.0^-1024 */
295
float_raise(float_flag_overflow | float_flag_inexact, fpst);
296
- if (round_to_inf(fpst, f64_sbit)) {
297
- return float64_set_sign(float64_infinity, float64_is_neg(f64));
298
+ if (round_to_inf(fpst, f64_sign)) {
299
+ return float64_set_sign(float64_infinity, f64_sign);
300
} else {
301
- return float64_set_sign(float64_maxnorm, float64_is_neg(f64));
302
+ return float64_set_sign(float64_maxnorm, f64_sign);
303
}
304
} else if (f64_exp >= 2045 && fpst->flush_to_zero) {
305
float_raise(float_flag_underflow, fpst);
306
return float64_set_sign(float64_zero, float64_is_neg(f64));
307
}
308
309
- r64 = call_recip_estimate(f64, 2045, fpst);
310
- r64_val = float64_val(r64);
311
- r64_exp = extract64(r64_val, 52, 11);
312
- r64_frac = extract64(r64_val, 0, 52);
313
+ f64_frac = call_recip_estimate(&f64_exp, 2045, f64_frac);
314
315
- /* result = sign : result_exp<10:0> : fraction<51:0> */
316
- return make_float64(f64_sbit |
317
- ((r64_exp & 0x7ff) << 52) |
318
- r64_frac);
319
+ /* result = sign : result_exp<10:0> : fraction<51:0>; */
320
+ f64_val = deposit64(0, 63, 1, f64_sign);
321
+ f64_val = deposit64(f64_val, 52, 11, f64_exp);
322
+ f64_val = deposit64(f64_val, 0, 52, f64_frac);
323
+ return make_float64(f64_val);
324
}
325
326
/* The algorithm that must be used to calculate the estimate
327
@@ -XXX,XX +XXX,XX @@ float64 HELPER(rsqrte_f64)(float64 input, void *fpstp)
328
329
uint32_t HELPER(recpe_u32)(uint32_t a, void *fpstp)
330
{
331
- float_status *s = fpstp;
332
- float64 f64;
333
+ /* float_status *s = fpstp; */
334
+ int input, estimate;
335
336
if ((a & 0x80000000) == 0) {
337
return 0xffffffff;
338
}
339
340
- f64 = make_float64((0x3feULL << 52)
341
- | ((int64_t)(a & 0x7fffffff) << 21));
342
+ input = extract32(a, 23, 9);
343
+ estimate = recip_estimate(input);
344
345
- f64 = recip_estimate(f64, s);
346
-
347
- return 0x80000000 | ((float64_val(f64) >> 21) & 0x7fffffff);
348
+ return deposit32(0, (32 - 9), 9, estimate);
349
}
350
351
uint32_t HELPER(rsqrte_u32)(uint32_t a, void *fpstp)
352
--
537
--
353
2.16.2
538
2.16.2
354
539
355
540
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
3
Not enabled anywhere yet.
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
4
5
Message-id: 20180227143852.11175-3-alex.bennee@linaro.org
5
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
6
[PMM: postpone actually enabling feature until end of the
6
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
7
patch series]
7
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
Message-id: 20180228193125.20577-2-richard.henderson@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
10
---
10
target/arm/cpu.h | 1 +
11
target/arm/cpu.h | 1 +
11
1 file changed, 1 insertion(+)
12
linux-user/elfload.c | 1 +
13
2 files changed, 2 insertions(+)
12
14
13
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
15
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
14
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/cpu.h
17
--- a/target/arm/cpu.h
16
+++ b/target/arm/cpu.h
18
+++ b/target/arm/cpu.h
17
@@ -XXX,XX +XXX,XX @@ enum arm_features {
19
@@ -XXX,XX +XXX,XX @@ enum arm_features {
18
ARM_FEATURE_V8_SHA3, /* implements SHA3 part of v8 Crypto Extensions */
20
ARM_FEATURE_V8_SHA3, /* implements SHA3 part of v8 Crypto Extensions */
19
ARM_FEATURE_V8_SM3, /* implements SM3 part of v8 Crypto Extensions */
21
ARM_FEATURE_V8_SM3, /* implements SM3 part of v8 Crypto Extensions */
20
ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */
22
ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */
21
+ ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */
23
+ ARM_FEATURE_V8_RDM, /* implements v8.1 simd round multiply */
24
ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */
22
};
25
};
23
26
24
static inline int arm_feature(CPUARMState *env, int feature)
27
diff --git a/linux-user/elfload.c b/linux-user/elfload.c
28
index XXXXXXX..XXXXXXX 100644
29
--- a/linux-user/elfload.c
30
+++ b/linux-user/elfload.c
31
@@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void)
32
GET_FEATURE(ARM_FEATURE_V8_SHA512, ARM_HWCAP_A64_SHA512);
33
GET_FEATURE(ARM_FEATURE_V8_FP16,
34
ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP);
35
+ GET_FEATURE(ARM_FEATURE_V8_RDM, ARM_HWCAP_A64_ASIMDRDM);
36
#undef GET_FEATURE
37
38
return hwcaps;
25
--
39
--
26
2.16.2
40
2.16.2
27
41
28
42
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
The helpers use the new re-factored muladd support in SoftFloat for
3
Include the U bit in the switches rather than testing separately.
4
the float16 work.
4
5
5
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
6
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
6
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
7
Message-id: 20180227143852.11175-15-alex.bennee@linaro.org
7
Message-id: 20180228193125.20577-3-richard.henderson@linaro.org
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
---
9
---
11
target/arm/translate-a64.c | 82 +++++++++++++++++++++++++++++++++++++---------
10
target/arm/translate-a64.c | 129 +++++++++++++++++++++------------------------
12
1 file changed, 66 insertions(+), 16 deletions(-)
11
1 file changed, 61 insertions(+), 68 deletions(-)
13
12
14
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
13
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/translate-a64.c
15
--- a/target/arm/translate-a64.c
17
+++ b/target/arm/translate-a64.c
16
+++ b/target/arm/translate-a64.c
18
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
17
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
19
int rd = extract32(insn, 0, 5);
20
bool is_long = false;
21
bool is_fp = false;
22
+ bool is_fp16 = false;
23
int index;
18
int index;
24
TCGv_ptr fpst;
19
TCGv_ptr fpst;
25
20
26
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
21
- switch (opcode) {
27
}
22
- case 0x0: /* MLA */
28
/* fall through */
23
- case 0x4: /* MLS */
29
case 0x9: /* FMUL, FMULX */
24
- if (!u || is_scalar) {
30
- if (!extract32(size, 1, 1)) {
25
+ switch (16 * u + opcode) {
31
+ if (size == 1) {
26
+ case 0x08: /* MUL */
27
+ case 0x10: /* MLA */
28
+ case 0x14: /* MLS */
29
+ if (is_scalar) {
32
unallocated_encoding(s);
30
unallocated_encoding(s);
33
return;
31
return;
34
}
32
}
35
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
33
break;
36
}
34
- case 0x2: /* SMLAL, SMLAL2, UMLAL, UMLAL2 */
37
35
- case 0x6: /* SMLSL, SMLSL2, UMLSL, UMLSL2 */
38
if (is_fp) {
36
- case 0xa: /* SMULL, SMULL2, UMULL, UMULL2 */
39
- /* low bit of size indicates single/double */
37
+ case 0x02: /* SMLAL, SMLAL2 */
40
- size = extract32(size, 0, 1) ? 3 : 2;
38
+ case 0x12: /* UMLAL, UMLAL2 */
41
- if (size == 2) {
39
+ case 0x06: /* SMLSL, SMLSL2 */
42
+ /* convert insn encoded size to TCGMemOp size */
40
+ case 0x16: /* UMLSL, UMLSL2 */
43
+ switch (size) {
41
+ case 0x0a: /* SMULL, SMULL2 */
44
+ case 2: /* single precision */
42
+ case 0x1a: /* UMULL, UMULL2 */
45
+ size = MO_32;
43
if (is_scalar) {
46
index = h << 1 | l;
44
unallocated_encoding(s);
47
- } else {
45
return;
48
+ rm |= (m << 4);
46
}
49
+ break;
47
is_long = true;
50
+ case 3: /* double precision */
48
break;
51
+ size = MO_64;
49
- case 0x3: /* SQDMLAL, SQDMLAL2 */
52
if (l || !is_q) {
50
- case 0x7: /* SQDMLSL, SQDMLSL2 */
53
unallocated_encoding(s);
51
- case 0xb: /* SQDMULL, SQDMULL2 */
54
return;
52
+ case 0x03: /* SQDMLAL, SQDMLAL2 */
53
+ case 0x07: /* SQDMLSL, SQDMLSL2 */
54
+ case 0x0b: /* SQDMULL, SQDMULL2 */
55
is_long = true;
56
- /* fall through */
57
- case 0xc: /* SQDMULH */
58
- case 0xd: /* SQRDMULH */
59
- if (u) {
60
- unallocated_encoding(s);
61
- return;
62
- }
63
break;
64
- case 0x8: /* MUL */
65
- if (u || is_scalar) {
66
- unallocated_encoding(s);
67
- return;
68
- }
69
+ case 0x0c: /* SQDMULH */
70
+ case 0x0d: /* SQRDMULH */
71
break;
72
- case 0x1: /* FMLA */
73
- case 0x5: /* FMLS */
74
- if (u) {
75
- unallocated_encoding(s);
76
- return;
77
- }
78
- /* fall through */
79
- case 0x9: /* FMUL, FMULX */
80
+ case 0x01: /* FMLA */
81
+ case 0x05: /* FMLS */
82
+ case 0x09: /* FMUL */
83
+ case 0x19: /* FMULX */
84
if (size == 1) {
85
unallocated_encoding(s);
86
return;
87
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
88
89
read_vec_element(s, tcg_op, rn, pass, MO_64);
90
91
- switch (opcode) {
92
- case 0x5: /* FMLS */
93
+ switch (16 * u + opcode) {
94
+ case 0x05: /* FMLS */
95
/* As usual for ARM, separate negation for fused multiply-add */
96
gen_helper_vfp_negd(tcg_op, tcg_op);
97
/* fall through */
98
- case 0x1: /* FMLA */
99
+ case 0x01: /* FMLA */
100
read_vec_element(s, tcg_res, rd, pass, MO_64);
101
gen_helper_vfp_muladdd(tcg_res, tcg_op, tcg_idx, tcg_res, fpst);
102
break;
103
- case 0x9: /* FMUL, FMULX */
104
- if (u) {
105
- gen_helper_vfp_mulxd(tcg_res, tcg_op, tcg_idx, fpst);
106
- } else {
107
- gen_helper_vfp_muld(tcg_res, tcg_op, tcg_idx, fpst);
108
- }
109
+ case 0x09: /* FMUL */
110
+ gen_helper_vfp_muld(tcg_res, tcg_op, tcg_idx, fpst);
111
+ break;
112
+ case 0x19: /* FMULX */
113
+ gen_helper_vfp_mulxd(tcg_res, tcg_op, tcg_idx, fpst);
114
break;
115
default:
116
g_assert_not_reached();
117
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
118
119
read_vec_element_i32(s, tcg_op, rn, pass, is_scalar ? size : MO_32);
120
121
- switch (opcode) {
122
- case 0x0: /* MLA */
123
- case 0x4: /* MLS */
124
- case 0x8: /* MUL */
125
+ switch (16 * u + opcode) {
126
+ case 0x08: /* MUL */
127
+ case 0x10: /* MLA */
128
+ case 0x14: /* MLS */
129
{
130
static NeonGenTwoOpFn * const fns[2][2] = {
131
{ gen_helper_neon_add_u16, gen_helper_neon_sub_u16 },
132
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
133
genfn(tcg_res, tcg_op, tcg_res);
134
break;
55
}
135
}
56
index = h;
136
- case 0x5: /* FMLS */
57
+ rm |= (m << 4);
137
- case 0x1: /* FMLA */
58
+ break;
138
+ case 0x05: /* FMLS */
59
+ case 0: /* half precision */
139
+ case 0x01: /* FMLA */
60
+ size = MO_16;
140
read_vec_element_i32(s, tcg_res, rd, pass,
61
+ index = h << 2 | l << 1 | m;
141
is_scalar ? size : MO_32);
62
+ is_fp16 = true;
142
switch (size) {
63
+ if (arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
143
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
64
+ break;
144
g_assert_not_reached();
65
+ }
145
}
66
+ /* fallthru */
146
break;
67
+ default: /* unallocated */
147
- case 0x9: /* FMUL, FMULX */
68
+ unallocated_encoding(s);
148
+ case 0x09: /* FMUL */
69
+ return;
149
switch (size) {
70
}
150
case 1:
71
- rm |= (m << 4);
151
- if (u) {
72
} else {
152
- if (is_scalar) {
73
switch (size) {
153
- gen_helper_advsimd_mulxh(tcg_res, tcg_op,
74
case 1:
154
- tcg_idx, fpst);
75
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
155
- } else {
76
}
156
- gen_helper_advsimd_mulx2h(tcg_res, tcg_op,
77
157
- tcg_idx, fpst);
78
if (is_fp) {
158
- }
79
- fpst = get_fpstatus_ptr(false);
159
+ if (is_scalar) {
80
+ fpst = get_fpstatus_ptr(is_fp16);
160
+ gen_helper_advsimd_mulh(tcg_res, tcg_op,
81
} else {
161
+ tcg_idx, fpst);
82
fpst = NULL;
162
} else {
83
}
163
- if (is_scalar) {
84
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
164
- gen_helper_advsimd_mulh(tcg_res, tcg_op,
85
break;
165
- tcg_idx, fpst);
86
}
166
- } else {
87
case 0x5: /* FMLS */
167
- gen_helper_advsimd_mul2h(tcg_res, tcg_op,
88
- /* As usual for ARM, separate negation for fused multiply-add */
168
- tcg_idx, fpst);
89
- gen_helper_vfp_negs(tcg_op, tcg_op);
169
- }
90
- /* fall through */
170
+ gen_helper_advsimd_mul2h(tcg_res, tcg_op,
91
case 0x1: /* FMLA */
171
+ tcg_idx, fpst);
92
- read_vec_element_i32(s, tcg_res, rd, pass, MO_32);
172
}
93
- gen_helper_vfp_muladds(tcg_res, tcg_op, tcg_idx, tcg_res, fpst);
173
break;
94
+ read_vec_element_i32(s, tcg_res, rd, pass,
174
case 2:
95
+ is_scalar ? size : MO_32);
175
- if (u) {
176
- gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst);
177
- } else {
178
- gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst);
179
- }
180
+ gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst);
181
break;
182
default:
183
g_assert_not_reached();
184
}
185
break;
186
- case 0xc: /* SQDMULH */
187
+ case 0x19: /* FMULX */
96
+ switch (size) {
188
+ switch (size) {
97
+ case 1:
189
+ case 1:
98
+ if (opcode == 0x5) {
190
+ if (is_scalar) {
99
+ /* As usual for ARM, separate negation for fused
191
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op,
100
+ * multiply-add */
192
+ tcg_idx, fpst);
101
+ tcg_gen_xori_i32(tcg_op, tcg_op, 0x80008000);
193
+ } else {
194
+ gen_helper_advsimd_mulx2h(tcg_res, tcg_op,
195
+ tcg_idx, fpst);
102
+ }
196
+ }
103
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op, tcg_idx,
104
+ tcg_res, fpst);
105
+ break;
197
+ break;
106
+ case 2:
198
+ case 2:
107
+ if (opcode == 0x5) {
199
+ gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst);
108
+ /* As usual for ARM, separate negation for
109
+ * fused multiply-add */
110
+ tcg_gen_xori_i32(tcg_op, tcg_op, 0x80000000);
111
+ }
112
+ gen_helper_vfp_muladds(tcg_res, tcg_op, tcg_idx,
113
+ tcg_res, fpst);
114
+ break;
200
+ break;
115
+ default:
201
+ default:
116
+ g_assert_not_reached();
202
+ g_assert_not_reached();
117
+ }
203
+ }
118
break;
204
+ break;
119
case 0x9: /* FMUL, FMULX */
205
+ case 0x0c: /* SQDMULH */
120
- if (u) {
206
if (size == 1) {
121
- gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst);
207
gen_helper_neon_qdmulh_s16(tcg_res, cpu_env,
122
- } else {
208
tcg_op, tcg_idx);
123
- gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst);
209
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
124
+ switch (size) {
210
tcg_op, tcg_idx);
125
+ case 1:
126
+ if (u) {
127
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op, tcg_idx,
128
+ fpst);
129
+ } else {
130
+ g_assert_not_reached();
131
+ }
132
+ break;
133
+ case 2:
134
+ if (u) {
135
+ gen_helper_vfp_mulxs(tcg_res, tcg_op, tcg_idx, fpst);
136
+ } else {
137
+ gen_helper_vfp_muls(tcg_res, tcg_op, tcg_idx, fpst);
138
+ }
139
+ break;
140
+ default:
141
+ g_assert_not_reached();
142
}
211
}
143
break;
212
break;
144
case 0xc: /* SQDMULH */
213
- case 0xd: /* SQRDMULH */
214
+ case 0x0d: /* SQRDMULH */
215
if (size == 1) {
216
gen_helper_neon_qrdmulh_s16(tcg_res, cpu_env,
217
tcg_op, tcg_idx);
145
--
218
--
146
2.16.2
219
2.16.2
147
220
148
221
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
Only one half-precision instruction has been added to this group.
3
The integer size check was already outside of the opcode switch;
4
move the floating-point size check outside as well. Unify the
5
size vs index adjustment between fp and integer paths.
4
6
5
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
7
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
7
Message-id: 20180227143852.11175-29-alex.bennee@linaro.org
9
Message-id: 20180228193125.20577-4-richard.henderson@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
11
---
10
target/arm/translate-a64.c | 35 +++++++++++++++++++++++++----------
12
target/arm/translate-a64.c | 65 +++++++++++++++++++++++-----------------------
11
1 file changed, 25 insertions(+), 10 deletions(-)
13
1 file changed, 32 insertions(+), 33 deletions(-)
12
14
13
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
15
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
14
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/translate-a64.c
17
--- a/target/arm/translate-a64.c
16
+++ b/target/arm/translate-a64.c
18
+++ b/target/arm/translate-a64.c
17
@@ -XXX,XX +XXX,XX @@ static void disas_simd_copy(DisasContext *s, uint32_t insn)
19
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
18
* MVNI - move inverted (shifted) imm into register
20
case 0x05: /* FMLS */
19
* ORR - bitwise OR of (shifted) imm with register
21
case 0x09: /* FMUL */
20
* BIC - bitwise clear of (shifted) imm with register
22
case 0x19: /* FMULX */
21
+ * With ARMv8.2 we also have:
23
- if (size == 1) {
22
+ * FMOV half-precision
24
- unallocated_encoding(s);
23
*/
25
- return;
24
static void disas_simd_mod_imm(DisasContext *s, uint32_t insn)
26
- }
25
{
27
is_fp = true;
26
@@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn)
28
break;
27
uint64_t imm = 0;
29
default:
28
30
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
29
if (o2 != 0 || ((cmode == 0xf) && is_neg && !is_q)) {
31
if (is_fp) {
30
- unallocated_encoding(s);
32
/* convert insn encoded size to TCGMemOp size */
31
- return;
33
switch (size) {
32
+ /* Check for FMOV (vector, immediate) - half-precision */
34
- case 2: /* single precision */
33
+ if (!(arm_dc_feature(s, ARM_FEATURE_V8_FP16) && o2 && cmode == 0xf)) {
35
- size = MO_32;
36
- index = h << 1 | l;
37
- rm |= (m << 4);
38
- break;
39
- case 3: /* double precision */
40
- size = MO_64;
41
- if (l || !is_q) {
42
+ case 0: /* half-precision */
43
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
44
unallocated_encoding(s);
45
return;
46
}
47
- index = h;
48
- rm |= (m << 4);
49
- break;
50
- case 0: /* half precision */
51
size = MO_16;
52
- index = h << 2 | l << 1 | m;
53
- is_fp16 = true;
54
- if (arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
55
- break;
56
- }
57
- /* fallthru */
58
- default: /* unallocated */
59
- unallocated_encoding(s);
60
- return;
61
- }
62
- } else {
63
- switch (size) {
64
- case 1:
65
- index = h << 2 | l << 1 | m;
66
break;
67
- case 2:
68
- index = h << 1 | l;
69
- rm |= (m << 4);
70
+ case MO_32: /* single precision */
71
+ case MO_64: /* double precision */
72
break;
73
default:
74
unallocated_encoding(s);
75
return;
76
}
77
+ } else {
78
+ switch (size) {
79
+ case MO_8:
80
+ case MO_64:
34
+ unallocated_encoding(s);
81
+ unallocated_encoding(s);
35
+ return;
82
+ return;
36
+ }
83
+ }
37
}
84
+ }
38
85
+
39
if (!fp_access_check(s)) {
86
+ /* Given TCGMemOp size, adjust register and indexing. */
40
@@ -XXX,XX +XXX,XX @@ static void disas_simd_mod_imm(DisasContext *s, uint32_t insn)
87
+ switch (size) {
41
imm |= 0x4000000000000000ULL;
88
+ case MO_16:
42
}
89
+ index = h << 2 | l << 1 | m;
43
} else {
90
+ break;
44
- imm = (abcdefgh & 0x3f) << 19;
91
+ case MO_32:
45
- if (abcdefgh & 0x80) {
92
+ index = h << 1 | l;
46
- imm |= 0x80000000;
93
+ rm |= m << 4;
47
- }
94
+ break;
48
- if (abcdefgh & 0x40) {
95
+ case MO_64:
49
- imm |= 0x3e000000;
96
+ if (l || !is_q) {
50
+ if (o2) {
97
+ unallocated_encoding(s);
51
+ /* FMOV (vector, immediate) - half-precision */
98
+ return;
52
+ imm = vfp_expand_imm(MO_16, abcdefgh);
99
+ }
53
+ /* now duplicate across the lanes */
100
+ index = h;
54
+ imm = bitfield_replicate(imm, 16);
101
+ rm |= m << 4;
55
} else {
102
+ break;
56
- imm |= 0x40000000;
57
+ imm = (abcdefgh & 0x3f) << 19;
58
+ if (abcdefgh & 0x80) {
59
+ imm |= 0x80000000;
60
+ }
61
+ if (abcdefgh & 0x40) {
62
+ imm |= 0x3e000000;
63
+ } else {
64
+ imm |= 0x40000000;
65
+ }
66
+ imm |= (imm << 32);
67
}
68
- imm |= (imm << 32);
69
}
70
}
71
break;
72
+ default:
103
+ default:
73
+ fprintf(stderr, "%s: cmode_3_1: %x\n", __func__, cmode_3_1);
74
+ g_assert_not_reached();
104
+ g_assert_not_reached();
75
}
105
}
76
106
77
if (cmode_3_1 != 7 && is_neg) {
107
if (!fp_access_check(s)) {
78
--
108
--
79
2.16.2
109
2.16.2
80
110
81
111
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This covers the encoding group:
3
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
4
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
Advanced SIMD scalar three same FP16
5
Message-id: 20180228193125.20577-5-richard.henderson@linaro.org
6
7
As all the helpers are already there it is simply a case of calling the
8
existing helpers in the scalar context.
9
10
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
11
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
12
Message-id: 20180227143852.11175-31-alex.bennee@linaro.org
13
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
14
---
7
---
15
target/arm/translate-a64.c | 99 ++++++++++++++++++++++++++++++++++++++++++++++
8
target/arm/Makefile.objs | 2 +-
16
1 file changed, 99 insertions(+)
9
target/arm/helper.h | 4 ++
17
10
target/arm/translate-a64.c | 84 ++++++++++++++++++++++++++++++++++
11
target/arm/vec_helper.c | 109 +++++++++++++++++++++++++++++++++++++++++++++
12
4 files changed, 198 insertions(+), 1 deletion(-)
13
create mode 100644 target/arm/vec_helper.c
14
15
diff --git a/target/arm/Makefile.objs b/target/arm/Makefile.objs
16
index XXXXXXX..XXXXXXX 100644
17
--- a/target/arm/Makefile.objs
18
+++ b/target/arm/Makefile.objs
19
@@ -XXX,XX +XXX,XX @@ obj-$(call land,$(CONFIG_KVM),$(call lnot,$(TARGET_AARCH64))) += kvm32.o
20
obj-$(call land,$(CONFIG_KVM),$(TARGET_AARCH64)) += kvm64.o
21
obj-$(call lnot,$(CONFIG_KVM)) += kvm-stub.o
22
obj-y += translate.o op_helper.o helper.o cpu.o
23
-obj-y += neon_helper.o iwmmxt_helper.o
24
+obj-y += neon_helper.o iwmmxt_helper.o vec_helper.o
25
obj-y += gdbstub.o
26
obj-$(TARGET_AARCH64) += cpu64.o translate-a64.o helper-a64.o gdbstub64.o
27
obj-y += crypto_helper.o
28
diff --git a/target/arm/helper.h b/target/arm/helper.h
29
index XXXXXXX..XXXXXXX 100644
30
--- a/target/arm/helper.h
31
+++ b/target/arm/helper.h
32
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_1(neon_rbit_u8, TCG_CALL_NO_RWG_SE, i32, i32)
33
34
DEF_HELPER_3(neon_qdmulh_s16, i32, env, i32, i32)
35
DEF_HELPER_3(neon_qrdmulh_s16, i32, env, i32, i32)
36
+DEF_HELPER_4(neon_qrdmlah_s16, i32, env, i32, i32, i32)
37
+DEF_HELPER_4(neon_qrdmlsh_s16, i32, env, i32, i32, i32)
38
DEF_HELPER_3(neon_qdmulh_s32, i32, env, i32, i32)
39
DEF_HELPER_3(neon_qrdmulh_s32, i32, env, i32, i32)
40
+DEF_HELPER_4(neon_qrdmlah_s32, i32, env, s32, s32, s32)
41
+DEF_HELPER_4(neon_qrdmlsh_s32, i32, env, s32, s32, s32)
42
43
DEF_HELPER_1(neon_narrow_u8, i32, i64)
44
DEF_HELPER_1(neon_narrow_u16, i32, i64)
18
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
45
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
19
index XXXXXXX..XXXXXXX 100644
46
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/translate-a64.c
47
--- a/target/arm/translate-a64.c
21
+++ b/target/arm/translate-a64.c
48
+++ b/target/arm/translate-a64.c
22
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_three_reg_same(DisasContext *s, uint32_t insn)
49
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_three_reg_same_fp16(DisasContext *s,
23
tcg_temp_free_i64(tcg_rd);
50
tcg_temp_free_ptr(fpst);
24
}
51
}
25
52
26
+/* AdvSIMD scalar three same FP16
53
+/* AdvSIMD scalar three same extra
27
+ * 31 30 29 28 24 23 22 21 20 16 15 14 13 11 10 9 5 4 0
54
+ * 31 30 29 28 24 23 22 21 20 16 15 14 11 10 9 5 4 0
28
+ * +-----+---+-----------+---+-----+------+-----+--------+---+----+----+
55
+ * +-----+---+-----------+------+---+------+---+--------+---+----+----+
29
+ * | 0 1 | U | 1 1 1 1 0 | a | 1 0 | Rm | 0 0 | opcode | 1 | Rn | Rd |
56
+ * | 0 1 | U | 1 1 1 1 0 | size | 0 | Rm | 1 | opcode | 1 | Rn | Rd |
30
+ * +-----+---+-----------+---+-----+------+-----+--------+---+----+----+
57
+ * +-----+---+-----------+------+---+------+---+--------+---+----+----+
31
+ * v: 0101 1110 0100 0000 0000 0100 0000 0000 => 5e400400
32
+ * m: 1101 1111 0110 0000 1100 0100 0000 0000 => df60c400
33
+ */
58
+ */
34
+static void disas_simd_scalar_three_reg_same_fp16(DisasContext *s,
59
+static void disas_simd_scalar_three_reg_same_extra(DisasContext *s,
35
+ uint32_t insn)
60
+ uint32_t insn)
36
+{
61
+{
37
+ int rd = extract32(insn, 0, 5);
62
+ int rd = extract32(insn, 0, 5);
38
+ int rn = extract32(insn, 5, 5);
63
+ int rn = extract32(insn, 5, 5);
39
+ int opcode = extract32(insn, 11, 3);
64
+ int opcode = extract32(insn, 11, 4);
40
+ int rm = extract32(insn, 16, 5);
65
+ int rm = extract32(insn, 16, 5);
66
+ int size = extract32(insn, 22, 2);
41
+ bool u = extract32(insn, 29, 1);
67
+ bool u = extract32(insn, 29, 1);
42
+ bool a = extract32(insn, 23, 1);
68
+ TCGv_i32 ele1, ele2, ele3;
43
+ int fpopcode = opcode | (a << 3) | (u << 4);
69
+ TCGv_i64 res;
44
+ TCGv_ptr fpst;
70
+ int feature;
45
+ TCGv_i32 tcg_op1;
71
+
46
+ TCGv_i32 tcg_op2;
72
+ switch (u * 16 + opcode) {
47
+ TCGv_i32 tcg_res;
73
+ case 0x10: /* SQRDMLAH (vector) */
48
+
74
+ case 0x11: /* SQRDMLSH (vector) */
49
+ switch (fpopcode) {
75
+ if (size != 1 && size != 2) {
50
+ case 0x03: /* FMULX */
76
+ unallocated_encoding(s);
51
+ case 0x04: /* FCMEQ (reg) */
77
+ return;
52
+ case 0x07: /* FRECPS */
78
+ }
53
+ case 0x0f: /* FRSQRTS */
79
+ feature = ARM_FEATURE_V8_RDM;
54
+ case 0x14: /* FCMGE (reg) */
55
+ case 0x15: /* FACGE */
56
+ case 0x1a: /* FABD */
57
+ case 0x1c: /* FCMGT (reg) */
58
+ case 0x1d: /* FACGT */
59
+ break;
80
+ break;
60
+ default:
81
+ default:
61
+ unallocated_encoding(s);
82
+ unallocated_encoding(s);
62
+ return;
83
+ return;
63
+ }
84
+ }
64
+
85
+ if (!arm_dc_feature(s, feature)) {
65
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
66
+ unallocated_encoding(s);
86
+ unallocated_encoding(s);
67
+ }
87
+ return;
68
+
88
+ }
69
+ if (!fp_access_check(s)) {
89
+ if (!fp_access_check(s)) {
70
+ return;
90
+ return;
71
+ }
91
+ }
72
+
92
+
73
+ fpst = get_fpstatus_ptr(true);
93
+ /* Do a single operation on the lowest element in the vector.
74
+
94
+ * We use the standard Neon helpers and rely on 0 OP 0 == 0
75
+ tcg_op1 = tcg_temp_new_i32();
95
+ * with no side effects for all these operations.
76
+ tcg_op2 = tcg_temp_new_i32();
96
+ * OPTME: special-purpose helpers would avoid doing some
77
+ tcg_res = tcg_temp_new_i32();
97
+ * unnecessary work in the helper for the 16 bit cases.
78
+
98
+ */
79
+ read_vec_element_i32(s, tcg_op1, rn, 0, MO_16);
99
+ ele1 = tcg_temp_new_i32();
80
+ read_vec_element_i32(s, tcg_op2, rm, 0, MO_16);
100
+ ele2 = tcg_temp_new_i32();
81
+
101
+ ele3 = tcg_temp_new_i32();
82
+ switch (fpopcode) {
102
+
83
+ case 0x03: /* FMULX */
103
+ read_vec_element_i32(s, ele1, rn, 0, size);
84
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst);
104
+ read_vec_element_i32(s, ele2, rm, 0, size);
105
+ read_vec_element_i32(s, ele3, rd, 0, size);
106
+
107
+ switch (opcode) {
108
+ case 0x0: /* SQRDMLAH */
109
+ if (size == 1) {
110
+ gen_helper_neon_qrdmlah_s16(ele3, cpu_env, ele1, ele2, ele3);
111
+ } else {
112
+ gen_helper_neon_qrdmlah_s32(ele3, cpu_env, ele1, ele2, ele3);
113
+ }
85
+ break;
114
+ break;
86
+ case 0x04: /* FCMEQ (reg) */
115
+ case 0x1: /* SQRDMLSH */
87
+ gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst);
116
+ if (size == 1) {
88
+ break;
117
+ gen_helper_neon_qrdmlsh_s16(ele3, cpu_env, ele1, ele2, ele3);
89
+ case 0x07: /* FRECPS */
118
+ } else {
90
+ gen_helper_recpsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
119
+ gen_helper_neon_qrdmlsh_s32(ele3, cpu_env, ele1, ele2, ele3);
91
+ break;
120
+ }
92
+ case 0x0f: /* FRSQRTS */
93
+ gen_helper_rsqrtsf_f16(tcg_res, tcg_op1, tcg_op2, fpst);
94
+ break;
95
+ case 0x14: /* FCMGE (reg) */
96
+ gen_helper_advsimd_cge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
97
+ break;
98
+ case 0x15: /* FACGE */
99
+ gen_helper_advsimd_acge_f16(tcg_res, tcg_op1, tcg_op2, fpst);
100
+ break;
101
+ case 0x1a: /* FABD */
102
+ gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
103
+ tcg_gen_andi_i32(tcg_res, tcg_res, 0x7fff);
104
+ break;
105
+ case 0x1c: /* FCMGT (reg) */
106
+ gen_helper_advsimd_cgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
107
+ break;
108
+ case 0x1d: /* FACGT */
109
+ gen_helper_advsimd_acgt_f16(tcg_res, tcg_op1, tcg_op2, fpst);
110
+ break;
121
+ break;
111
+ default:
122
+ default:
112
+ g_assert_not_reached();
123
+ g_assert_not_reached();
113
+ }
124
+ }
114
+
125
+ tcg_temp_free_i32(ele1);
115
+ write_fp_sreg(s, rd, tcg_res);
126
+ tcg_temp_free_i32(ele2);
116
+
127
+
117
+
128
+ res = tcg_temp_new_i64();
118
+ tcg_temp_free_i32(tcg_res);
129
+ tcg_gen_extu_i32_i64(res, ele3);
119
+ tcg_temp_free_i32(tcg_op1);
130
+ tcg_temp_free_i32(ele3);
120
+ tcg_temp_free_i32(tcg_op2);
131
+
121
+ tcg_temp_free_ptr(fpst);
132
+ write_fp_dreg(s, rd, res);
133
+ tcg_temp_free_i64(res);
122
+}
134
+}
123
+
135
+
124
static void handle_2misc_64(DisasContext *s, int opcode, bool u,
136
static void handle_2misc_64(DisasContext *s, int opcode, bool u,
125
TCGv_i64 tcg_rd, TCGv_i64 tcg_rn,
137
TCGv_i64 tcg_rd, TCGv_i64 tcg_rn,
126
TCGv_i32 tcg_rmode, TCGv_ptr tcg_fpstatus)
138
TCGv_i32 tcg_rmode, TCGv_ptr tcg_fpstatus)
127
@@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = {
139
@@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = {
128
{ 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 },
140
{ 0x0e000800, 0xbf208c00, disas_simd_zip_trn },
129
{ 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 },
141
{ 0x2e000000, 0xbf208400, disas_simd_ext },
130
{ 0x0e780800, 0x8f7e0c00, disas_simd_two_reg_misc_fp16 },
142
{ 0x5e200400, 0xdf200400, disas_simd_scalar_three_reg_same },
131
+ { 0x5e400400, 0xdf60c400, disas_simd_scalar_three_reg_same_fp16 },
143
+ { 0x5e008400, 0xdf208400, disas_simd_scalar_three_reg_same_extra },
132
{ 0x00000000, 0x00000000, NULL }
144
{ 0x5e200000, 0xdf200c00, disas_simd_scalar_three_reg_diff },
133
};
145
{ 0x5e200800, 0xdf3e0c00, disas_simd_scalar_two_reg_misc },
134
146
{ 0x5e300800, 0xdf3e0c00, disas_simd_scalar_pairwise },
147
diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c
148
new file mode 100644
149
index XXXXXXX..XXXXXXX
150
--- /dev/null
151
+++ b/target/arm/vec_helper.c
152
@@ -XXX,XX +XXX,XX @@
153
+/*
154
+ * ARM AdvSIMD / SVE Vector Operations
155
+ *
156
+ * Copyright (c) 2018 Linaro
157
+ *
158
+ * This library is free software; you can redistribute it and/or
159
+ * modify it under the terms of the GNU Lesser General Public
160
+ * License as published by the Free Software Foundation; either
161
+ * version 2 of the License, or (at your option) any later version.
162
+ *
163
+ * This library is distributed in the hope that it will be useful,
164
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
165
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
166
+ * Lesser General Public License for more details.
167
+ *
168
+ * You should have received a copy of the GNU Lesser General Public
169
+ * License along with this library; if not, see <http://www.gnu.org/licenses/>.
170
+ */
171
+
172
+#include "qemu/osdep.h"
173
+#include "cpu.h"
174
+#include "exec/exec-all.h"
175
+#include "exec/helper-proto.h"
176
+#include "tcg/tcg-gvec-desc.h"
177
+
178
+
179
+#define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q
180
+
181
+/* Signed saturating rounding doubling multiply-accumulate high half, 16-bit */
182
+static uint16_t inl_qrdmlah_s16(CPUARMState *env, int16_t src1,
183
+ int16_t src2, int16_t src3)
184
+{
185
+ /* Simplify:
186
+ * = ((a3 << 16) + ((e1 * e2) << 1) + (1 << 15)) >> 16
187
+ * = ((a3 << 15) + (e1 * e2) + (1 << 14)) >> 15
188
+ */
189
+ int32_t ret = (int32_t)src1 * src2;
190
+ ret = ((int32_t)src3 << 15) + ret + (1 << 14);
191
+ ret >>= 15;
192
+ if (ret != (int16_t)ret) {
193
+ SET_QC();
194
+ ret = (ret < 0 ? -0x8000 : 0x7fff);
195
+ }
196
+ return ret;
197
+}
198
+
199
+uint32_t HELPER(neon_qrdmlah_s16)(CPUARMState *env, uint32_t src1,
200
+ uint32_t src2, uint32_t src3)
201
+{
202
+ uint16_t e1 = inl_qrdmlah_s16(env, src1, src2, src3);
203
+ uint16_t e2 = inl_qrdmlah_s16(env, src1 >> 16, src2 >> 16, src3 >> 16);
204
+ return deposit32(e1, 16, 16, e2);
205
+}
206
+
207
+/* Signed saturating rounding doubling multiply-subtract high half, 16-bit */
208
+static uint16_t inl_qrdmlsh_s16(CPUARMState *env, int16_t src1,
209
+ int16_t src2, int16_t src3)
210
+{
211
+ /* Similarly, using subtraction:
212
+ * = ((a3 << 16) - ((e1 * e2) << 1) + (1 << 15)) >> 16
213
+ * = ((a3 << 15) - (e1 * e2) + (1 << 14)) >> 15
214
+ */
215
+ int32_t ret = (int32_t)src1 * src2;
216
+ ret = ((int32_t)src3 << 15) - ret + (1 << 14);
217
+ ret >>= 15;
218
+ if (ret != (int16_t)ret) {
219
+ SET_QC();
220
+ ret = (ret < 0 ? -0x8000 : 0x7fff);
221
+ }
222
+ return ret;
223
+}
224
+
225
+uint32_t HELPER(neon_qrdmlsh_s16)(CPUARMState *env, uint32_t src1,
226
+ uint32_t src2, uint32_t src3)
227
+{
228
+ uint16_t e1 = inl_qrdmlsh_s16(env, src1, src2, src3);
229
+ uint16_t e2 = inl_qrdmlsh_s16(env, src1 >> 16, src2 >> 16, src3 >> 16);
230
+ return deposit32(e1, 16, 16, e2);
231
+}
232
+
233
+/* Signed saturating rounding doubling multiply-accumulate high half, 32-bit */
234
+uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1,
235
+ int32_t src2, int32_t src3)
236
+{
237
+ /* Simplify similarly to int_qrdmlah_s16 above. */
238
+ int64_t ret = (int64_t)src1 * src2;
239
+ ret = ((int64_t)src3 << 31) + ret + (1 << 30);
240
+ ret >>= 31;
241
+ if (ret != (int32_t)ret) {
242
+ SET_QC();
243
+ ret = (ret < 0 ? INT32_MIN : INT32_MAX);
244
+ }
245
+ return ret;
246
+}
247
+
248
+/* Signed saturating rounding doubling multiply-subtract high half, 32-bit */
249
+uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1,
250
+ int32_t src2, int32_t src3)
251
+{
252
+ /* Simplify similarly to int_qrdmlsh_s16 above. */
253
+ int64_t ret = (int64_t)src1 * src2;
254
+ ret = ((int64_t)src3 << 31) - ret + (1 << 30);
255
+ ret >>= 31;
256
+ if (ret != (int32_t)ret) {
257
+ SET_QC();
258
+ ret = (ret < 0 ? INT32_MIN : INT32_MAX);
259
+ }
260
+ return ret;
261
+}
135
--
262
--
136
2.16.2
263
2.16.2
137
264
138
265
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This is the initial decode skeleton for the Advanced SIMD three same
3
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
4
instruction group.
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
5
Message-id: 20180228193125.20577-6-richard.henderson@linaro.org
6
The fprintf is purely to aid debugging as the additional instructions
7
are added. It will be removed once the group is complete.
8
9
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
10
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
11
Message-id: 20180227143852.11175-9-alex.bennee@linaro.org
12
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
13
---
7
---
14
target/arm/translate-a64.c | 73 ++++++++++++++++++++++++++++++++++++++++++++++
8
target/arm/helper.h | 9 +++++
15
1 file changed, 73 insertions(+)
9
target/arm/translate-a64.c | 83 ++++++++++++++++++++++++++++++++++++++++++++++
16
10
target/arm/vec_helper.c | 74 +++++++++++++++++++++++++++++++++++++++++
11
3 files changed, 166 insertions(+)
12
13
diff --git a/target/arm/helper.h b/target/arm/helper.h
14
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/helper.h
16
+++ b/target/arm/helper.h
17
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_2(dc_zva, void, env, i64)
18
DEF_HELPER_FLAGS_2(neon_pmull_64_lo, TCG_CALL_NO_RWG_SE, i64, i64, i64)
19
DEF_HELPER_FLAGS_2(neon_pmull_64_hi, TCG_CALL_NO_RWG_SE, i64, i64, i64)
20
21
+DEF_HELPER_FLAGS_5(gvec_qrdmlah_s16, TCG_CALL_NO_RWG,
22
+ void, ptr, ptr, ptr, ptr, i32)
23
+DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s16, TCG_CALL_NO_RWG,
24
+ void, ptr, ptr, ptr, ptr, i32)
25
+DEF_HELPER_FLAGS_5(gvec_qrdmlah_s32, TCG_CALL_NO_RWG,
26
+ void, ptr, ptr, ptr, ptr, i32)
27
+DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s32, TCG_CALL_NO_RWG,
28
+ void, ptr, ptr, ptr, ptr, i32)
29
+
30
#ifdef TARGET_AARCH64
31
#include "helper-a64.h"
32
#endif
17
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
33
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
18
index XXXXXXX..XXXXXXX 100644
34
index XXXXXXX..XXXXXXX 100644
19
--- a/target/arm/translate-a64.c
35
--- a/target/arm/translate-a64.c
20
+++ b/target/arm/translate-a64.c
36
+++ b/target/arm/translate-a64.c
21
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same(DisasContext *s, uint32_t insn)
37
@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3(DisasContext *s, bool is_q, int rd,
22
}
38
vec_full_reg_size(s), gvec_op);
23
}
39
}
24
40
25
+/*
41
+/* Expand a 3-operand + env pointer operation using
26
+ * Advanced SIMD three same (ARMv8.2 FP16 variants)
42
+ * an out-of-line helper.
27
+ *
28
+ * 31 30 29 28 24 23 22 21 20 16 15 14 13 11 10 9 5 4 0
29
+ * +---+---+---+-----------+---------+------+-----+--------+---+------+------+
30
+ * | 0 | Q | U | 0 1 1 1 0 | a | 1 0 | Rm | 0 0 | opcode | 1 | Rn | Rd |
31
+ * +---+---+---+-----------+---------+------+-----+--------+---+------+------+
32
+ *
33
+ * This includes FMULX, FCMEQ (register), FRECPS, FRSQRTS, FCMGE
34
+ * (register), FACGE, FABD, FCMGT (register) and FACGT.
35
+ *
36
+ */
43
+ */
37
+static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
44
+static void gen_gvec_op3_env(DisasContext *s, bool is_q, int rd,
38
+{
45
+ int rn, int rm, gen_helper_gvec_3_ptr *fn)
39
+ int opcode, fpopcode;
46
+{
40
+ int is_q, u, a, rm, rn, rd;
47
+ tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd),
41
+ int datasize, elements;
48
+ vec_full_reg_offset(s, rn),
42
+ int pass;
49
+ vec_full_reg_offset(s, rm), cpu_env,
43
+ TCGv_ptr fpst;
50
+ is_q ? 16 : 8, vec_full_reg_size(s), 0, fn);
44
+
51
+}
45
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
52
+
53
/* Set ZF and NF based on a 64 bit result. This is alas fiddlier
54
* than the 32 bit equivalent.
55
*/
56
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
57
clear_vec_high(s, is_q, rd);
58
}
59
60
+/* AdvSIMD three same extra
61
+ * 31 30 29 28 24 23 22 21 20 16 15 14 11 10 9 5 4 0
62
+ * +---+---+---+-----------+------+---+------+---+--------+---+----+----+
63
+ * | 0 | Q | U | 0 1 1 1 0 | size | 0 | Rm | 1 | opcode | 1 | Rn | Rd |
64
+ * +---+---+---+-----------+------+---+------+---+--------+---+----+----+
65
+ */
66
+static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
67
+{
68
+ int rd = extract32(insn, 0, 5);
69
+ int rn = extract32(insn, 5, 5);
70
+ int opcode = extract32(insn, 11, 4);
71
+ int rm = extract32(insn, 16, 5);
72
+ int size = extract32(insn, 22, 2);
73
+ bool u = extract32(insn, 29, 1);
74
+ bool is_q = extract32(insn, 30, 1);
75
+ int feature;
76
+
77
+ switch (u * 16 + opcode) {
78
+ case 0x10: /* SQRDMLAH (vector) */
79
+ case 0x11: /* SQRDMLSH (vector) */
80
+ if (size != 1 && size != 2) {
81
+ unallocated_encoding(s);
82
+ return;
83
+ }
84
+ feature = ARM_FEATURE_V8_RDM;
85
+ break;
86
+ default:
46
+ unallocated_encoding(s);
87
+ unallocated_encoding(s);
47
+ return;
88
+ return;
48
+ }
89
+ }
49
+
90
+ if (!arm_dc_feature(s, feature)) {
91
+ unallocated_encoding(s);
92
+ return;
93
+ }
50
+ if (!fp_access_check(s)) {
94
+ if (!fp_access_check(s)) {
51
+ return;
95
+ return;
52
+ }
96
+ }
53
+
97
+
54
+ /* For these floating point ops, the U, a and opcode bits
98
+ switch (opcode) {
55
+ * together indicate the operation.
99
+ case 0x0: /* SQRDMLAH (vector) */
56
+ */
100
+ switch (size) {
57
+ opcode = extract32(insn, 11, 3);
101
+ case 1:
58
+ u = extract32(insn, 29, 1);
102
+ gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlah_s16);
59
+ a = extract32(insn, 23, 1);
103
+ break;
60
+ is_q = extract32(insn, 30, 1);
104
+ case 2:
61
+ rm = extract32(insn, 16, 5);
105
+ gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlah_s32);
62
+ rn = extract32(insn, 5, 5);
106
+ break;
63
+ rd = extract32(insn, 0, 5);
64
+
65
+ fpopcode = opcode | (a << 3) | (u << 4);
66
+ datasize = is_q ? 128 : 64;
67
+ elements = datasize / 16;
68
+
69
+ fpst = get_fpstatus_ptr(true);
70
+
71
+ for (pass = 0; pass < elements; pass++) {
72
+ TCGv_i32 tcg_op1 = tcg_temp_new_i32();
73
+ TCGv_i32 tcg_op2 = tcg_temp_new_i32();
74
+ TCGv_i32 tcg_res = tcg_temp_new_i32();
75
+
76
+ read_vec_element_i32(s, tcg_op1, rn, pass, MO_16);
77
+ read_vec_element_i32(s, tcg_op2, rm, pass, MO_16);
78
+
79
+ switch (fpopcode) {
80
+ default:
107
+ default:
81
+ fprintf(stderr, "%s: insn %#04x, fpop %#2x @ %#" PRIx64 "\n",
82
+ __func__, insn, fpopcode, s->pc);
83
+ g_assert_not_reached();
108
+ g_assert_not_reached();
84
+ }
109
+ }
85
+
110
+ return;
86
+ write_vec_element_i32(s, tcg_res, rd, pass, MO_16);
111
+
87
+ tcg_temp_free_i32(tcg_res);
112
+ case 0x1: /* SQRDMLSH (vector) */
88
+ tcg_temp_free_i32(tcg_op1);
113
+ switch (size) {
89
+ tcg_temp_free_i32(tcg_op2);
114
+ case 1:
90
+ }
115
+ gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlsh_s16);
91
+
116
+ break;
92
+ tcg_temp_free_ptr(fpst);
117
+ case 2:
93
+
118
+ gen_gvec_op3_env(s, is_q, rd, rn, rm, gen_helper_gvec_qrdmlsh_s32);
94
+ clear_vec_high(s, is_q, rd);
119
+ break;
120
+ default:
121
+ g_assert_not_reached();
122
+ }
123
+ return;
124
+
125
+ default:
126
+ g_assert_not_reached();
127
+ }
95
+}
128
+}
96
+
129
+
97
static void handle_2misc_widening(DisasContext *s, int opcode, bool is_q,
130
static void handle_2misc_widening(DisasContext *s, int opcode, bool is_q,
98
int size, int rn, int rd)
131
int size, int rn, int rd)
99
{
132
{
100
@@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = {
133
@@ -XXX,XX +XXX,XX @@ static void disas_crypto_three_reg_imm2(DisasContext *s, uint32_t insn)
101
{ 0xce000000, 0xff808000, disas_crypto_four_reg },
134
static const AArch64DecodeTable data_proc_simd[] = {
102
{ 0xce800000, 0xffe00000, disas_crypto_xar },
135
/* pattern , mask , fn */
103
{ 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 },
136
{ 0x0e200400, 0x9f200400, disas_simd_three_reg_same },
104
+ { 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 },
137
+ { 0x0e008400, 0x9f208400, disas_simd_three_reg_same_extra },
105
{ 0x00000000, 0x00000000, NULL }
138
{ 0x0e200000, 0x9f200c00, disas_simd_three_reg_diff },
106
};
139
{ 0x0e200800, 0x9f3e0c00, disas_simd_two_reg_misc },
107
140
{ 0x0e300800, 0x9f3e0c00, disas_simd_across_lanes },
141
diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c
142
index XXXXXXX..XXXXXXX 100644
143
--- a/target/arm/vec_helper.c
144
+++ b/target/arm/vec_helper.c
145
@@ -XXX,XX +XXX,XX @@
146
147
#define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q
148
149
+static void clear_tail(void *vd, uintptr_t opr_sz, uintptr_t max_sz)
150
+{
151
+ uint64_t *d = vd + opr_sz;
152
+ uintptr_t i;
153
+
154
+ for (i = opr_sz; i < max_sz; i += 8) {
155
+ *d++ = 0;
156
+ }
157
+}
158
+
159
/* Signed saturating rounding doubling multiply-accumulate high half, 16-bit */
160
static uint16_t inl_qrdmlah_s16(CPUARMState *env, int16_t src1,
161
int16_t src2, int16_t src3)
162
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlah_s16)(CPUARMState *env, uint32_t src1,
163
return deposit32(e1, 16, 16, e2);
164
}
165
166
+void HELPER(gvec_qrdmlah_s16)(void *vd, void *vn, void *vm,
167
+ void *ve, uint32_t desc)
168
+{
169
+ uintptr_t opr_sz = simd_oprsz(desc);
170
+ int16_t *d = vd;
171
+ int16_t *n = vn;
172
+ int16_t *m = vm;
173
+ CPUARMState *env = ve;
174
+ uintptr_t i;
175
+
176
+ for (i = 0; i < opr_sz / 2; ++i) {
177
+ d[i] = inl_qrdmlah_s16(env, n[i], m[i], d[i]);
178
+ }
179
+ clear_tail(d, opr_sz, simd_maxsz(desc));
180
+}
181
+
182
/* Signed saturating rounding doubling multiply-subtract high half, 16-bit */
183
static uint16_t inl_qrdmlsh_s16(CPUARMState *env, int16_t src1,
184
int16_t src2, int16_t src3)
185
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlsh_s16)(CPUARMState *env, uint32_t src1,
186
return deposit32(e1, 16, 16, e2);
187
}
188
189
+void HELPER(gvec_qrdmlsh_s16)(void *vd, void *vn, void *vm,
190
+ void *ve, uint32_t desc)
191
+{
192
+ uintptr_t opr_sz = simd_oprsz(desc);
193
+ int16_t *d = vd;
194
+ int16_t *n = vn;
195
+ int16_t *m = vm;
196
+ CPUARMState *env = ve;
197
+ uintptr_t i;
198
+
199
+ for (i = 0; i < opr_sz / 2; ++i) {
200
+ d[i] = inl_qrdmlsh_s16(env, n[i], m[i], d[i]);
201
+ }
202
+ clear_tail(d, opr_sz, simd_maxsz(desc));
203
+}
204
+
205
/* Signed saturating rounding doubling multiply-accumulate high half, 32-bit */
206
uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1,
207
int32_t src2, int32_t src3)
208
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlah_s32)(CPUARMState *env, int32_t src1,
209
return ret;
210
}
211
212
+void HELPER(gvec_qrdmlah_s32)(void *vd, void *vn, void *vm,
213
+ void *ve, uint32_t desc)
214
+{
215
+ uintptr_t opr_sz = simd_oprsz(desc);
216
+ int32_t *d = vd;
217
+ int32_t *n = vn;
218
+ int32_t *m = vm;
219
+ CPUARMState *env = ve;
220
+ uintptr_t i;
221
+
222
+ for (i = 0; i < opr_sz / 4; ++i) {
223
+ d[i] = helper_neon_qrdmlah_s32(env, n[i], m[i], d[i]);
224
+ }
225
+ clear_tail(d, opr_sz, simd_maxsz(desc));
226
+}
227
+
228
/* Signed saturating rounding doubling multiply-subtract high half, 32-bit */
229
uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1,
230
int32_t src2, int32_t src3)
231
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(neon_qrdmlsh_s32)(CPUARMState *env, int32_t src1,
232
}
233
return ret;
234
}
235
+
236
+void HELPER(gvec_qrdmlsh_s32)(void *vd, void *vn, void *vm,
237
+ void *ve, uint32_t desc)
238
+{
239
+ uintptr_t opr_sz = simd_oprsz(desc);
240
+ int32_t *d = vd;
241
+ int32_t *n = vn;
242
+ int32_t *m = vm;
243
+ CPUARMState *env = ve;
244
+ uintptr_t i;
245
+
246
+ for (i = 0; i < opr_sz / 4; ++i) {
247
+ d[i] = helper_neon_qrdmlsh_s32(env, n[i], m[i], d[i]);
248
+ }
249
+ clear_tail(d, opr_sz, simd_maxsz(desc));
250
+}
108
--
251
--
109
2.16.2
252
2.16.2
110
253
111
254
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
3
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
Message-id: 20180227143852.11175-26-alex.bennee@linaro.org
5
Message-id: 20180228193125.20577-7-richard.henderson@linaro.org
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
---
7
---
8
target/arm/helper-a64.h | 1 +
8
target/arm/translate-a64.c | 29 +++++++++++++++++++++++++++++
9
target/arm/helper-a64.c | 13 +++++++++++++
9
1 file changed, 29 insertions(+)
10
target/arm/translate-a64.c | 5 +++++
11
3 files changed, 19 insertions(+)
12
10
13
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
14
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/helper-a64.h
16
+++ b/target/arm/helper-a64.h
17
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr)
18
DEF_HELPER_2(advsimd_rinth, f16, f16, ptr)
19
DEF_HELPER_2(advsimd_f16tosinth, i32, f16, ptr)
20
DEF_HELPER_2(advsimd_f16touinth, i32, f16, ptr)
21
+DEF_HELPER_2(sqrt_f16, f16, f16, ptr)
22
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
23
index XXXXXXX..XXXXXXX 100644
24
--- a/target/arm/helper-a64.c
25
+++ b/target/arm/helper-a64.c
26
@@ -XXX,XX +XXX,XX @@ uint32_t HELPER(advsimd_f16touinth)(float16 a, void *fpstp)
27
}
28
return float16_to_uint16(a, fpst);
29
}
30
+
31
+/*
32
+ * Square Root and Reciprocal square root
33
+ */
34
+
35
+float16 HELPER(sqrt_f16)(float16 a, void *fpstp)
36
+{
37
+ float_status *s = fpstp;
38
+
39
+ return float16_sqrt(a, s);
40
+}
41
+
42
+
43
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
11
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
44
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
45
--- a/target/arm/translate-a64.c
13
--- a/target/arm/translate-a64.c
46
+++ b/target/arm/translate-a64.c
14
+++ b/target/arm/translate-a64.c
47
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
15
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
48
case 0x6f: /* FNEG */
16
case 0x19: /* FMULX */
49
need_fpst = false;
17
is_fp = true;
50
break;
18
break;
51
+ case 0x7f: /* FSQRT (vector) */
19
+ case 0x1d: /* SQRDMLAH */
20
+ case 0x1f: /* SQRDMLSH */
21
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_RDM)) {
22
+ unallocated_encoding(s);
23
+ return;
24
+ }
52
+ break;
25
+ break;
53
default:
26
default:
54
fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop);
27
unallocated_encoding(s);
55
g_assert_not_reached();
28
return;
56
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
29
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
57
case 0x6f: /* FNEG */
30
tcg_op, tcg_idx);
58
tcg_gen_xori_i32(tcg_res, tcg_op, 0x8000);
31
}
59
break;
32
break;
60
+ case 0x7f: /* FSQRT */
33
+ case 0x1d: /* SQRDMLAH */
61
+ gen_helper_sqrt_f16(tcg_res, tcg_op, tcg_fpstatus);
34
+ read_vec_element_i32(s, tcg_res, rd, pass,
35
+ is_scalar ? size : MO_32);
36
+ if (size == 1) {
37
+ gen_helper_neon_qrdmlah_s16(tcg_res, cpu_env,
38
+ tcg_op, tcg_idx, tcg_res);
39
+ } else {
40
+ gen_helper_neon_qrdmlah_s32(tcg_res, cpu_env,
41
+ tcg_op, tcg_idx, tcg_res);
42
+ }
43
+ break;
44
+ case 0x1f: /* SQRDMLSH */
45
+ read_vec_element_i32(s, tcg_res, rd, pass,
46
+ is_scalar ? size : MO_32);
47
+ if (size == 1) {
48
+ gen_helper_neon_qrdmlsh_s16(tcg_res, cpu_env,
49
+ tcg_op, tcg_idx, tcg_res);
50
+ } else {
51
+ gen_helper_neon_qrdmlsh_s32(tcg_res, cpu_env,
52
+ tcg_op, tcg_idx, tcg_res);
53
+ }
62
+ break;
54
+ break;
63
default:
55
default:
64
g_assert_not_reached();
56
g_assert_not_reached();
65
}
57
}
66
--
58
--
67
2.16.2
59
2.16.2
68
60
69
61
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This covers all the floating point convert operations.
3
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
4
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Message-id: 20180228193125.20577-8-richard.henderson@linaro.org
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180227143852.11175-19-alex.bennee@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
7
---
10
target/arm/helper-a64.h | 2 ++
8
target/arm/translate.c | 86 +++++++++++++++++++++++++++++++++++++++-----------
11
target/arm/helper-a64.c | 32 +++++++++++++++++
9
1 file changed, 67 insertions(+), 19 deletions(-)
12
target/arm/translate-a64.c | 85 +++++++++++++++++++++++++++++++++++++++++++++-
13
3 files changed, 118 insertions(+), 1 deletion(-)
14
10
15
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
11
diff --git a/target/arm/translate.c b/target/arm/translate.c
16
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
17
--- a/target/arm/helper-a64.h
13
--- a/target/arm/translate.c
18
+++ b/target/arm/helper-a64.h
14
+++ b/target/arm/translate.c
19
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_mulx2h, i32, i32, i32, ptr)
15
@@ -XXX,XX +XXX,XX @@
20
DEF_HELPER_4(advsimd_muladd2h, i32, i32, i32, i32, ptr)
16
#include "disas/disas.h"
21
DEF_HELPER_2(advsimd_rinth_exact, f16, f16, ptr)
17
#include "exec/exec-all.h"
22
DEF_HELPER_2(advsimd_rinth, f16, f16, ptr)
18
#include "tcg-op.h"
23
+DEF_HELPER_2(advsimd_f16tosinth, i32, f16, ptr)
19
+#include "tcg-op-gvec.h"
24
+DEF_HELPER_2(advsimd_f16touinth, i32, f16, ptr)
20
#include "qemu/log.h"
25
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
21
#include "qemu/bitops.h"
26
index XXXXXXX..XXXXXXX 100644
22
#include "arm_ldst.h"
27
--- a/target/arm/helper-a64.c
23
@@ -XXX,XX +XXX,XX @@ static void gen_neon_narrow_op(int op, int u, int size,
28
+++ b/target/arm/helper-a64.c
24
#define NEON_3R_VPMAX 20
29
@@ -XXX,XX +XXX,XX @@ float16 HELPER(advsimd_rinth)(float16 x, void *fp_status)
25
#define NEON_3R_VPMIN 21
30
26
#define NEON_3R_VQDMULH_VQRDMULH 22
31
return ret;
27
-#define NEON_3R_VPADD 23
32
}
28
+#define NEON_3R_VPADD_VQRDMLAH 23
29
#define NEON_3R_SHA 24 /* SHA1C,SHA1P,SHA1M,SHA1SU0,SHA256H{2},SHA256SU1 */
30
-#define NEON_3R_VFM 25 /* VFMA, VFMS : float fused multiply-add */
31
+#define NEON_3R_VFM_VQRDMLSH 25 /* VFMA, VFMS, VQRDMLSH */
32
#define NEON_3R_FLOAT_ARITH 26 /* float VADD, VSUB, VPADD, VABD */
33
#define NEON_3R_FLOAT_MULTIPLY 27 /* float VMLA, VMLS, VMUL */
34
#define NEON_3R_FLOAT_CMP 28 /* float VCEQ, VCGE, VCGT */
35
@@ -XXX,XX +XXX,XX @@ static const uint8_t neon_3r_sizes[] = {
36
[NEON_3R_VPMAX] = 0x7,
37
[NEON_3R_VPMIN] = 0x7,
38
[NEON_3R_VQDMULH_VQRDMULH] = 0x6,
39
- [NEON_3R_VPADD] = 0x7,
40
+ [NEON_3R_VPADD_VQRDMLAH] = 0x7,
41
[NEON_3R_SHA] = 0xf, /* size field encodes op type */
42
- [NEON_3R_VFM] = 0x5, /* size bit 1 encodes op */
43
+ [NEON_3R_VFM_VQRDMLSH] = 0x7, /* For VFM, size bit 1 encodes op */
44
[NEON_3R_FLOAT_ARITH] = 0x5, /* size bit 1 encodes op */
45
[NEON_3R_FLOAT_MULTIPLY] = 0x5, /* size bit 1 encodes op */
46
[NEON_3R_FLOAT_CMP] = 0x5, /* size bit 1 encodes op */
47
@@ -XXX,XX +XXX,XX @@ static const uint8_t neon_2rm_sizes[] = {
48
[NEON_2RM_VCVT_UF] = 0x4,
49
};
50
33
+
51
+
34
+/*
52
+/* Expand v8.1 simd helper. */
35
+ * Half-precision floating point conversion functions
53
+static int do_v81_helper(DisasContext *s, gen_helper_gvec_3_ptr *fn,
36
+ *
54
+ int q, int rd, int rn, int rm)
37
+ * There are a multitude of conversion functions with various
38
+ * different rounding modes. This is dealt with by the calling code
39
+ * setting the mode appropriately before calling the helper.
40
+ */
41
+
42
+uint32_t HELPER(advsimd_f16tosinth)(float16 a, void *fpstp)
43
+{
55
+{
44
+ float_status *fpst = fpstp;
56
+ if (arm_dc_feature(s, ARM_FEATURE_V8_RDM)) {
45
+
57
+ int opr_sz = (1 + q) * 8;
46
+ /* Invalid if we are passed a NaN */
58
+ tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd),
47
+ if (float16_is_any_nan(a)) {
59
+ vfp_reg_offset(1, rn),
48
+ float_raise(float_flag_invalid, fpst);
60
+ vfp_reg_offset(1, rm), cpu_env,
61
+ opr_sz, opr_sz, 0, fn);
49
+ return 0;
62
+ return 0;
50
+ }
63
+ }
51
+ return float16_to_int16(a, fpst);
64
+ return 1;
52
+}
65
+}
53
+
66
+
54
+uint32_t HELPER(advsimd_f16touinth)(float16 a, void *fpstp)
67
/* Translate a NEON data processing instruction. Return nonzero if the
55
+{
68
instruction is invalid.
56
+ float_status *fpst = fpstp;
69
We process data in a mixture of 32-bit and 64-bit chunks.
70
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
71
if (q && ((rd | rn | rm) & 1)) {
72
return 1;
73
}
74
- /*
75
- * The SHA-1/SHA-256 3-register instructions require special treatment
76
- * here, as their size field is overloaded as an op type selector, and
77
- * they all consume their input in a single pass.
78
- */
79
- if (op == NEON_3R_SHA) {
80
+ switch (op) {
81
+ case NEON_3R_SHA:
82
+ /* The SHA-1/SHA-256 3-register instructions require special
83
+ * treatment here, as their size field is overloaded as an
84
+ * op type selector, and they all consume their input in a
85
+ * single pass.
86
+ */
87
if (!q) {
88
return 1;
89
}
90
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
91
tcg_temp_free_ptr(ptr2);
92
tcg_temp_free_ptr(ptr3);
93
return 0;
57
+
94
+
58
+ /* Invalid if we are passed a NaN */
95
+ case NEON_3R_VPADD_VQRDMLAH:
59
+ if (float16_is_any_nan(a)) {
96
+ if (!u) {
60
+ float_raise(float_flag_invalid, fpst);
97
+ break; /* VPADD */
61
+ return 0;
98
+ }
62
+ }
99
+ /* VQRDMLAH */
63
+ return float16_to_uint16(a, fpst);
100
+ switch (size) {
64
+}
101
+ case 1:
65
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
102
+ return do_v81_helper(s, gen_helper_gvec_qrdmlah_s16,
66
index XXXXXXX..XXXXXXX 100644
103
+ q, rd, rn, rm);
67
--- a/target/arm/translate-a64.c
104
+ case 2:
68
+++ b/target/arm/translate-a64.c
105
+ return do_v81_helper(s, gen_helper_gvec_qrdmlah_s32,
69
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
106
+ q, rd, rn, rm);
70
only_in_vector = true;
107
+ }
71
/* current rounding mode */
108
+ return 1;
72
break;
73
+ case 0x1a: /* FCVTNS */
74
+ need_rmode = true;
75
+ rmode = FPROUNDING_TIEEVEN;
76
+ break;
77
+ case 0x1b: /* FCVTMS */
78
+ need_rmode = true;
79
+ rmode = FPROUNDING_NEGINF;
80
+ break;
81
+ case 0x1c: /* FCVTAS */
82
+ need_rmode = true;
83
+ rmode = FPROUNDING_TIEAWAY;
84
+ break;
85
+ case 0x3a: /* FCVTPS */
86
+ need_rmode = true;
87
+ rmode = FPROUNDING_POSINF;
88
+ break;
89
+ case 0x3b: /* FCVTZS */
90
+ need_rmode = true;
91
+ rmode = FPROUNDING_ZERO;
92
+ break;
93
+ case 0x5a: /* FCVTNU */
94
+ need_rmode = true;
95
+ rmode = FPROUNDING_TIEEVEN;
96
+ break;
97
+ case 0x5b: /* FCVTMU */
98
+ need_rmode = true;
99
+ rmode = FPROUNDING_NEGINF;
100
+ break;
101
+ case 0x5c: /* FCVTAU */
102
+ need_rmode = true;
103
+ rmode = FPROUNDING_TIEAWAY;
104
+ break;
105
+ case 0x7a: /* FCVTPU */
106
+ need_rmode = true;
107
+ rmode = FPROUNDING_POSINF;
108
+ break;
109
+ case 0x7b: /* FCVTZU */
110
+ need_rmode = true;
111
+ rmode = FPROUNDING_ZERO;
112
+ break;
113
default:
114
fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop);
115
g_assert_not_reached();
116
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
117
}
118
119
if (is_scalar) {
120
- /* no operations yet */
121
+ TCGv_i32 tcg_op = tcg_temp_new_i32();
122
+ TCGv_i32 tcg_res = tcg_temp_new_i32();
123
+
109
+
124
+ read_vec_element_i32(s, tcg_op, rn, 0, MO_16);
110
+ case NEON_3R_VFM_VQRDMLSH:
125
+
111
+ if (!u) {
126
+ switch (fpop) {
112
+ /* VFM, VFMS */
127
+ case 0x1a: /* FCVTNS */
113
+ if (size == 1) {
128
+ case 0x1b: /* FCVTMS */
114
+ return 1;
129
+ case 0x1c: /* FCVTAS */
115
+ }
130
+ case 0x3a: /* FCVTPS */
131
+ case 0x3b: /* FCVTZS */
132
+ gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus);
133
+ break;
134
+ case 0x5a: /* FCVTNU */
135
+ case 0x5b: /* FCVTMU */
136
+ case 0x5c: /* FCVTAU */
137
+ case 0x7a: /* FCVTPU */
138
+ case 0x7b: /* FCVTZU */
139
+ gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus);
140
+ break;
141
+ default:
142
+ g_assert_not_reached();
143
+ }
144
+
145
+ /* limit any sign extension going on */
146
+ tcg_gen_andi_i32(tcg_res, tcg_res, 0xffff);
147
+ write_fp_sreg(s, rd, tcg_res);
148
+
149
+ tcg_temp_free_i32(tcg_res);
150
+ tcg_temp_free_i32(tcg_op);
151
} else {
152
for (pass = 0; pass < (is_q ? 8 : 4); pass++) {
153
TCGv_i32 tcg_op = tcg_temp_new_i32();
154
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
155
read_vec_element_i32(s, tcg_op, rn, pass, MO_16);
156
157
switch (fpop) {
158
+ case 0x1a: /* FCVTNS */
159
+ case 0x1b: /* FCVTMS */
160
+ case 0x1c: /* FCVTAS */
161
+ case 0x3a: /* FCVTPS */
162
+ case 0x3b: /* FCVTZS */
163
+ gen_helper_advsimd_f16tosinth(tcg_res, tcg_op, tcg_fpstatus);
164
+ break;
116
+ break;
165
+ case 0x5a: /* FCVTNU */
117
+ }
166
+ case 0x5b: /* FCVTMU */
118
+ /* VQRDMLSH */
167
+ case 0x5c: /* FCVTAU */
119
+ switch (size) {
168
+ case 0x7a: /* FCVTPU */
120
+ case 1:
169
+ case 0x7b: /* FCVTZU */
121
+ return do_v81_helper(s, gen_helper_gvec_qrdmlsh_s16,
170
+ gen_helper_advsimd_f16touinth(tcg_res, tcg_op, tcg_fpstatus);
122
+ q, rd, rn, rm);
171
+ break;
123
+ case 2:
172
case 0x18: /* FRINTN */
124
+ return do_v81_helper(s, gen_helper_gvec_qrdmlsh_s32,
173
case 0x19: /* FRINTM */
125
+ q, rd, rn, rm);
174
case 0x38: /* FRINTP */
126
+ }
127
+ return 1;
128
}
129
if (size == 3 && op != NEON_3R_LOGIC) {
130
/* 64-bit element instructions. */
131
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
132
rm = rtmp;
133
}
134
break;
135
- case NEON_3R_VPADD:
136
- if (u) {
137
- return 1;
138
- }
139
- /* Fall through */
140
+ case NEON_3R_VPADD_VQRDMLAH:
141
case NEON_3R_VPMAX:
142
case NEON_3R_VPMIN:
143
pairwise = 1;
144
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
145
return 1;
146
}
147
break;
148
- case NEON_3R_VFM:
149
- if (!arm_dc_feature(s, ARM_FEATURE_VFP4) || u) {
150
+ case NEON_3R_VFM_VQRDMLSH:
151
+ if (!arm_dc_feature(s, ARM_FEATURE_VFP4)) {
152
return 1;
153
}
154
break;
155
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
156
}
157
}
158
break;
159
- case NEON_3R_VPADD:
160
+ case NEON_3R_VPADD_VQRDMLAH:
161
switch (size) {
162
case 0: gen_helper_neon_padd_u8(tmp, tmp, tmp2); break;
163
case 1: gen_helper_neon_padd_u16(tmp, tmp, tmp2); break;
164
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
165
}
166
}
167
break;
168
- case NEON_3R_VFM:
169
+ case NEON_3R_VFM_VQRDMLSH:
170
{
171
/* VFMA, VFMS: fused multiply-add */
172
TCGv_ptr fpstatus = get_fpstatus_ptr(1);
175
--
173
--
176
2.16.2
174
2.16.2
177
175
178
176
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
3
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
Message-id: 20180227143852.11175-12-alex.bennee@linaro.org
5
Message-id: 20180228193125.20577-9-richard.henderson@linaro.org
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
---
7
---
8
target/arm/helper-a64.h | 2 ++
8
target/arm/translate.c | 46 ++++++++++++++++++++++++++++++++++++++++++----
9
target/arm/helper-a64.c | 24 ++++++++++++++++++++++++
9
1 file changed, 42 insertions(+), 4 deletions(-)
10
target/arm/translate-a64.c | 15 +++++++++++++++
11
3 files changed, 41 insertions(+)
12
10
13
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
11
diff --git a/target/arm/translate.c b/target/arm/translate.c
14
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
15
--- a/target/arm/helper-a64.h
13
--- a/target/arm/translate.c
16
+++ b/target/arm/helper-a64.h
14
+++ b/target/arm/translate.c
17
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(advsimd_cge_f16, i32, f16, f16, ptr)
15
@@ -XXX,XX +XXX,XX @@ static const char *regnames[] =
18
DEF_HELPER_3(advsimd_cgt_f16, i32, f16, f16, ptr)
16
{ "r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7",
19
DEF_HELPER_3(advsimd_acge_f16, i32, f16, f16, ptr)
17
"r8", "r9", "r10", "r11", "r12", "r13", "r14", "pc" };
20
DEF_HELPER_3(advsimd_acgt_f16, i32, f16, f16, ptr)
18
21
+DEF_HELPER_3(advsimd_mulxh, f16, f16, f16, ptr)
19
+/* Function prototypes for gen_ functions calling Neon helpers. */
22
+DEF_HELPER_4(advsimd_muladdh, f16, f16, f16, f16, ptr)
20
+typedef void NeonGenThreeOpEnvFn(TCGv_i32, TCGv_env, TCGv_i32,
23
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
21
+ TCGv_i32, TCGv_i32);
24
index XXXXXXX..XXXXXXX 100644
25
--- a/target/arm/helper-a64.c
26
+++ b/target/arm/helper-a64.c
27
@@ -XXX,XX +XXX,XX @@ ADVSIMD_HALFOP(max)
28
ADVSIMD_HALFOP(minnum)
29
ADVSIMD_HALFOP(maxnum)
30
31
+/* Data processing - scalar floating-point and advanced SIMD */
32
+float16 HELPER(advsimd_mulxh)(float16 a, float16 b, void *fpstp)
33
+{
34
+ float_status *fpst = fpstp;
35
+
22
+
36
+ a = float16_squash_input_denormal(a, fpst);
23
/* initialize TCG globals. */
37
+ b = float16_squash_input_denormal(b, fpst);
24
void arm_translate_init(void)
25
{
26
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
27
}
28
neon_store_reg64(cpu_V0, rd + pass);
29
}
30
-
31
-
32
break;
33
- default: /* 14 and 15 are RESERVED */
34
- return 1;
35
+ case 14: /* VQRDMLAH scalar */
36
+ case 15: /* VQRDMLSH scalar */
37
+ {
38
+ NeonGenThreeOpEnvFn *fn;
38
+
39
+
39
+ if ((float16_is_zero(a) && float16_is_infinity(b)) ||
40
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_RDM)) {
40
+ (float16_is_infinity(a) && float16_is_zero(b))) {
41
+ return 1;
41
+ /* 2.0 with the sign bit set to sign(A) XOR sign(B) */
42
+ }
42
+ return make_float16((1U << 14) |
43
+ if (u && ((rd | rn) & 1)) {
43
+ ((float16_val(a) ^ float16_val(b)) & (1U << 15)));
44
+ return 1;
44
+ }
45
+ }
45
+ return float16_mul(a, b, fpst);
46
+ if (op == 14) {
46
+}
47
+ if (size == 1) {
48
+ fn = gen_helper_neon_qrdmlah_s16;
49
+ } else {
50
+ fn = gen_helper_neon_qrdmlah_s32;
51
+ }
52
+ } else {
53
+ if (size == 1) {
54
+ fn = gen_helper_neon_qrdmlsh_s16;
55
+ } else {
56
+ fn = gen_helper_neon_qrdmlsh_s32;
57
+ }
58
+ }
47
+
59
+
48
+/* fused multiply-accumulate */
60
+ tmp2 = neon_get_scalar(size, rm);
49
+float16 HELPER(advsimd_muladdh)(float16 a, float16 b, float16 c, void *fpstp)
61
+ for (pass = 0; pass < (u ? 4 : 2); pass++) {
50
+{
62
+ tmp = neon_load_reg(rn, pass);
51
+ float_status *fpst = fpstp;
63
+ tmp3 = neon_load_reg(rd, pass);
52
+ return float16_muladd(a, b, c, 0, fpst);
64
+ fn(tmp, cpu_env, tmp, tmp2, tmp3);
53
+}
65
+ tcg_temp_free_i32(tmp3);
54
+
66
+ neon_store_reg(rd, pass, tmp);
55
/*
67
+ }
56
* Floating point comparisons produce an integer result. Softfloat
68
+ tcg_temp_free_i32(tmp2);
57
* routines return float_relation types which we convert to the 0/-1
69
+ }
58
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
70
+ break;
59
index XXXXXXX..XXXXXXX 100644
71
+ default:
60
--- a/target/arm/translate-a64.c
72
+ g_assert_not_reached();
61
+++ b/target/arm/translate-a64.c
73
}
62
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
74
}
63
case 0x0: /* FMAXNM */
75
} else { /* size == 3 */
64
gen_helper_advsimd_maxnumh(tcg_res, tcg_op1, tcg_op2, fpst);
65
break;
66
+ case 0x1: /* FMLA */
67
+ read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
68
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
69
+ fpst);
70
+ break;
71
case 0x2: /* FADD */
72
gen_helper_advsimd_addh(tcg_res, tcg_op1, tcg_op2, fpst);
73
break;
74
+ case 0x3: /* FMULX */
75
+ gen_helper_advsimd_mulxh(tcg_res, tcg_op1, tcg_op2, fpst);
76
+ break;
77
case 0x4: /* FCMEQ */
78
gen_helper_advsimd_ceq_f16(tcg_res, tcg_op1, tcg_op2, fpst);
79
break;
80
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_fp16(DisasContext *s, uint32_t insn)
81
case 0x8: /* FMINNM */
82
gen_helper_advsimd_minnumh(tcg_res, tcg_op1, tcg_op2, fpst);
83
break;
84
+ case 0x9: /* FMLS */
85
+ /* As usual for ARM, separate negation for fused multiply-add */
86
+ tcg_gen_xori_i32(tcg_op1, tcg_op1, 0x8000);
87
+ read_vec_element_i32(s, tcg_res, rd, pass, MO_16);
88
+ gen_helper_advsimd_muladdh(tcg_res, tcg_op1, tcg_op2, tcg_res,
89
+ fpst);
90
+ break;
91
case 0xa: /* FSUB */
92
gen_helper_advsimd_subh(tcg_res, tcg_op1, tcg_op2, fpst);
93
break;
94
--
76
--
95
2.16.2
77
2.16.2
96
78
97
79
diff view generated by jsdifflib
1
Now we have implemented FP16 we can enable it for the "any" CPU.
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
3
Enable it for the "any" CPU used by *-linux-user.
4
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
4
5
[PMM: split out from an earlier patch in the series]
5
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
6
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
7
Message-id: 20180228193125.20577-10-richard.henderson@linaro.org
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
7
---
9
---
10
target/arm/cpu.c | 1 +
8
target/arm/cpu64.c | 1 +
11
target/arm/cpu64.c | 1 +
9
1 file changed, 1 insertion(+)
12
2 files changed, 2 insertions(+)
10
13
14
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
15
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/cpu.c
17
+++ b/target/arm/cpu.c
18
@@ -XXX,XX +XXX,XX @@ static void arm_any_initfn(Object *obj)
19
set_feature(&cpu->env, ARM_FEATURE_V8_SHA256);
20
set_feature(&cpu->env, ARM_FEATURE_V8_PMULL);
21
set_feature(&cpu->env, ARM_FEATURE_CRC);
22
+ set_feature(&cpu->env, ARM_FEATURE_V8_RDM);
23
cpu->midr = 0xffffffff;
24
}
25
#endif
11
diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
26
diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
12
index XXXXXXX..XXXXXXX 100644
27
index XXXXXXX..XXXXXXX 100644
13
--- a/target/arm/cpu64.c
28
--- a/target/arm/cpu64.c
14
+++ b/target/arm/cpu64.c
29
+++ b/target/arm/cpu64.c
15
@@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj)
30
@@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj)
16
set_feature(&cpu->env, ARM_FEATURE_V8_SM4);
31
set_feature(&cpu->env, ARM_FEATURE_V8_SM4);
17
set_feature(&cpu->env, ARM_FEATURE_V8_PMULL);
32
set_feature(&cpu->env, ARM_FEATURE_V8_PMULL);
18
set_feature(&cpu->env, ARM_FEATURE_CRC);
33
set_feature(&cpu->env, ARM_FEATURE_CRC);
19
+ set_feature(&cpu->env, ARM_FEATURE_V8_FP16);
34
+ set_feature(&cpu->env, ARM_FEATURE_V8_RDM);
35
set_feature(&cpu->env, ARM_FEATURE_V8_FP16);
20
cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */
36
cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */
21
cpu->dcz_blocksize = 7; /* 512 bytes */
37
cpu->dcz_blocksize = 7; /* 512 bytes */
22
}
23
--
38
--
24
2.16.2
39
2.16.2
25
40
26
41
diff view generated by jsdifflib
1
Set the appropriate Linux hwcap bits to tell the guest binary if we
1
From: Richard Henderson <richard.henderson@linaro.org>
2
have implemented half-precision floating point support.
3
2
3
Not enabled anywhere yet.
4
5
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
6
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180228193125.20577-11-richard.henderson@linaro.org
4
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
5
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
---
9
---
7
linux-user/elfload.c | 2 ++
10
target/arm/cpu.h | 1 +
8
1 file changed, 2 insertions(+)
11
linux-user/elfload.c | 1 +
12
2 files changed, 2 insertions(+)
9
13
14
diff --git a/target/arm/cpu.h b/target/arm/cpu.h
15
index XXXXXXX..XXXXXXX 100644
16
--- a/target/arm/cpu.h
17
+++ b/target/arm/cpu.h
18
@@ -XXX,XX +XXX,XX @@ enum arm_features {
19
ARM_FEATURE_V8_SM4, /* implements SM4 part of v8 Crypto Extensions */
20
ARM_FEATURE_V8_RDM, /* implements v8.1 simd round multiply */
21
ARM_FEATURE_V8_FP16, /* implements v8.2 half-precision float */
22
+ ARM_FEATURE_V8_FCMA, /* has complex number part of v8.3 extensions. */
23
};
24
25
static inline int arm_feature(CPUARMState *env, int feature)
10
diff --git a/linux-user/elfload.c b/linux-user/elfload.c
26
diff --git a/linux-user/elfload.c b/linux-user/elfload.c
11
index XXXXXXX..XXXXXXX 100644
27
index XXXXXXX..XXXXXXX 100644
12
--- a/linux-user/elfload.c
28
--- a/linux-user/elfload.c
13
+++ b/linux-user/elfload.c
29
+++ b/linux-user/elfload.c
14
@@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void)
30
@@ -XXX,XX +XXX,XX @@ static uint32_t get_elf_hwcap(void)
15
GET_FEATURE(ARM_FEATURE_V8_SM3, ARM_HWCAP_A64_SM3);
31
GET_FEATURE(ARM_FEATURE_V8_FP16,
16
GET_FEATURE(ARM_FEATURE_V8_SM4, ARM_HWCAP_A64_SM4);
32
ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP);
17
GET_FEATURE(ARM_FEATURE_V8_SHA512, ARM_HWCAP_A64_SHA512);
33
GET_FEATURE(ARM_FEATURE_V8_RDM, ARM_HWCAP_A64_ASIMDRDM);
18
+ GET_FEATURE(ARM_FEATURE_V8_FP16,
34
+ GET_FEATURE(ARM_FEATURE_V8_FCMA, ARM_HWCAP_A64_FCMA);
19
+ ARM_HWCAP_A64_FPHP | ARM_HWCAP_A64_ASIMDHP);
20
#undef GET_FEATURE
35
#undef GET_FEATURE
21
36
22
return hwcaps;
37
return hwcaps;
23
--
38
--
24
2.16.2
39
2.16.2
25
40
26
41
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
I've re-factored the handle_simd_intfp_conv helper to properly handle
3
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
4
half-precision as well as call plain conversion helpers when we are
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
not doing fixed point conversion.
5
Message-id: 20180228193125.20577-12-richard.henderson@linaro.org
6
7
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Message-id: 20180227143852.11175-21-alex.bennee@linaro.org
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
7
---
12
target/arm/helper.h | 10 ++++
8
target/arm/helper.h | 7 ++++
13
target/arm/helper.c | 4 ++
9
target/arm/translate-a64.c | 48 ++++++++++++++++++++++-
14
target/arm/translate-a64.c | 122 ++++++++++++++++++++++++++++++++++-----------
10
target/arm/vec_helper.c | 97 ++++++++++++++++++++++++++++++++++++++++++++++
15
3 files changed, 108 insertions(+), 28 deletions(-)
11
3 files changed, 151 insertions(+), 1 deletion(-)
16
12
17
diff --git a/target/arm/helper.h b/target/arm/helper.h
13
diff --git a/target/arm/helper.h b/target/arm/helper.h
18
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
19
--- a/target/arm/helper.h
15
--- a/target/arm/helper.h
20
+++ b/target/arm/helper.h
16
+++ b/target/arm/helper.h
21
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_cmped, void, f64, f64, env)
17
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_qrdmlah_s32, TCG_CALL_NO_RWG,
22
DEF_HELPER_2(vfp_fcvtds, f64, f32, env)
18
DEF_HELPER_FLAGS_5(gvec_qrdmlsh_s32, TCG_CALL_NO_RWG,
23
DEF_HELPER_2(vfp_fcvtsd, f32, f64, env)
19
void, ptr, ptr, ptr, ptr, i32)
24
20
25
+DEF_HELPER_2(vfp_uitoh, f16, i32, ptr)
21
+DEF_HELPER_FLAGS_5(gvec_fcaddh, TCG_CALL_NO_RWG,
26
DEF_HELPER_2(vfp_uitos, f32, i32, ptr)
22
+ void, ptr, ptr, ptr, ptr, i32)
27
DEF_HELPER_2(vfp_uitod, f64, i32, ptr)
23
+DEF_HELPER_FLAGS_5(gvec_fcadds, TCG_CALL_NO_RWG,
28
+DEF_HELPER_2(vfp_sitoh, f16, i32, ptr)
24
+ void, ptr, ptr, ptr, ptr, i32)
29
DEF_HELPER_2(vfp_sitos, f32, i32, ptr)
25
+DEF_HELPER_FLAGS_5(gvec_fcaddd, TCG_CALL_NO_RWG,
30
DEF_HELPER_2(vfp_sitod, f64, i32, ptr)
26
+ void, ptr, ptr, ptr, ptr, i32)
31
27
+
32
+DEF_HELPER_2(vfp_touih, i32, f16, ptr)
28
#ifdef TARGET_AARCH64
33
DEF_HELPER_2(vfp_touis, i32, f32, ptr)
29
#include "helper-a64.h"
34
DEF_HELPER_2(vfp_touid, i32, f64, ptr)
30
#endif
35
+DEF_HELPER_2(vfp_touizh, i32, f16, ptr)
36
DEF_HELPER_2(vfp_touizs, i32, f32, ptr)
37
DEF_HELPER_2(vfp_touizd, i32, f64, ptr)
38
+DEF_HELPER_2(vfp_tosih, i32, f16, ptr)
39
DEF_HELPER_2(vfp_tosis, i32, f32, ptr)
40
DEF_HELPER_2(vfp_tosid, i32, f64, ptr)
41
+DEF_HELPER_2(vfp_tosizh, i32, f16, ptr)
42
DEF_HELPER_2(vfp_tosizs, i32, f32, ptr)
43
DEF_HELPER_2(vfp_tosizd, i32, f64, ptr)
44
45
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_toshd_round_to_zero, i64, f64, i32, ptr)
46
DEF_HELPER_3(vfp_tosld_round_to_zero, i64, f64, i32, ptr)
47
DEF_HELPER_3(vfp_touhd_round_to_zero, i64, f64, i32, ptr)
48
DEF_HELPER_3(vfp_tould_round_to_zero, i64, f64, i32, ptr)
49
+DEF_HELPER_3(vfp_toulh, i32, f16, i32, ptr)
50
+DEF_HELPER_3(vfp_toslh, i32, f16, i32, ptr)
51
DEF_HELPER_3(vfp_toshs, i32, f32, i32, ptr)
52
DEF_HELPER_3(vfp_tosls, i32, f32, i32, ptr)
53
DEF_HELPER_3(vfp_tosqs, i64, f32, i32, ptr)
54
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_sqtod, f64, i64, i32, ptr)
55
DEF_HELPER_3(vfp_uhtod, f64, i64, i32, ptr)
56
DEF_HELPER_3(vfp_ultod, f64, i64, i32, ptr)
57
DEF_HELPER_3(vfp_uqtod, f64, i64, i32, ptr)
58
+DEF_HELPER_3(vfp_sltoh, f16, i32, i32, ptr)
59
+DEF_HELPER_3(vfp_ultoh, f16, i32, i32, ptr)
60
61
DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, ptr)
62
DEF_HELPER_FLAGS_2(set_neon_rmode, TCG_CALL_NO_RWG, i32, i32, env)
63
diff --git a/target/arm/helper.c b/target/arm/helper.c
64
index XXXXXXX..XXXXXXX 100644
65
--- a/target/arm/helper.c
66
+++ b/target/arm/helper.c
67
@@ -XXX,XX +XXX,XX @@ CONV_ITOF(vfp_##name##to##p, fsz, sign) \
68
CONV_FTOI(vfp_to##name##p, fsz, sign, ) \
69
CONV_FTOI(vfp_to##name##z##p, fsz, sign, _round_to_zero)
70
71
+FLOAT_CONVS(si, h, 16, )
72
FLOAT_CONVS(si, s, 32, )
73
FLOAT_CONVS(si, d, 64, )
74
+FLOAT_CONVS(ui, h, 16, u)
75
FLOAT_CONVS(ui, s, 32, u)
76
FLOAT_CONVS(ui, d, 64, u)
77
78
@@ -XXX,XX +XXX,XX @@ VFP_CONV_FIX_A64(sq, s, 32, 64, int64)
79
VFP_CONV_FIX(uh, s, 32, 32, uint16)
80
VFP_CONV_FIX(ul, s, 32, 32, uint32)
81
VFP_CONV_FIX_A64(uq, s, 32, 64, uint64)
82
+VFP_CONV_FIX_A64(sl, h, 16, 32, int32)
83
+VFP_CONV_FIX_A64(ul, h, 16, 32, uint32)
84
#undef VFP_CONV_FIX
85
#undef VFP_CONV_FIX_FLOAT
86
#undef VFP_CONV_FLOAT_FIX_ROUND
87
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
31
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
88
index XXXXXXX..XXXXXXX 100644
32
index XXXXXXX..XXXXXXX 100644
89
--- a/target/arm/translate-a64.c
33
--- a/target/arm/translate-a64.c
90
+++ b/target/arm/translate-a64.c
34
+++ b/target/arm/translate-a64.c
91
@@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn,
35
@@ -XXX,XX +XXX,XX @@ static void gen_gvec_op3_env(DisasContext *s, bool is_q, int rd,
92
int elements, int is_signed,
36
is_q ? 16 : 8, vec_full_reg_size(s), 0, fn);
93
int fracbits, int size)
37
}
94
{
38
95
- bool is_double = size == 3 ? true : false;
39
+/* Expand a 3-operand + fpstatus pointer + simd data value operation using
96
- TCGv_ptr tcg_fpst = get_fpstatus_ptr(false);
40
+ * an out-of-line helper.
97
- TCGv_i32 tcg_shift = tcg_const_i32(fracbits);
41
+ */
98
- TCGv_i64 tcg_int = tcg_temp_new_i64();
42
+static void gen_gvec_op3_fpst(DisasContext *s, bool is_q, int rd, int rn,
99
+ TCGv_ptr tcg_fpst = get_fpstatus_ptr(size == MO_16);
43
+ int rm, bool is_fp16, int data,
100
+ TCGv_i32 tcg_shift = NULL;
44
+ gen_helper_gvec_3_ptr *fn)
101
+
45
+{
102
TCGMemOp mop = size | (is_signed ? MO_SIGN : 0);
46
+ TCGv_ptr fpst = get_fpstatus_ptr(is_fp16);
103
int pass;
47
+ tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd),
104
48
+ vec_full_reg_offset(s, rn),
105
- for (pass = 0; pass < elements; pass++) {
49
+ vec_full_reg_offset(s, rm), fpst,
106
- read_vec_element(s, tcg_int, rn, pass, mop);
50
+ is_q ? 16 : 8, vec_full_reg_size(s), data, fn);
107
+ if (fracbits || size == MO_64) {
51
+ tcg_temp_free_ptr(fpst);
108
+ tcg_shift = tcg_const_i32(fracbits);
52
+}
109
+ }
53
+
110
+
54
/* Set ZF and NF based on a 64 bit result. This is alas fiddlier
111
+ if (size == MO_64) {
55
* than the 32 bit equivalent.
112
+ TCGv_i64 tcg_int64 = tcg_temp_new_i64();
56
*/
113
+ TCGv_i64 tcg_double = tcg_temp_new_i64();
57
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
114
+
58
int size = extract32(insn, 22, 2);
115
+ for (pass = 0; pass < elements; pass++) {
59
bool u = extract32(insn, 29, 1);
116
+ read_vec_element(s, tcg_int64, rn, pass, mop);
60
bool is_q = extract32(insn, 30, 1);
117
61
- int feature;
118
- if (is_double) {
62
+ int feature, rot;
119
- TCGv_i64 tcg_double = tcg_temp_new_i64();
63
120
if (is_signed) {
64
switch (u * 16 + opcode) {
121
- gen_helper_vfp_sqtod(tcg_double, tcg_int,
65
case 0x10: /* SQRDMLAH (vector) */
122
+ gen_helper_vfp_sqtod(tcg_double, tcg_int64,
66
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
123
tcg_shift, tcg_fpst);
124
} else {
125
- gen_helper_vfp_uqtod(tcg_double, tcg_int,
126
+ gen_helper_vfp_uqtod(tcg_double, tcg_int64,
127
tcg_shift, tcg_fpst);
128
}
129
if (elements == 1) {
130
@@ -XXX,XX +XXX,XX @@ static void handle_simd_intfp_conv(DisasContext *s, int rd, int rn,
131
} else {
132
write_vec_element(s, tcg_double, rd, pass, MO_64);
133
}
134
- tcg_temp_free_i64(tcg_double);
135
- } else {
136
- TCGv_i32 tcg_single = tcg_temp_new_i32();
137
- if (is_signed) {
138
- gen_helper_vfp_sqtos(tcg_single, tcg_int,
139
- tcg_shift, tcg_fpst);
140
- } else {
141
- gen_helper_vfp_uqtos(tcg_single, tcg_int,
142
- tcg_shift, tcg_fpst);
143
- }
144
- if (elements == 1) {
145
- write_fp_sreg(s, rd, tcg_single);
146
- } else {
147
- write_vec_element_i32(s, tcg_single, rd, pass, MO_32);
148
- }
149
- tcg_temp_free_i32(tcg_single);
150
}
67
}
151
+
68
feature = ARM_FEATURE_V8_RDM;
152
+ tcg_temp_free_i64(tcg_int64);
69
break;
153
+ tcg_temp_free_i64(tcg_double);
70
+ case 0xc: /* FCADD, #90 */
154
+
71
+ case 0xe: /* FCADD, #270 */
155
+ } else {
72
+ if (size == 0
156
+ TCGv_i32 tcg_int32 = tcg_temp_new_i32();
73
+ || (size == 1 && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))
157
+ TCGv_i32 tcg_float = tcg_temp_new_i32();
74
+ || (size == 3 && !is_q)) {
158
+
75
+ unallocated_encoding(s);
159
+ for (pass = 0; pass < elements; pass++) {
160
+ read_vec_element_i32(s, tcg_int32, rn, pass, mop);
161
+
162
+ switch (size) {
163
+ case MO_32:
164
+ if (fracbits) {
165
+ if (is_signed) {
166
+ gen_helper_vfp_sltos(tcg_float, tcg_int32,
167
+ tcg_shift, tcg_fpst);
168
+ } else {
169
+ gen_helper_vfp_ultos(tcg_float, tcg_int32,
170
+ tcg_shift, tcg_fpst);
171
+ }
172
+ } else {
173
+ if (is_signed) {
174
+ gen_helper_vfp_sitos(tcg_float, tcg_int32, tcg_fpst);
175
+ } else {
176
+ gen_helper_vfp_uitos(tcg_float, tcg_int32, tcg_fpst);
177
+ }
178
+ }
179
+ break;
180
+ case MO_16:
181
+ if (fracbits) {
182
+ if (is_signed) {
183
+ gen_helper_vfp_sltoh(tcg_float, tcg_int32,
184
+ tcg_shift, tcg_fpst);
185
+ } else {
186
+ gen_helper_vfp_ultoh(tcg_float, tcg_int32,
187
+ tcg_shift, tcg_fpst);
188
+ }
189
+ } else {
190
+ if (is_signed) {
191
+ gen_helper_vfp_sitoh(tcg_float, tcg_int32, tcg_fpst);
192
+ } else {
193
+ gen_helper_vfp_uitoh(tcg_float, tcg_int32, tcg_fpst);
194
+ }
195
+ }
196
+ break;
197
+ default:
198
+ g_assert_not_reached();
199
+ }
200
+
201
+ if (elements == 1) {
202
+ write_fp_sreg(s, rd, tcg_float);
203
+ } else {
204
+ write_vec_element_i32(s, tcg_float, rd, pass, size);
205
+ }
206
+ }
207
+
208
+ tcg_temp_free_i32(tcg_int32);
209
+ tcg_temp_free_i32(tcg_float);
210
}
211
212
- tcg_temp_free_i64(tcg_int);
213
tcg_temp_free_ptr(tcg_fpst);
214
- tcg_temp_free_i32(tcg_shift);
215
+ if (tcg_shift) {
216
+ tcg_temp_free_i32(tcg_shift);
217
+ }
218
219
clear_vec_high(s, elements << size == 16, rd);
220
}
221
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
222
rn = extract32(insn, 5, 5);
223
224
switch (fpop) {
225
+ case 0x1d: /* SCVTF */
226
+ case 0x5d: /* UCVTF */
227
+ {
228
+ int elements;
229
+
230
+ if (is_scalar) {
231
+ elements = 1;
232
+ } else {
233
+ elements = (is_q ? 8 : 4);
234
+ }
235
+
236
+ if (!fp_access_check(s)) {
237
+ return;
76
+ return;
238
+ }
77
+ }
239
+ handle_simd_intfp_conv(s, rd, rn, elements, !u, 0, MO_16);
78
+ feature = ARM_FEATURE_V8_FCMA;
79
+ break;
80
default:
81
unallocated_encoding(s);
82
return;
83
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
84
}
85
return;
86
87
+ case 0xc: /* FCADD, #90 */
88
+ case 0xe: /* FCADD, #270 */
89
+ rot = extract32(opcode, 1, 1);
90
+ switch (size) {
91
+ case 1:
92
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot,
93
+ gen_helper_gvec_fcaddh);
94
+ break;
95
+ case 2:
96
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot,
97
+ gen_helper_gvec_fcadds);
98
+ break;
99
+ case 3:
100
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, size == 1, rot,
101
+ gen_helper_gvec_fcaddd);
102
+ break;
103
+ default:
104
+ g_assert_not_reached();
105
+ }
240
+ return;
106
+ return;
107
+
108
default:
109
g_assert_not_reached();
110
}
111
diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c
112
index XXXXXXX..XXXXXXX 100644
113
--- a/target/arm/vec_helper.c
114
+++ b/target/arm/vec_helper.c
115
@@ -XXX,XX +XXX,XX @@
116
#include "exec/exec-all.h"
117
#include "exec/helper-proto.h"
118
#include "tcg/tcg-gvec-desc.h"
119
+#include "fpu/softfloat.h"
120
121
122
+/* Note that vector data is stored in host-endian 64-bit chunks,
123
+ so addressing units smaller than that needs a host-endian fixup. */
124
+#ifdef HOST_WORDS_BIGENDIAN
125
+#define H1(x) ((x) ^ 7)
126
+#define H2(x) ((x) ^ 3)
127
+#define H4(x) ((x) ^ 1)
128
+#else
129
+#define H1(x) (x)
130
+#define H2(x) (x)
131
+#define H4(x) (x)
132
+#endif
133
+
134
#define SET_QC() env->vfp.xregs[ARM_VFP_FPSCR] |= CPSR_Q
135
136
static void clear_tail(void *vd, uintptr_t opr_sz, uintptr_t max_sz)
137
@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_qrdmlsh_s32)(void *vd, void *vn, void *vm,
138
}
139
clear_tail(d, opr_sz, simd_maxsz(desc));
140
}
141
+
142
+void HELPER(gvec_fcaddh)(void *vd, void *vn, void *vm,
143
+ void *vfpst, uint32_t desc)
144
+{
145
+ uintptr_t opr_sz = simd_oprsz(desc);
146
+ float16 *d = vd;
147
+ float16 *n = vn;
148
+ float16 *m = vm;
149
+ float_status *fpst = vfpst;
150
+ uint32_t neg_real = extract32(desc, SIMD_DATA_SHIFT, 1);
151
+ uint32_t neg_imag = neg_real ^ 1;
152
+ uintptr_t i;
153
+
154
+ /* Shift boolean to the sign bit so we can xor to negate. */
155
+ neg_real <<= 15;
156
+ neg_imag <<= 15;
157
+
158
+ for (i = 0; i < opr_sz / 2; i += 2) {
159
+ float16 e0 = n[H2(i)];
160
+ float16 e1 = m[H2(i + 1)] ^ neg_imag;
161
+ float16 e2 = n[H2(i + 1)];
162
+ float16 e3 = m[H2(i)] ^ neg_real;
163
+
164
+ d[H2(i)] = float16_add(e0, e1, fpst);
165
+ d[H2(i + 1)] = float16_add(e2, e3, fpst);
241
+ }
166
+ }
242
break;
167
+ clear_tail(d, opr_sz, simd_maxsz(desc));
243
case 0x2c: /* FCMGT (zero) */
168
+}
244
case 0x2d: /* FCMEQ (zero) */
169
+
170
+void HELPER(gvec_fcadds)(void *vd, void *vn, void *vm,
171
+ void *vfpst, uint32_t desc)
172
+{
173
+ uintptr_t opr_sz = simd_oprsz(desc);
174
+ float32 *d = vd;
175
+ float32 *n = vn;
176
+ float32 *m = vm;
177
+ float_status *fpst = vfpst;
178
+ uint32_t neg_real = extract32(desc, SIMD_DATA_SHIFT, 1);
179
+ uint32_t neg_imag = neg_real ^ 1;
180
+ uintptr_t i;
181
+
182
+ /* Shift boolean to the sign bit so we can xor to negate. */
183
+ neg_real <<= 31;
184
+ neg_imag <<= 31;
185
+
186
+ for (i = 0; i < opr_sz / 4; i += 2) {
187
+ float32 e0 = n[H4(i)];
188
+ float32 e1 = m[H4(i + 1)] ^ neg_imag;
189
+ float32 e2 = n[H4(i + 1)];
190
+ float32 e3 = m[H4(i)] ^ neg_real;
191
+
192
+ d[H4(i)] = float32_add(e0, e1, fpst);
193
+ d[H4(i + 1)] = float32_add(e2, e3, fpst);
194
+ }
195
+ clear_tail(d, opr_sz, simd_maxsz(desc));
196
+}
197
+
198
+void HELPER(gvec_fcaddd)(void *vd, void *vn, void *vm,
199
+ void *vfpst, uint32_t desc)
200
+{
201
+ uintptr_t opr_sz = simd_oprsz(desc);
202
+ float64 *d = vd;
203
+ float64 *n = vn;
204
+ float64 *m = vm;
205
+ float_status *fpst = vfpst;
206
+ uint64_t neg_real = extract64(desc, SIMD_DATA_SHIFT, 1);
207
+ uint64_t neg_imag = neg_real ^ 1;
208
+ uintptr_t i;
209
+
210
+ /* Shift boolean to the sign bit so we can xor to negate. */
211
+ neg_real <<= 63;
212
+ neg_imag <<= 63;
213
+
214
+ for (i = 0; i < opr_sz / 8; i += 2) {
215
+ float64 e0 = n[i];
216
+ float64 e1 = m[i + 1] ^ neg_imag;
217
+ float64 e2 = n[i + 1];
218
+ float64 e3 = m[i] ^ neg_real;
219
+
220
+ d[i] = float64_add(e0, e1, fpst);
221
+ d[i + 1] = float64_add(e2, e3, fpst);
222
+ }
223
+ clear_tail(d, opr_sz, simd_maxsz(desc));
224
+}
245
--
225
--
246
2.16.2
226
2.16.2
247
227
248
228
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This implements the half-precision variants of the across vector
3
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
4
reduction operations. This involves a re-factor of the reduction code
4
Message-id: 20180228193125.20577-13-richard.henderson@linaro.org
5
which more closely matches the ARM ARM order (and handles 8 element
5
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
reductions).
6
[PMM: renamed e1/e2/e3/e4 to use the same naming as the version
7
of the pseudocode in the Arm ARM]
8
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
9
---
10
target/arm/helper.h | 11 ++++
11
target/arm/translate-a64.c | 94 +++++++++++++++++++++++++---
12
target/arm/vec_helper.c | 149 +++++++++++++++++++++++++++++++++++++++++++++
13
3 files changed, 246 insertions(+), 8 deletions(-)
7
14
8
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
15
diff --git a/target/arm/helper.h b/target/arm/helper.h
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
10
Message-id: 20180227143852.11175-7-alex.bennee@linaro.org
11
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
12
---
13
target/arm/helper-a64.h | 4 ++
14
target/arm/helper-a64.c | 18 ++++++
15
target/arm/translate-a64.c | 140 ++++++++++++++++++++++++++++-----------------
16
3 files changed, 109 insertions(+), 53 deletions(-)
17
18
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
19
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/helper-a64.h
17
--- a/target/arm/helper.h
21
+++ b/target/arm/helper-a64.h
18
+++ b/target/arm/helper.h
22
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_4(paired_cmpxchg64_le_parallel, TCG_CALL_NO_WG,
19
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_5(gvec_fcadds, TCG_CALL_NO_RWG,
23
DEF_HELPER_FLAGS_4(paired_cmpxchg64_be, TCG_CALL_NO_WG, i64, env, i64, i64, i64)
20
DEF_HELPER_FLAGS_5(gvec_fcaddd, TCG_CALL_NO_RWG,
24
DEF_HELPER_FLAGS_4(paired_cmpxchg64_be_parallel, TCG_CALL_NO_WG,
21
void, ptr, ptr, ptr, ptr, i32)
25
i64, env, i64, i64, i64)
22
26
+DEF_HELPER_FLAGS_3(advsimd_maxh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
23
+DEF_HELPER_FLAGS_5(gvec_fcmlah, TCG_CALL_NO_RWG,
27
+DEF_HELPER_FLAGS_3(advsimd_minh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
24
+ void, ptr, ptr, ptr, ptr, i32)
28
+DEF_HELPER_FLAGS_3(advsimd_maxnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
25
+DEF_HELPER_FLAGS_5(gvec_fcmlah_idx, TCG_CALL_NO_RWG,
29
+DEF_HELPER_FLAGS_3(advsimd_minnumh, TCG_CALL_NO_RWG, f16, f16, f16, ptr)
26
+ void, ptr, ptr, ptr, ptr, i32)
30
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
27
+DEF_HELPER_FLAGS_5(gvec_fcmlas, TCG_CALL_NO_RWG,
31
index XXXXXXX..XXXXXXX 100644
28
+ void, ptr, ptr, ptr, ptr, i32)
32
--- a/target/arm/helper-a64.c
29
+DEF_HELPER_FLAGS_5(gvec_fcmlas_idx, TCG_CALL_NO_RWG,
33
+++ b/target/arm/helper-a64.c
30
+ void, ptr, ptr, ptr, ptr, i32)
34
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_be_parallel)(CPUARMState *env, uint64_t addr,
31
+DEF_HELPER_FLAGS_5(gvec_fcmlad, TCG_CALL_NO_RWG,
35
{
32
+ void, ptr, ptr, ptr, ptr, i32)
36
return do_paired_cmpxchg64_be(env, addr, new_lo, new_hi, true, GETPC());
33
+
37
}
34
#ifdef TARGET_AARCH64
38
+
35
#include "helper-a64.h"
39
+/*
36
#endif
40
+ * AdvSIMD half-precision
41
+ */
42
+
43
+#define ADVSIMD_HELPER(name, suffix) HELPER(glue(glue(advsimd_, name), suffix))
44
+
45
+#define ADVSIMD_HALFOP(name) \
46
+float16 ADVSIMD_HELPER(name, h)(float16 a, float16 b, void *fpstp) \
47
+{ \
48
+ float_status *fpst = fpstp; \
49
+ return float16_ ## name(a, b, fpst); \
50
+}
51
+
52
+ADVSIMD_HALFOP(min)
53
+ADVSIMD_HALFOP(max)
54
+ADVSIMD_HALFOP(minnum)
55
+ADVSIMD_HALFOP(maxnum)
56
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
37
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
57
index XXXXXXX..XXXXXXX 100644
38
index XXXXXXX..XXXXXXX 100644
58
--- a/target/arm/translate-a64.c
39
--- a/target/arm/translate-a64.c
59
+++ b/target/arm/translate-a64.c
40
+++ b/target/arm/translate-a64.c
60
@@ -XXX,XX +XXX,XX @@ static void disas_simd_zip_trn(DisasContext *s, uint32_t insn)
41
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
61
tcg_temp_free_i64(tcg_resh);
42
}
62
}
43
feature = ARM_FEATURE_V8_RDM;
63
44
break;
64
-static void do_minmaxop(DisasContext *s, TCGv_i32 tcg_elt1, TCGv_i32 tcg_elt2,
45
+ case 0x8: /* FCMLA, #0 */
65
- int opc, bool is_min, TCGv_ptr fpst)
46
+ case 0x9: /* FCMLA, #90 */
66
+/*
47
+ case 0xa: /* FCMLA, #180 */
67
+ * do_reduction_op helper
48
+ case 0xb: /* FCMLA, #270 */
68
+ *
49
case 0xc: /* FCADD, #90 */
69
+ * This mirrors the Reduce() pseudocode in the ARM ARM. It is
50
case 0xe: /* FCADD, #270 */
70
+ * important for correct NaN propagation that we do these
51
if (size == 0
71
+ * operations in exactly the order specified by the pseudocode.
52
@@ -XXX,XX +XXX,XX @@ static void disas_simd_three_reg_same_extra(DisasContext *s, uint32_t insn)
72
+ *
53
}
73
+ * This is a recursive function, TCG temps should be freed by the
54
return;
74
+ * calling function once it is done with the values.
55
75
+ */
56
+ case 0x8: /* FCMLA, #0 */
76
+static TCGv_i32 do_reduction_op(DisasContext *s, int fpopcode, int rn,
57
+ case 0x9: /* FCMLA, #90 */
77
+ int esize, int size, int vmap, TCGv_ptr fpst)
58
+ case 0xa: /* FCMLA, #180 */
78
{
59
+ case 0xb: /* FCMLA, #270 */
79
- /* Helper function for disas_simd_across_lanes: do a single precision
60
+ rot = extract32(opcode, 0, 2);
80
- * min/max operation on the specified two inputs,
61
+ switch (size) {
81
- * and return the result in tcg_elt1.
62
+ case 1:
82
- */
63
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, true, rot,
83
- if (opc == 0xc) {
64
+ gen_helper_gvec_fcmlah);
84
- if (is_min) {
65
+ break;
85
- gen_helper_vfp_minnums(tcg_elt1, tcg_elt1, tcg_elt2, fpst);
66
+ case 2:
86
- } else {
67
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, false, rot,
87
- gen_helper_vfp_maxnums(tcg_elt1, tcg_elt1, tcg_elt2, fpst);
68
+ gen_helper_gvec_fcmlas);
88
- }
69
+ break;
89
+ if (esize == size) {
70
+ case 3:
90
+ int element;
71
+ gen_gvec_op3_fpst(s, is_q, rd, rn, rm, false, rot,
91
+ TCGMemOp msize = esize == 16 ? MO_16 : MO_32;
72
+ gen_helper_gvec_fcmlad);
92
+ TCGv_i32 tcg_elem;
93
+
94
+ /* We should have one register left here */
95
+ assert(ctpop8(vmap) == 1);
96
+ element = ctz32(vmap);
97
+ assert(element < 8);
98
+
99
+ tcg_elem = tcg_temp_new_i32();
100
+ read_vec_element_i32(s, tcg_elem, rn, element, msize);
101
+ return tcg_elem;
102
} else {
103
- assert(opc == 0xf);
104
- if (is_min) {
105
- gen_helper_vfp_mins(tcg_elt1, tcg_elt1, tcg_elt2, fpst);
106
- } else {
107
- gen_helper_vfp_maxs(tcg_elt1, tcg_elt1, tcg_elt2, fpst);
108
+ int bits = size / 2;
109
+ int shift = ctpop8(vmap) / 2;
110
+ int vmap_lo = (vmap >> shift) & vmap;
111
+ int vmap_hi = (vmap & ~vmap_lo);
112
+ TCGv_i32 tcg_hi, tcg_lo, tcg_res;
113
+
114
+ tcg_hi = do_reduction_op(s, fpopcode, rn, esize, bits, vmap_hi, fpst);
115
+ tcg_lo = do_reduction_op(s, fpopcode, rn, esize, bits, vmap_lo, fpst);
116
+ tcg_res = tcg_temp_new_i32();
117
+
118
+ switch (fpopcode) {
119
+ case 0x0c: /* fmaxnmv half-precision */
120
+ gen_helper_advsimd_maxnumh(tcg_res, tcg_lo, tcg_hi, fpst);
121
+ break;
122
+ case 0x0f: /* fmaxv half-precision */
123
+ gen_helper_advsimd_maxh(tcg_res, tcg_lo, tcg_hi, fpst);
124
+ break;
125
+ case 0x1c: /* fminnmv half-precision */
126
+ gen_helper_advsimd_minnumh(tcg_res, tcg_lo, tcg_hi, fpst);
127
+ break;
128
+ case 0x1f: /* fminv half-precision */
129
+ gen_helper_advsimd_minh(tcg_res, tcg_lo, tcg_hi, fpst);
130
+ break;
131
+ case 0x2c: /* fmaxnmv */
132
+ gen_helper_vfp_maxnums(tcg_res, tcg_lo, tcg_hi, fpst);
133
+ break;
134
+ case 0x2f: /* fmaxv */
135
+ gen_helper_vfp_maxs(tcg_res, tcg_lo, tcg_hi, fpst);
136
+ break;
137
+ case 0x3c: /* fminnmv */
138
+ gen_helper_vfp_minnums(tcg_res, tcg_lo, tcg_hi, fpst);
139
+ break;
140
+ case 0x3f: /* fminv */
141
+ gen_helper_vfp_mins(tcg_res, tcg_lo, tcg_hi, fpst);
142
+ break;
73
+ break;
143
+ default:
74
+ default:
144
+ g_assert_not_reached();
75
+ g_assert_not_reached();
145
}
76
+ }
146
+
77
+ return;
147
+ tcg_temp_free_i32(tcg_hi);
78
+
148
+ tcg_temp_free_i32(tcg_lo);
79
case 0xc: /* FCADD, #90 */
149
+ return tcg_res;
80
case 0xe: /* FCADD, #270 */
150
}
81
rot = extract32(opcode, 1, 1);
151
}
82
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
152
83
int rn = extract32(insn, 5, 5);
153
@@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn)
84
int rd = extract32(insn, 0, 5);
85
bool is_long = false;
86
- bool is_fp = false;
87
+ int is_fp = 0;
88
bool is_fp16 = false;
89
int index;
90
TCGv_ptr fpst;
91
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
92
case 0x05: /* FMLS */
93
case 0x09: /* FMUL */
94
case 0x19: /* FMULX */
95
- is_fp = true;
96
+ is_fp = 1;
154
break;
97
break;
155
case 0xc: /* FMAXNMV, FMINNMV */
98
case 0x1d: /* SQRDMLAH */
156
case 0xf: /* FMAXV, FMINV */
99
case 0x1f: /* SQRDMLSH */
157
- if (!is_u || !is_q || extract32(size, 0, 1)) {
100
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
158
- unallocated_encoding(s);
101
return;
159
- return;
102
}
160
- }
103
break;
161
- /* Bit 1 of size field encodes min vs max, and actual size is always
104
+ case 0x11: /* FCMLA #0 */
162
- * 32 bits: adjust the size variable so following code can rely on it
105
+ case 0x13: /* FCMLA #90 */
163
+ /* Bit 1 of size field encodes min vs max and the actual size
106
+ case 0x15: /* FCMLA #180 */
164
+ * depends on the encoding of the U bit. If not set (and FP16
107
+ case 0x17: /* FCMLA #270 */
165
+ * enabled) then we do half-precision float instead of single
108
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA)) {
166
+ * precision.
167
*/
168
is_min = extract32(size, 1, 1);
169
is_fp = true;
170
- size = 2;
171
+ if (!is_u && arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
172
+ size = 1;
173
+ } else if (!is_u || !is_q || extract32(size, 0, 1)) {
174
+ unallocated_encoding(s);
109
+ unallocated_encoding(s);
175
+ return;
110
+ return;
176
+ } else {
177
+ size = 2;
178
+ }
111
+ }
179
break;
112
+ is_fp = 2;
113
+ break;
180
default:
114
default:
181
unallocated_encoding(s);
115
unallocated_encoding(s);
182
@@ -XXX,XX +XXX,XX @@ static void disas_simd_across_lanes(DisasContext *s, uint32_t insn)
116
return;
183
184
}
185
} else {
186
- /* Floating point ops which work on 32 bit (single) intermediates.
187
+ /* Floating point vector reduction ops which work across 32
188
+ * bit (single) or 16 bit (half-precision) intermediates.
189
* Note that correct NaN propagation requires that we do these
190
* operations in exactly the order specified by the pseudocode.
191
*/
192
- TCGv_i32 tcg_elt1 = tcg_temp_new_i32();
193
- TCGv_i32 tcg_elt2 = tcg_temp_new_i32();
194
- TCGv_i32 tcg_elt3 = tcg_temp_new_i32();
195
- TCGv_ptr fpst = get_fpstatus_ptr(false);
196
-
197
- assert(esize == 32);
198
- assert(elements == 4);
199
-
200
- read_vec_element(s, tcg_elt, rn, 0, MO_32);
201
- tcg_gen_extrl_i64_i32(tcg_elt1, tcg_elt);
202
- read_vec_element(s, tcg_elt, rn, 1, MO_32);
203
- tcg_gen_extrl_i64_i32(tcg_elt2, tcg_elt);
204
-
205
- do_minmaxop(s, tcg_elt1, tcg_elt2, opcode, is_min, fpst);
206
-
207
- read_vec_element(s, tcg_elt, rn, 2, MO_32);
208
- tcg_gen_extrl_i64_i32(tcg_elt2, tcg_elt);
209
- read_vec_element(s, tcg_elt, rn, 3, MO_32);
210
- tcg_gen_extrl_i64_i32(tcg_elt3, tcg_elt);
211
-
212
- do_minmaxop(s, tcg_elt2, tcg_elt3, opcode, is_min, fpst);
213
-
214
- do_minmaxop(s, tcg_elt1, tcg_elt2, opcode, is_min, fpst);
215
-
216
- tcg_gen_extu_i32_i64(tcg_res, tcg_elt1);
217
- tcg_temp_free_i32(tcg_elt1);
218
- tcg_temp_free_i32(tcg_elt2);
219
- tcg_temp_free_i32(tcg_elt3);
220
+ TCGv_ptr fpst = get_fpstatus_ptr(size == MO_16);
221
+ int fpopcode = opcode | is_min << 4 | is_u << 5;
222
+ int vmap = (1 << elements) - 1;
223
+ TCGv_i32 tcg_res32 = do_reduction_op(s, fpopcode, rn, esize,
224
+ (is_q ? 128 : 64), vmap, fpst);
225
+ tcg_gen_extu_i32_i64(tcg_res, tcg_res32);
226
+ tcg_temp_free_i32(tcg_res32);
227
tcg_temp_free_ptr(fpst);
228
}
117
}
229
118
119
- if (is_fp) {
120
+ switch (is_fp) {
121
+ case 1: /* normal fp */
122
/* convert insn encoded size to TCGMemOp size */
123
switch (size) {
124
case 0: /* half-precision */
125
- if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
126
- unallocated_encoding(s);
127
- return;
128
- }
129
size = MO_16;
130
+ is_fp16 = true;
131
break;
132
case MO_32: /* single precision */
133
case MO_64: /* double precision */
134
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
135
unallocated_encoding(s);
136
return;
137
}
138
- } else {
139
+ break;
140
+
141
+ case 2: /* complex fp */
142
+ /* Each indexable element is a complex pair. */
143
+ size <<= 1;
144
+ switch (size) {
145
+ case MO_32:
146
+ if (h && !is_q) {
147
+ unallocated_encoding(s);
148
+ return;
149
+ }
150
+ is_fp16 = true;
151
+ break;
152
+ case MO_64:
153
+ break;
154
+ default:
155
+ unallocated_encoding(s);
156
+ return;
157
+ }
158
+ break;
159
+
160
+ default: /* integer */
161
switch (size) {
162
case MO_8:
163
case MO_64:
164
unallocated_encoding(s);
165
return;
166
}
167
+ break;
168
+ }
169
+ if (is_fp16 && !arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
170
+ unallocated_encoding(s);
171
+ return;
172
}
173
174
/* Given TCGMemOp size, adjust register and indexing. */
175
@@ -XXX,XX +XXX,XX @@ static void disas_simd_indexed(DisasContext *s, uint32_t insn)
176
fpst = NULL;
177
}
178
179
+ switch (16 * u + opcode) {
180
+ case 0x11: /* FCMLA #0 */
181
+ case 0x13: /* FCMLA #90 */
182
+ case 0x15: /* FCMLA #180 */
183
+ case 0x17: /* FCMLA #270 */
184
+ tcg_gen_gvec_3_ptr(vec_full_reg_offset(s, rd),
185
+ vec_full_reg_offset(s, rn),
186
+ vec_reg_offset(s, rm, index, size), fpst,
187
+ is_q ? 16 : 8, vec_full_reg_size(s),
188
+ extract32(insn, 13, 2), /* rot */
189
+ size == MO_64
190
+ ? gen_helper_gvec_fcmlas_idx
191
+ : gen_helper_gvec_fcmlah_idx);
192
+ tcg_temp_free_ptr(fpst);
193
+ return;
194
+ }
195
+
196
if (size == 3) {
197
TCGv_i64 tcg_idx = tcg_temp_new_i64();
198
int pass;
199
diff --git a/target/arm/vec_helper.c b/target/arm/vec_helper.c
200
index XXXXXXX..XXXXXXX 100644
201
--- a/target/arm/vec_helper.c
202
+++ b/target/arm/vec_helper.c
203
@@ -XXX,XX +XXX,XX @@ void HELPER(gvec_fcaddd)(void *vd, void *vn, void *vm,
204
}
205
clear_tail(d, opr_sz, simd_maxsz(desc));
206
}
207
+
208
+void HELPER(gvec_fcmlah)(void *vd, void *vn, void *vm,
209
+ void *vfpst, uint32_t desc)
210
+{
211
+ uintptr_t opr_sz = simd_oprsz(desc);
212
+ float16 *d = vd;
213
+ float16 *n = vn;
214
+ float16 *m = vm;
215
+ float_status *fpst = vfpst;
216
+ intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1);
217
+ uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1);
218
+ uint32_t neg_real = flip ^ neg_imag;
219
+ uintptr_t i;
220
+
221
+ /* Shift boolean to the sign bit so we can xor to negate. */
222
+ neg_real <<= 15;
223
+ neg_imag <<= 15;
224
+
225
+ for (i = 0; i < opr_sz / 2; i += 2) {
226
+ float16 e2 = n[H2(i + flip)];
227
+ float16 e1 = m[H2(i + flip)] ^ neg_real;
228
+ float16 e4 = e2;
229
+ float16 e3 = m[H2(i + 1 - flip)] ^ neg_imag;
230
+
231
+ d[H2(i)] = float16_muladd(e2, e1, d[H2(i)], 0, fpst);
232
+ d[H2(i + 1)] = float16_muladd(e4, e3, d[H2(i + 1)], 0, fpst);
233
+ }
234
+ clear_tail(d, opr_sz, simd_maxsz(desc));
235
+}
236
+
237
+void HELPER(gvec_fcmlah_idx)(void *vd, void *vn, void *vm,
238
+ void *vfpst, uint32_t desc)
239
+{
240
+ uintptr_t opr_sz = simd_oprsz(desc);
241
+ float16 *d = vd;
242
+ float16 *n = vn;
243
+ float16 *m = vm;
244
+ float_status *fpst = vfpst;
245
+ intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1);
246
+ uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1);
247
+ uint32_t neg_real = flip ^ neg_imag;
248
+ uintptr_t i;
249
+ float16 e1 = m[H2(flip)];
250
+ float16 e3 = m[H2(1 - flip)];
251
+
252
+ /* Shift boolean to the sign bit so we can xor to negate. */
253
+ neg_real <<= 15;
254
+ neg_imag <<= 15;
255
+ e1 ^= neg_real;
256
+ e3 ^= neg_imag;
257
+
258
+ for (i = 0; i < opr_sz / 2; i += 2) {
259
+ float16 e2 = n[H2(i + flip)];
260
+ float16 e4 = e2;
261
+
262
+ d[H2(i)] = float16_muladd(e2, e1, d[H2(i)], 0, fpst);
263
+ d[H2(i + 1)] = float16_muladd(e4, e3, d[H2(i + 1)], 0, fpst);
264
+ }
265
+ clear_tail(d, opr_sz, simd_maxsz(desc));
266
+}
267
+
268
+void HELPER(gvec_fcmlas)(void *vd, void *vn, void *vm,
269
+ void *vfpst, uint32_t desc)
270
+{
271
+ uintptr_t opr_sz = simd_oprsz(desc);
272
+ float32 *d = vd;
273
+ float32 *n = vn;
274
+ float32 *m = vm;
275
+ float_status *fpst = vfpst;
276
+ intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1);
277
+ uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1);
278
+ uint32_t neg_real = flip ^ neg_imag;
279
+ uintptr_t i;
280
+
281
+ /* Shift boolean to the sign bit so we can xor to negate. */
282
+ neg_real <<= 31;
283
+ neg_imag <<= 31;
284
+
285
+ for (i = 0; i < opr_sz / 4; i += 2) {
286
+ float32 e2 = n[H4(i + flip)];
287
+ float32 e1 = m[H4(i + flip)] ^ neg_real;
288
+ float32 e4 = e2;
289
+ float32 e3 = m[H4(i + 1 - flip)] ^ neg_imag;
290
+
291
+ d[H4(i)] = float32_muladd(e2, e1, d[H4(i)], 0, fpst);
292
+ d[H4(i + 1)] = float32_muladd(e4, e3, d[H4(i + 1)], 0, fpst);
293
+ }
294
+ clear_tail(d, opr_sz, simd_maxsz(desc));
295
+}
296
+
297
+void HELPER(gvec_fcmlas_idx)(void *vd, void *vn, void *vm,
298
+ void *vfpst, uint32_t desc)
299
+{
300
+ uintptr_t opr_sz = simd_oprsz(desc);
301
+ float32 *d = vd;
302
+ float32 *n = vn;
303
+ float32 *m = vm;
304
+ float_status *fpst = vfpst;
305
+ intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1);
306
+ uint32_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1);
307
+ uint32_t neg_real = flip ^ neg_imag;
308
+ uintptr_t i;
309
+ float32 e1 = m[H4(flip)];
310
+ float32 e3 = m[H4(1 - flip)];
311
+
312
+ /* Shift boolean to the sign bit so we can xor to negate. */
313
+ neg_real <<= 31;
314
+ neg_imag <<= 31;
315
+ e1 ^= neg_real;
316
+ e3 ^= neg_imag;
317
+
318
+ for (i = 0; i < opr_sz / 4; i += 2) {
319
+ float32 e2 = n[H4(i + flip)];
320
+ float32 e4 = e2;
321
+
322
+ d[H4(i)] = float32_muladd(e2, e1, d[H4(i)], 0, fpst);
323
+ d[H4(i + 1)] = float32_muladd(e4, e3, d[H4(i + 1)], 0, fpst);
324
+ }
325
+ clear_tail(d, opr_sz, simd_maxsz(desc));
326
+}
327
+
328
+void HELPER(gvec_fcmlad)(void *vd, void *vn, void *vm,
329
+ void *vfpst, uint32_t desc)
330
+{
331
+ uintptr_t opr_sz = simd_oprsz(desc);
332
+ float64 *d = vd;
333
+ float64 *n = vn;
334
+ float64 *m = vm;
335
+ float_status *fpst = vfpst;
336
+ intptr_t flip = extract32(desc, SIMD_DATA_SHIFT, 1);
337
+ uint64_t neg_imag = extract32(desc, SIMD_DATA_SHIFT + 1, 1);
338
+ uint64_t neg_real = flip ^ neg_imag;
339
+ uintptr_t i;
340
+
341
+ /* Shift boolean to the sign bit so we can xor to negate. */
342
+ neg_real <<= 63;
343
+ neg_imag <<= 63;
344
+
345
+ for (i = 0; i < opr_sz / 8; i += 2) {
346
+ float64 e2 = n[i + flip];
347
+ float64 e1 = m[i + flip] ^ neg_real;
348
+ float64 e4 = e2;
349
+ float64 e3 = m[i + 1 - flip] ^ neg_imag;
350
+
351
+ d[i] = float64_muladd(e2, e1, d[i], 0, fpst);
352
+ d[i + 1] = float64_muladd(e4, e3, d[i + 1], 0, fpst);
353
+ }
354
+ clear_tail(d, opr_sz, simd_maxsz(desc));
355
+}
230
--
356
--
231
2.16.2
357
2.16.2
232
358
233
359
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
We go with the localised helper.
3
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
4
4
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
5
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Message-id: 20180228193125.20577-14-richard.henderson@linaro.org
6
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
7
Message-id: 20180227143852.11175-25-alex.bennee@linaro.org
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
9
---
7
---
10
target/arm/helper-a64.h | 1 +
8
target/arm/translate.c | 68 ++++++++++++++++++++++++++++++++++++++++++++++++++
11
target/arm/helper-a64.c | 29 +++++++++++++++++++++++++++++
9
1 file changed, 68 insertions(+)
12
target/arm/translate-a64.c | 4 ++++
13
3 files changed, 34 insertions(+)
14
10
15
diff --git a/target/arm/helper-a64.h b/target/arm/helper-a64.h
11
diff --git a/target/arm/translate.c b/target/arm/translate.c
16
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
17
--- a/target/arm/helper-a64.h
13
--- a/target/arm/translate.c
18
+++ b/target/arm/helper-a64.h
14
+++ b/target/arm/translate.c
19
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_FLAGS_1(neon_addlp_s16, TCG_CALL_NO_RWG_SE, i64, i64)
15
@@ -XXX,XX +XXX,XX @@ static int disas_neon_data_insn(DisasContext *s, uint32_t insn)
20
DEF_HELPER_FLAGS_1(neon_addlp_u16, TCG_CALL_NO_RWG_SE, i64, i64)
16
return 0;
21
DEF_HELPER_FLAGS_2(frecpx_f64, TCG_CALL_NO_RWG, f64, f64, ptr)
22
DEF_HELPER_FLAGS_2(frecpx_f32, TCG_CALL_NO_RWG, f32, f32, ptr)
23
+DEF_HELPER_FLAGS_2(frecpx_f16, TCG_CALL_NO_RWG, f16, f16, ptr)
24
DEF_HELPER_FLAGS_2(fcvtx_f64_to_f32, TCG_CALL_NO_RWG, f32, f64, env)
25
DEF_HELPER_FLAGS_3(crc32_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32)
26
DEF_HELPER_FLAGS_3(crc32c_64, TCG_CALL_NO_RWG_SE, i64, i64, i64, i32)
27
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
28
index XXXXXXX..XXXXXXX 100644
29
--- a/target/arm/helper-a64.c
30
+++ b/target/arm/helper-a64.c
31
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(neon_addlp_u16)(uint64_t a)
32
}
17
}
33
18
34
/* Floating-point reciprocal exponent - see FPRecpX in ARM ARM */
19
+/* Advanced SIMD three registers of the same length extension.
35
+float16 HELPER(frecpx_f16)(float16 a, void *fpstp)
20
+ * 31 25 23 22 20 16 12 11 10 9 8 3 0
21
+ * +---------------+-----+---+-----+----+----+---+----+---+----+---------+----+
22
+ * | 1 1 1 1 1 1 0 | op1 | D | op2 | Vn | Vd | 1 | o3 | 0 | o4 | N Q M U | Vm |
23
+ * +---------------+-----+---+-----+----+----+---+----+---+----+---------+----+
24
+ */
25
+static int disas_neon_insn_3same_ext(DisasContext *s, uint32_t insn)
36
+{
26
+{
37
+ float_status *fpst = fpstp;
27
+ gen_helper_gvec_3_ptr *fn_gvec_ptr;
38
+ uint16_t val16, sbit;
28
+ int rd, rn, rm, rot, size, opr_sz;
39
+ int16_t exp;
29
+ TCGv_ptr fpst;
30
+ bool q;
40
+
31
+
41
+ if (float16_is_any_nan(a)) {
32
+ q = extract32(insn, 6, 1);
42
+ float16 nan = a;
33
+ VFP_DREG_D(rd, insn);
43
+ if (float16_is_signaling_nan(a, fpst)) {
34
+ VFP_DREG_N(rn, insn);
44
+ float_raise(float_flag_invalid, fpst);
35
+ VFP_DREG_M(rm, insn);
45
+ nan = float16_maybe_silence_nan(a, fpst);
36
+ if ((rd | rn | rm) & q) {
46
+ }
37
+ return 1;
47
+ if (fpst->default_nan_mode) {
48
+ nan = float16_default_nan(fpst);
49
+ }
50
+ return nan;
51
+ }
38
+ }
52
+
39
+
53
+ val16 = float16_val(a);
40
+ if ((insn & 0xfe200f10) == 0xfc200800) {
54
+ sbit = 0x8000 & val16;
41
+ /* VCMLA -- 1111 110R R.1S .... .... 1000 ...0 .... */
55
+ exp = extract32(val16, 10, 5);
42
+ size = extract32(insn, 20, 1);
43
+ rot = extract32(insn, 23, 2);
44
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA)
45
+ || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) {
46
+ return 1;
47
+ }
48
+ fn_gvec_ptr = size ? gen_helper_gvec_fcmlas : gen_helper_gvec_fcmlah;
49
+ } else if ((insn & 0xfea00f10) == 0xfc800800) {
50
+ /* VCADD -- 1111 110R 1.0S .... .... 1000 ...0 .... */
51
+ size = extract32(insn, 20, 1);
52
+ rot = extract32(insn, 24, 1);
53
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA)
54
+ || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) {
55
+ return 1;
56
+ }
57
+ fn_gvec_ptr = size ? gen_helper_gvec_fcadds : gen_helper_gvec_fcaddh;
58
+ } else {
59
+ return 1;
60
+ }
56
+
61
+
57
+ if (exp == 0) {
62
+ if (s->fp_excp_el) {
58
+ return make_float16(deposit32(sbit, 10, 5, 0x1e));
63
+ gen_exception_insn(s, 4, EXCP_UDEF,
59
+ } else {
64
+ syn_fp_access_trap(1, 0xe, false), s->fp_excp_el);
60
+ return make_float16(deposit32(sbit, 10, 5, ~exp));
65
+ return 0;
61
+ }
66
+ }
67
+ if (!s->vfp_enabled) {
68
+ return 1;
69
+ }
70
+
71
+ opr_sz = (1 + q) * 8;
72
+ fpst = get_fpstatus_ptr(1);
73
+ tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd),
74
+ vfp_reg_offset(1, rn),
75
+ vfp_reg_offset(1, rm), fpst,
76
+ opr_sz, opr_sz, rot, fn_gvec_ptr);
77
+ tcg_temp_free_ptr(fpst);
78
+ return 0;
62
+}
79
+}
63
+
80
+
64
float32 HELPER(frecpx_f32)(float32 a, void *fpstp)
81
static int disas_coproc_insn(DisasContext *s, uint32_t insn)
65
{
82
{
66
float_status *fpst = fpstp;
83
int cpnum, is64, crn, crm, opc1, opc2, isread, rt, rt2;
67
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
84
@@ -XXX,XX +XXX,XX @@ static void disas_arm_insn(DisasContext *s, unsigned int insn)
68
index XXXXXXX..XXXXXXX 100644
85
}
69
--- a/target/arm/translate-a64.c
86
}
70
+++ b/target/arm/translate-a64.c
87
}
71
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
88
+ } else if ((insn & 0x0e000a00) == 0x0c000800
72
handle_2misc_fcmp_zero(s, fpop, is_scalar, 0, is_q, MO_16, rn, rd);
89
+ && arm_dc_feature(s, ARM_FEATURE_V8)) {
73
return;
90
+ if (disas_neon_insn_3same_ext(s, insn)) {
74
case 0x3d: /* FRECPE */
91
+ goto illegal_op;
75
+ case 0x3f: /* FRECPX */
92
+ }
76
break;
93
+ return;
77
case 0x18: /* FRINTN */
94
} else if ((insn & 0x0fe00000) == 0x0c400000) {
78
need_rmode = true;
95
/* Coprocessor double register transfer. */
79
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
96
ARCH(5TE);
80
case 0x3d: /* FRECPE */
81
gen_helper_recpe_f16(tcg_res, tcg_op, tcg_fpstatus);
82
break;
83
+ case 0x3f: /* FRECPX */
84
+ gen_helper_frecpx_f16(tcg_res, tcg_op, tcg_fpstatus);
85
+ break;
86
case 0x5a: /* FCVTNU */
87
case 0x5b: /* FCVTMU */
88
case 0x5c: /* FCVTAU */
89
--
97
--
90
2.16.2
98
2.16.2
91
99
92
100
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This actually covers two different sections of the encoding table:
3
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
4
4
Message-id: 20180228193125.20577-15-richard.henderson@linaro.org
5
Advanced SIMD scalar two-register miscellaneous FP16
5
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
6
Advanced SIMD two-register miscellaneous (FP16)
7
8
The difference between the two is covered by a combination of Q (bit
9
30) and S (bit 28). Notably the FRINTx instructions are only
10
available in the vector form.
11
12
This is just the decode skeleton which will be filled out by later
13
patches.
14
15
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
16
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
17
Message-id: 20180227143852.11175-17-alex.bennee@linaro.org
18
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
6
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
19
---
7
---
20
target/arm/translate-a64.c | 40 ++++++++++++++++++++++++++++++++++++++++
8
target/arm/translate.c | 61 ++++++++++++++++++++++++++++++++++++++++++++++++++
21
1 file changed, 40 insertions(+)
9
1 file changed, 61 insertions(+)
22
10
23
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
11
diff --git a/target/arm/translate.c b/target/arm/translate.c
24
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
25
--- a/target/arm/translate-a64.c
13
--- a/target/arm/translate.c
26
+++ b/target/arm/translate-a64.c
14
+++ b/target/arm/translate.c
27
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn)
15
@@ -XXX,XX +XXX,XX @@ static int disas_neon_insn_3same_ext(DisasContext *s, uint32_t insn)
28
}
16
return 0;
29
}
17
}
30
18
31
+/* AdvSIMD [scalar] two register miscellaneous (FP16)
19
+/* Advanced SIMD two registers and a scalar extension.
20
+ * 31 24 23 22 20 16 12 11 10 9 8 3 0
21
+ * +-----------------+----+---+----+----+----+---+----+---+----+---------+----+
22
+ * | 1 1 1 1 1 1 1 0 | o1 | D | o2 | Vn | Vd | 1 | o3 | 0 | o4 | N Q M U | Vm |
23
+ * +-----------------+----+---+----+----+----+---+----+---+----+---------+----+
32
+ *
24
+ *
33
+ * 31 30 29 28 27 24 23 22 21 17 16 12 11 10 9 5 4 0
34
+ * +---+---+---+---+---------+---+-------------+--------+-----+------+------+
35
+ * | 0 | Q | U | S | 1 1 1 0 | a | 1 1 1 1 0 0 | opcode | 1 0 | Rn | Rd |
36
+ * +---+---+---+---+---------+---+-------------+--------+-----+------+------+
37
+ * mask: 1000 1111 0111 1110 0000 1100 0000 0000 0x8f7e 0c00
38
+ * val: 0000 1110 0111 1000 0000 1000 0000 0000 0x0e78 0800
39
+ *
40
+ * This actually covers two groups where scalar access is governed by
41
+ * bit 28. A bunch of the instructions (float to integral) only exist
42
+ * in the vector form and are un-allocated for the scalar decode. Also
43
+ * in the scalar decode Q is always 1.
44
+ */
25
+ */
45
+static void disas_simd_two_reg_misc_fp16(DisasContext *s, uint32_t insn)
26
+
27
+static int disas_neon_insn_2reg_scalar_ext(DisasContext *s, uint32_t insn)
46
+{
28
+{
47
+ int fpop, opcode, a;
29
+ int rd, rn, rm, rot, size, opr_sz;
30
+ TCGv_ptr fpst;
31
+ bool q;
48
+
32
+
49
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FP16)) {
33
+ q = extract32(insn, 6, 1);
50
+ unallocated_encoding(s);
34
+ VFP_DREG_D(rd, insn);
51
+ return;
35
+ VFP_DREG_N(rn, insn);
36
+ VFP_DREG_M(rm, insn);
37
+ if ((rd | rn) & q) {
38
+ return 1;
52
+ }
39
+ }
53
+
40
+
54
+ if (!fp_access_check(s)) {
41
+ if ((insn & 0xff000f10) == 0xfe000800) {
55
+ return;
42
+ /* VCMLA (indexed) -- 1111 1110 S.RR .... .... 1000 ...0 .... */
43
+ rot = extract32(insn, 20, 2);
44
+ size = extract32(insn, 23, 1);
45
+ if (!arm_dc_feature(s, ARM_FEATURE_V8_FCMA)
46
+ || (!size && !arm_dc_feature(s, ARM_FEATURE_V8_FP16))) {
47
+ return 1;
48
+ }
49
+ } else {
50
+ return 1;
56
+ }
51
+ }
57
+
52
+
58
+ opcode = extract32(insn, 12, 4);
53
+ if (s->fp_excp_el) {
59
+ a = extract32(insn, 23, 1);
54
+ gen_exception_insn(s, 4, EXCP_UDEF,
60
+ fpop = deposit32(opcode, 5, 1, a);
55
+ syn_fp_access_trap(1, 0xe, false), s->fp_excp_el);
61
+
56
+ return 0;
62
+ switch (fpop) {
57
+ }
63
+ default:
58
+ if (!s->vfp_enabled) {
64
+ fprintf(stderr, "%s: insn %#04x fpop %#2x\n", __func__, insn, fpop);
59
+ return 1;
65
+ g_assert_not_reached();
66
+ }
60
+ }
67
+
61
+
62
+ opr_sz = (1 + q) * 8;
63
+ fpst = get_fpstatus_ptr(1);
64
+ tcg_gen_gvec_3_ptr(vfp_reg_offset(1, rd),
65
+ vfp_reg_offset(1, rn),
66
+ vfp_reg_offset(1, rm), fpst,
67
+ opr_sz, opr_sz, rot,
68
+ size ? gen_helper_gvec_fcmlas_idx
69
+ : gen_helper_gvec_fcmlah_idx);
70
+ tcg_temp_free_ptr(fpst);
71
+ return 0;
68
+}
72
+}
69
+
73
+
70
/* AdvSIMD scalar x indexed element
74
static int disas_coproc_insn(DisasContext *s, uint32_t insn)
71
* 31 30 29 28 24 23 22 21 20 19 16 15 12 11 10 9 5 4 0
75
{
72
* +-----+---+-----------+------+---+---+------+-----+---+---+------+------+
76
int cpnum, is64, crn, crm, opc1, opc2, isread, rt, rt2;
73
@@ -XXX,XX +XXX,XX @@ static const AArch64DecodeTable data_proc_simd[] = {
77
@@ -XXX,XX +XXX,XX @@ static void disas_arm_insn(DisasContext *s, unsigned int insn)
74
{ 0xce800000, 0xffe00000, disas_crypto_xar },
78
goto illegal_op;
75
{ 0xce408000, 0xffe0c000, disas_crypto_three_reg_imm2 },
79
}
76
{ 0x0e400400, 0x9f60c400, disas_simd_three_reg_same_fp16 },
80
return;
77
+ { 0x0e780800, 0x8f7e0c00, disas_simd_two_reg_misc_fp16 },
81
+ } else if ((insn & 0x0f000a00) == 0x0e000800
78
{ 0x00000000, 0x00000000, NULL }
82
+ && arm_dc_feature(s, ARM_FEATURE_V8)) {
79
};
83
+ if (disas_neon_insn_2reg_scalar_ext(s, insn)) {
80
84
+ goto illegal_op;
85
+ }
86
+ return;
87
} else if ((insn & 0x0fe00000) == 0x0c400000) {
88
/* Coprocessor double register transfer. */
89
ARCH(5TE);
81
--
90
--
82
2.16.2
91
2.16.2
83
92
84
93
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
As the rounding mode is now split between FP16 and the rest of
3
Happily, the bits are in the same places compared to a32.
4
floating point we need to be explicit when tweaking it. Instead of
5
passing the CPU env we now pass the appropriate fpst pointer directly.
6
4
7
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
Message-id: 20180228193125.20577-16-richard.henderson@linaro.org
9
Message-id: 20180227143852.11175-6-alex.bennee@linaro.org
7
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
9
---
12
target/arm/helper.h | 2 +-
10
target/arm/translate.c | 14 +++++++++++++-
13
target/arm/helper.c | 4 ++--
11
1 file changed, 13 insertions(+), 1 deletion(-)
14
target/arm/translate-a64.c | 26 +++++++++++++-------------
15
target/arm/translate.c | 12 ++++++------
16
4 files changed, 22 insertions(+), 22 deletions(-)
17
12
18
diff --git a/target/arm/helper.h b/target/arm/helper.h
19
index XXXXXXX..XXXXXXX 100644
20
--- a/target/arm/helper.h
21
+++ b/target/arm/helper.h
22
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_3(vfp_uhtod, f64, i64, i32, ptr)
23
DEF_HELPER_3(vfp_ultod, f64, i64, i32, ptr)
24
DEF_HELPER_3(vfp_uqtod, f64, i64, i32, ptr)
25
26
-DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, env)
27
+DEF_HELPER_FLAGS_2(set_rmode, TCG_CALL_NO_RWG, i32, i32, ptr)
28
DEF_HELPER_FLAGS_2(set_neon_rmode, TCG_CALL_NO_RWG, i32, i32, env)
29
30
DEF_HELPER_2(vfp_fcvt_f16_to_f32, f32, i32, env)
31
diff --git a/target/arm/helper.c b/target/arm/helper.c
32
index XXXXXXX..XXXXXXX 100644
33
--- a/target/arm/helper.c
34
+++ b/target/arm/helper.c
35
@@ -XXX,XX +XXX,XX @@ VFP_CONV_FIX_A64(uq, s, 32, 64, uint64)
36
/* Set the current fp rounding mode and return the old one.
37
* The argument is a softfloat float_round_ value.
38
*/
39
-uint32_t HELPER(set_rmode)(uint32_t rmode, CPUARMState *env)
40
+uint32_t HELPER(set_rmode)(uint32_t rmode, void *fpstp)
41
{
42
- float_status *fp_status = &env->vfp.fp_status;
43
+ float_status *fp_status = fpstp;
44
45
uint32_t prev_rmode = get_float_rounding_mode(fp_status);
46
set_float_rounding_mode(rmode, fp_status);
47
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
48
index XXXXXXX..XXXXXXX 100644
49
--- a/target/arm/translate-a64.c
50
+++ b/target/arm/translate-a64.c
51
@@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_single(DisasContext *s, int opcode, int rd, int rn)
52
{
53
TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7));
54
55
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
56
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
57
gen_helper_rints(tcg_res, tcg_op, fpst);
58
59
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
60
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
61
tcg_temp_free_i32(tcg_rmode);
62
break;
63
}
64
@@ -XXX,XX +XXX,XX @@ static void handle_fp_1src_double(DisasContext *s, int opcode, int rd, int rn)
65
{
66
TCGv_i32 tcg_rmode = tcg_const_i32(arm_rmode_to_sf(opcode & 7));
67
68
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
69
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
70
gen_helper_rintd(tcg_res, tcg_op, fpst);
71
72
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
73
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
74
tcg_temp_free_i32(tcg_rmode);
75
break;
76
}
77
@@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode,
78
79
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode));
80
81
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
82
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
83
84
if (is_double) {
85
TCGv_i64 tcg_double = read_fp_dreg(s, rn);
86
@@ -XXX,XX +XXX,XX @@ static void handle_fpfpcvt(DisasContext *s, int rd, int rn, int opcode,
87
tcg_temp_free_i32(tcg_single);
88
}
89
90
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
91
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
92
tcg_temp_free_i32(tcg_rmode);
93
94
if (!sf) {
95
@@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
96
assert(!(is_scalar && is_q));
97
98
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(FPROUNDING_ZERO));
99
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
100
tcg_fpstatus = get_fpstatus_ptr(false);
101
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
102
tcg_shift = tcg_const_i32(fracbits);
103
104
if (is_double) {
105
@@ -XXX,XX +XXX,XX @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
106
107
tcg_temp_free_ptr(tcg_fpstatus);
108
tcg_temp_free_i32(tcg_shift);
109
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
110
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
111
tcg_temp_free_i32(tcg_rmode);
112
}
113
114
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn)
115
116
if (is_fcvt) {
117
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode));
118
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
119
tcg_fpstatus = get_fpstatus_ptr(false);
120
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
121
} else {
122
tcg_rmode = NULL;
123
tcg_fpstatus = NULL;
124
@@ -XXX,XX +XXX,XX @@ static void disas_simd_scalar_two_reg_misc(DisasContext *s, uint32_t insn)
125
}
126
127
if (is_fcvt) {
128
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
129
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
130
tcg_temp_free_i32(tcg_rmode);
131
tcg_temp_free_ptr(tcg_fpstatus);
132
}
133
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn)
134
return;
135
}
136
137
- if (need_fpstatus) {
138
+ if (need_fpstatus || need_rmode) {
139
tcg_fpstatus = get_fpstatus_ptr(false);
140
} else {
141
tcg_fpstatus = NULL;
142
}
143
if (need_rmode) {
144
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rmode));
145
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
146
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
147
} else {
148
tcg_rmode = NULL;
149
}
150
@@ -XXX,XX +XXX,XX @@ static void disas_simd_two_reg_misc(DisasContext *s, uint32_t insn)
151
clear_vec_high(s, is_q, rd);
152
153
if (need_rmode) {
154
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
155
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, tcg_fpstatus);
156
tcg_temp_free_i32(tcg_rmode);
157
}
158
if (need_fpstatus) {
159
diff --git a/target/arm/translate.c b/target/arm/translate.c
13
diff --git a/target/arm/translate.c b/target/arm/translate.c
160
index XXXXXXX..XXXXXXX 100644
14
index XXXXXXX..XXXXXXX 100644
161
--- a/target/arm/translate.c
15
--- a/target/arm/translate.c
162
+++ b/target/arm/translate.c
16
+++ b/target/arm/translate.c
163
@@ -XXX,XX +XXX,XX @@ static int handle_vrint(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp,
17
@@ -XXX,XX +XXX,XX @@ static void disas_thumb2_insn(DisasContext *s, uint32_t insn)
164
TCGv_i32 tcg_rmode;
18
default_exception_el(s));
165
19
break;
166
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding));
20
}
167
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
21
- if (((insn >> 24) & 3) == 3) {
168
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
22
+ if ((insn & 0xfe000a00) == 0xfc000800
169
23
+ && arm_dc_feature(s, ARM_FEATURE_V8)) {
170
if (dp) {
24
+ /* The Thumb2 and ARM encodings are identical. */
171
TCGv_i64 tcg_op;
25
+ if (disas_neon_insn_3same_ext(s, insn)) {
172
@@ -XXX,XX +XXX,XX @@ static int handle_vrint(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp,
26
+ goto illegal_op;
173
tcg_temp_free_i32(tcg_res);
27
+ }
174
}
28
+ } else if ((insn & 0xff000a00) == 0xfe000800
175
29
+ && arm_dc_feature(s, ARM_FEATURE_V8)) {
176
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
30
+ /* The Thumb2 and ARM encodings are identical. */
177
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
31
+ if (disas_neon_insn_2reg_scalar_ext(s, insn)) {
178
tcg_temp_free_i32(tcg_rmode);
32
+ goto illegal_op;
179
33
+ }
180
tcg_temp_free_ptr(fpst);
34
+ } else if (((insn >> 24) & 3) == 3) {
181
@@ -XXX,XX +XXX,XX @@ static int handle_vcvt(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp,
35
/* Translate into the equivalent ARM encoding. */
182
tcg_shift = tcg_const_i32(0);
36
insn = (insn & 0xe2ffffff) | ((insn & (1 << 28)) >> 4) | (1 << 28);
183
37
if (disas_neon_data_insn(s, insn)) {
184
tcg_rmode = tcg_const_i32(arm_rmode_to_sf(rounding));
185
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
186
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
187
188
if (dp) {
189
TCGv_i64 tcg_double, tcg_res;
190
@@ -XXX,XX +XXX,XX @@ static int handle_vcvt(uint32_t insn, uint32_t rd, uint32_t rm, uint32_t dp,
191
tcg_temp_free_i32(tcg_single);
192
}
193
194
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
195
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
196
tcg_temp_free_i32(tcg_rmode);
197
198
tcg_temp_free_i32(tcg_shift);
199
@@ -XXX,XX +XXX,XX @@ static int disas_vfp_insn(DisasContext *s, uint32_t insn)
200
TCGv_ptr fpst = get_fpstatus_ptr(0);
201
TCGv_i32 tcg_rmode;
202
tcg_rmode = tcg_const_i32(float_round_to_zero);
203
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
204
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
205
if (dp) {
206
gen_helper_rintd(cpu_F0d, cpu_F0d, fpst);
207
} else {
208
gen_helper_rints(cpu_F0s, cpu_F0s, fpst);
209
}
210
- gen_helper_set_rmode(tcg_rmode, tcg_rmode, cpu_env);
211
+ gen_helper_set_rmode(tcg_rmode, tcg_rmode, fpst);
212
tcg_temp_free_i32(tcg_rmode);
213
tcg_temp_free_ptr(fpst);
214
break;
215
--
38
--
216
2.16.2
39
2.16.2
217
40
218
41
diff view generated by jsdifflib
1
From: Alex Bennée <alex.bennee@linaro.org>
1
From: Richard Henderson <richard.henderson@linaro.org>
2
2
3
This allows us to explicitly pass float16 to helpers rather than
3
Enable it for the "any" CPU used by *-linux-user.
4
assuming uint32_t and dealing with the result. Of course they will be
5
passed in i32 sized registers by default.
6
4
7
Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
5
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
6
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
9
Message-id: 20180227143852.11175-2-alex.bennee@linaro.org
7
Message-id: 20180228193125.20577-17-richard.henderson@linaro.org
10
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
8
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
11
---
9
---
12
include/exec/helper-head.h | 3 +++
10
target/arm/cpu.c | 1 +
13
1 file changed, 3 insertions(+)
11
target/arm/cpu64.c | 1 +
12
2 files changed, 2 insertions(+)
14
13
15
diff --git a/include/exec/helper-head.h b/include/exec/helper-head.h
14
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
16
index XXXXXXX..XXXXXXX 100644
15
index XXXXXXX..XXXXXXX 100644
17
--- a/include/exec/helper-head.h
16
--- a/target/arm/cpu.c
18
+++ b/include/exec/helper-head.h
17
+++ b/target/arm/cpu.c
19
@@ -XXX,XX +XXX,XX @@
18
@@ -XXX,XX +XXX,XX @@ static void arm_any_initfn(Object *obj)
20
#define dh_alias_int i32
19
set_feature(&cpu->env, ARM_FEATURE_V8_PMULL);
21
#define dh_alias_i64 i64
20
set_feature(&cpu->env, ARM_FEATURE_CRC);
22
#define dh_alias_s64 i64
21
set_feature(&cpu->env, ARM_FEATURE_V8_RDM);
23
+#define dh_alias_f16 i32
22
+ set_feature(&cpu->env, ARM_FEATURE_V8_FCMA);
24
#define dh_alias_f32 i32
23
cpu->midr = 0xffffffff;
25
#define dh_alias_f64 i64
24
}
26
#define dh_alias_ptr ptr
25
#endif
27
@@ -XXX,XX +XXX,XX @@
26
diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
28
#define dh_ctype_int int
27
index XXXXXXX..XXXXXXX 100644
29
#define dh_ctype_i64 uint64_t
28
--- a/target/arm/cpu64.c
30
#define dh_ctype_s64 int64_t
29
+++ b/target/arm/cpu64.c
31
+#define dh_ctype_f16 float16
30
@@ -XXX,XX +XXX,XX @@ static void aarch64_any_initfn(Object *obj)
32
#define dh_ctype_f32 float32
31
set_feature(&cpu->env, ARM_FEATURE_CRC);
33
#define dh_ctype_f64 float64
32
set_feature(&cpu->env, ARM_FEATURE_V8_RDM);
34
#define dh_ctype_ptr void *
33
set_feature(&cpu->env, ARM_FEATURE_V8_FP16);
35
@@ -XXX,XX +XXX,XX @@
34
+ set_feature(&cpu->env, ARM_FEATURE_V8_FCMA);
36
#define dh_is_signed_s32 1
35
cpu->ctr = 0x80038003; /* 32 byte I and D cacheline size, VIPT icache */
37
#define dh_is_signed_i64 0
36
cpu->dcz_blocksize = 7; /* 512 bytes */
38
#define dh_is_signed_s64 1
37
}
39
+#define dh_is_signed_f16 0
40
#define dh_is_signed_f32 0
41
#define dh_is_signed_f64 0
42
#define dh_is_signed_tl 0
43
--
38
--
44
2.16.2
39
2.16.2
45
40
46
41
diff view generated by jsdifflib